From 5a644cad50457d22cdde183020abdfb5d00fd800 Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Wed, 22 May 2024 09:34:59 +0900
Subject: [PATCH 01/36] =?UTF-8?q?onnxruntime-rs=E3=81=8B=E3=82=89ort?=
 =?UTF-8?q?=E3=81=AB=E4=B9=97=E3=82=8A=E6=8F=9B=E3=81=88=E3=82=8B=20(#725)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* onnxruntime-rsからortに乗り換える

* `--features onnxruntime/disable-sys-build-script`を消す

* ortをアップデート

* ortをアップデート

* `onnxruntimeVersion`をアップデート

* libonnxruntimeのコピー処理を更新

* ortをアップデート

* libonnxruntimeのコピー処理を更新

* ortをアップデート

* ortをアップデート

* `ort::ExecutionProvider::is_available`を使う

* `todo!`を消す

* ortをアップデート

* ortにあったAPIを使う

* ortをアップデート

* `$ORT_OUT_DIR`を削除

* ortをアップデート

* ログのフィルタを更新

* ortをアップデート

* tracingのレベルでortのログを抑える

* Minor refactor

* ortをアップデート

* Fix Cargo.lock

* Gradleのlibonnxruntimeのバージョンを更新

* ort v2.0.0-rc.1ベースに切り替える

* Gradleのlibonnxruntimeのバージョンを更新

* `with_execution_provider` → `register`

* ort v2.0.0-rc.2ベースに切り替える

* Gradleのlibonnxruntimeのバージョンを更新

* voicevox-ortを更新

* VOICEVOX/ort#2 に追従する
---
 .cargo/config.toml                            |   4 -
 .github/workflows/build_and_deploy.yml        |  23 +-
 .github/workflows/test.yml                    |  14 +-
 Cargo.lock                                    | 123 +++++---
 Cargo.toml                                    |   6 +-
 crates/voicevox_core/Cargo.toml               |   5 +-
 crates/voicevox_core/src/infer.rs             |  16 +-
 .../src/infer/runtimes/onnxruntime.rs         | 284 ++++++++----------
 crates/voicevox_core/src/infer/session_set.rs |   7 +-
 crates/voicevox_core_c_api/Cargo.toml         |   1 +
 crates/voicevox_core_c_api/src/lib.rs         |   8 +-
 .../tests/e2e/assert_cdylib.rs                |   7 +-
 crates/voicevox_core_c_api/tests/e2e/main.rs  |  10 -
 crates/voicevox_core_java_api/Cargo.toml      |   1 +
 crates/voicevox_core_java_api/settings.gradle |   2 +-
 crates/voicevox_core_java_api/src/logger.rs   |  12 +-
 .../src/inference_domain.rs                   |  18 +-
 crates/voicevox_core_python_api/Cargo.toml    |   1 +
 18 files changed, 269 insertions(+), 273 deletions(-)

diff --git a/.cargo/config.toml b/.cargo/config.toml
index 64fcc6aea..f015cd17a 100644
--- a/.cargo/config.toml
+++ b/.cargo/config.toml
@@ -4,10 +4,6 @@ xtask = "run -p xtask --"
 [env]
 CARGO_WORKSPACE_DIR = { value = "", relative = true }
 
-# Windows環境でテストエラーになるのを防ぐために設定するworkaround
-# https://github.com/VOICEVOX/onnxruntime-rs/issues/3#issuecomment-1207381367
-ORT_OUT_DIR = { value = "target/debug/deps", relative = true }
-
 [target.aarch64-unknown-linux-gnu]
 linker = "aarch64-linux-gnu-gcc"
 
diff --git a/.github/workflows/build_and_deploy.yml b/.github/workflows/build_and_deploy.yml
index 83d895c77..01ddfc434 100644
--- a/.github/workflows/build_and_deploy.yml
+++ b/.github/workflows/build_and_deploy.yml
@@ -58,7 +58,6 @@ jobs:
               "target": "x86_64-pc-windows-msvc",
               "artifact_name": "windows-x64-cpu",
               "whl_local_version": "cpu",
-              "use_cuda": false,
               "can_skip_in_simple_test": true
             },
             {
@@ -67,16 +66,14 @@ jobs:
               "target": "x86_64-pc-windows-msvc",
               "artifact_name": "windows-x64-directml",
               "whl_local_version": "directml",
-              "use_cuda": false,
               "can_skip_in_simple_test": false
             },
             {
               "os": "windows-2019",
-              "features": "",
+              "features": "cuda",
               "target": "x86_64-pc-windows-msvc",
               "artifact_name": "windows-x64-cuda",
               "whl_local_version": "cuda",
-              "use_cuda": true,
               "can_skip_in_simple_test": true
             },
             {
@@ -85,7 +82,6 @@ jobs:
               "target": "i686-pc-windows-msvc",
               "artifact_name": "windows-x86-cpu",
               "whl_local_version": "cpu",
-              "use_cuda": false,
               "can_skip_in_simple_test": true
             },
             {
@@ -94,16 +90,14 @@ jobs:
               "target": "x86_64-unknown-linux-gnu",
               "artifact_name": "linux-x64-cpu",
               "whl_local_version": "cpu",
-              "use_cuda": false,
               "can_skip_in_simple_test": true
             },
             {
               "os": "ubuntu-20.04",
-              "features": "",
+              "features": "cuda",
               "target": "x86_64-unknown-linux-gnu",
               "artifact_name": "linux-x64-gpu",
               "whl_local_version": "cuda",
-              "use_cuda": true,
               "can_skip_in_simple_test": false
             },
             {
@@ -112,7 +106,6 @@ jobs:
               "target": "aarch64-unknown-linux-gnu",
               "artifact_name": "linux-arm64-cpu",
               "whl_local_version": "cpu",
-              "use_cuda": false,
               "can_skip_in_simple_test": true
             },
             {
@@ -120,7 +113,6 @@ jobs:
               "features": "",
               "target": "aarch64-linux-android",
               "artifact_name": "android-arm64-cpu",
-              "use_cuda": false,
               "can_skip_in_simple_test": true
             },
             {
@@ -128,7 +120,6 @@ jobs:
               "features": "",
               "target": "x86_64-linux-android",
               "artifact_name": "android-x86_64-cpu",
-              "use_cuda": false,
               "can_skip_in_simple_test": true
             },
             {
@@ -137,7 +128,6 @@ jobs:
               "target": "aarch64-apple-darwin",
               "artifact_name": "osx-arm64-cpu",
               "whl_local_version": "cpu",
-              "use_cuda": false,
               "can_skip_in_simple_test": false
             },
             {
@@ -146,7 +136,6 @@ jobs:
               "target": "x86_64-apple-darwin",
               "artifact_name": "osx-x64-cpu",
               "whl_local_version": "cpu",
-              "use_cuda": false,
               "can_skip_in_simple_test": true
             },
             {
@@ -154,7 +143,6 @@ jobs:
               "features": "",
               "target": "aarch64-apple-ios",
               "artifact_name": "ios-arm64-cpu",
-              "use_cuda": false,
               "can_skip_in_simple_test": true
             },
             {
@@ -162,7 +150,6 @@ jobs:
               "features": "",
               "target": "aarch64-apple-ios-sim",
               "artifact_name": "ios-arm64-cpu-sim",
-              "use_cuda": false,
               "can_skip_in_simple_test": true
             },
             {
@@ -170,7 +157,6 @@ jobs:
               "features": "",
               "target": "x86_64-apple-ios",
               "artifact_name": "ios-x64-cpu",
-              "use_cuda": false,
               "can_skip_in_simple_test": true
             }
           ]'
@@ -268,7 +254,6 @@ jobs:
           fi
         env:
           RUSTFLAGS: -C panic=abort
-          ORT_USE_CUDA: ${{ matrix.use_cuda }}
       - name: build voicevox_core_python_api
         if: matrix.whl_local_version
         id: build-voicevox-core-python-api
@@ -286,8 +271,6 @@ jobs:
             build > /dev/null 2>&1
           fi
           echo "whl=$(find ./target/wheels -type f)" >> "$GITHUB_OUTPUT"
-        env:
-          ORT_USE_CUDA: ${{ matrix.use_cuda }}
       - name: build voicevox_core_java_api
         if: contains(matrix.target, 'android')
         run: |
@@ -305,7 +288,7 @@ jobs:
           cp -v crates/voicevox_core_c_api/include/voicevox_core.h "artifact/${{ env.ASSET_NAME }}"
           cp -v target/${{ matrix.target }}/release/*voicevox_core.{dll,so,dylib} "artifact/${{ env.ASSET_NAME }}" || true
           cp -v target/${{ matrix.target }}/release/voicevox_core.dll.lib "artifact/${{ env.ASSET_NAME }}/voicevox_core.lib" || true
-          cp -v -n target/${{ matrix.target }}/release/build/onnxruntime-sys-*/out/onnxruntime_*/onnxruntime-*/lib/*.{dll,so.*,so,dylib} "artifact/${{ env.ASSET_NAME }}" || true
+          cp -v -n target/${{ matrix.target }}/release/{,lib}onnxruntime*.{dll,so.*,so,dylib} "artifact/${{ env.ASSET_NAME }}" || true
           # libonnxruntimeについてはバージョン付のshared libraryを使用するためバージョンがついてないものを削除する
           rm -f artifact/${{ env.ASSET_NAME }}/libonnxruntime.{so,dylib}
           cp -v README.md "artifact/${{ env.ASSET_NAME }}/README.txt"
diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml
index 0496eebdb..d0639d045 100644
--- a/.github/workflows/test.yml
+++ b/.github/workflows/test.yml
@@ -72,8 +72,8 @@ jobs:
         with:
           python-version: "3.8"
       - uses: Swatinem/rust-cache@v2
-      - run: cargo clippy -vv --all-features --features onnxruntime/disable-sys-build-script --tests -- -D clippy::all -D warnings --no-deps
-      - run: cargo clippy -vv --all-features --features onnxruntime/disable-sys-build-script -- -D clippy::all -D warnings --no-deps
+      - run: cargo clippy -vv --all-features --tests -- -D clippy::all -D warnings --no-deps
+      - run: cargo clippy -vv --all-features -- -D clippy::all -D warnings --no-deps
       - run: cargo fmt -- --check
 
   rust-unit-test:
@@ -199,8 +199,8 @@ jobs:
           mkdir -p example/cpp/unix/voicevox_core/
           cp -v crates/voicevox_core_c_api/include/voicevox_core.h example/cpp/unix/voicevox_core/
           cp -v target/debug/libvoicevox_core.{so,dylib} example/cpp/unix/voicevox_core/ || true
-          cp -v target/debug/build/onnxruntime-sys-*/out/onnxruntime_*/onnxruntime-*/lib/libonnxruntime.so.* example/cpp/unix/voicevox_core/ || true
-          cp -v target/debug/build/onnxruntime-sys-*/out/onnxruntime_*/onnxruntime-*/lib/libonnxruntime.*.dylib example/cpp/unix/voicevox_core/ || true
+          cp -v target/debug/libonnxruntime.so.* example/cpp/unix/voicevox_core/ || true
+          cp -v target/debug/libonnxruntime.*.dylib example/cpp/unix/voicevox_core/ || true
 
       - if: startsWith(matrix.os, 'mac')
         uses: jwlawson/actions-setup-cmake@v1.13
@@ -281,9 +281,9 @@ jobs:
       - run: poetry run maturin develop --locked
       - name: 必要なDLLをコピーしてpytestを実行
         run: |
-          cp -v ../../target/debug/build/onnxruntime-sys-*/out/onnxruntime_*/onnxruntime-*/lib/onnxruntime.dll . || true
-          cp -v ../../target/debug/build/onnxruntime-sys-*/out/onnxruntime_*/onnxruntime-*/lib/libonnxruntime.so.* . || true
-          cp -v ../../target/debug/build/onnxruntime-sys-*/out/onnxruntime_*/onnxruntime-*/lib/libonnxruntime.*.dylib . || true
+          cp -v ../../target/debug/onnxruntime.dll . || true
+          cp -v ../../target/debug/libonnxruntime.so.* . || true
+          cp -v ../../target/debug/libonnxruntime.*.dylib . || true
 
           poetry run pytest
       - name: Exampleを実行
diff --git a/Cargo.lock b/Cargo.lock
index 4015b7e36..0f9a78469 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -426,12 +426,6 @@ dependencies = [
  "winapi",
 ]
 
-[[package]]
-name = "chunked_transfer"
-version = "1.4.0"
-source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "fff857943da45f546682664a79488be82e69e43c1a7a2307679ab9afb3a66d2e"
-
 [[package]]
 name = "cipher"
 version = "0.3.0"
@@ -684,6 +678,12 @@ dependencies = [
  "cfg-if",
 ]
 
+[[package]]
+name = "crunchy"
+version = "0.2.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7a81dae078cea95a014a339291cec439d2f232ebe854a9d672b796c6afafa9b7"
+
 [[package]]
 name = "crypto-common"
 version = "0.1.6"
@@ -1278,6 +1278,16 @@ dependencies = [
  "tracing",
 ]
 
+[[package]]
+name = "half"
+version = "2.3.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "bc52e53916c08643f1b56ec082790d1e86a32e58dc5268f897f313fbae7b4872"
+dependencies = [
+ "cfg-if",
+ "crunchy",
+]
+
 [[package]]
 name = "hashbrown"
 version = "0.12.3"
@@ -1410,7 +1420,7 @@ checksum = "1788965e61b367cd03a62950836d5cd41560c3577d90e40e0819373194d1661c"
 dependencies = [
  "http",
  "hyper",
- "rustls",
+ "rustls 0.20.6",
  "tokio",
  "tokio-rustls",
 ]
@@ -1993,30 +2003,6 @@ version = "1.18.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "dd8b5dd2ae5ed71462c540258bedcb51965123ad7e7ccf4b9a8cafaa4a63576d"
 
-[[package]]
-name = "onnxruntime"
-version = "0.1.0"
-source = "git+https://github.com/VOICEVOX/onnxruntime-rs.git?rev=ebb9dcb9b26ee681889b52b6db3b4f642b04a250#ebb9dcb9b26ee681889b52b6db3b4f642b04a250"
-dependencies = [
- "lazy_static",
- "ndarray",
- "onnxruntime-sys",
- "thiserror",
- "tracing",
-]
-
-[[package]]
-name = "onnxruntime-sys"
-version = "0.0.25"
-source = "git+https://github.com/VOICEVOX/onnxruntime-rs.git?rev=ebb9dcb9b26ee681889b52b6db3b4f642b04a250#ebb9dcb9b26ee681889b52b6db3b4f642b04a250"
-dependencies = [
- "flate2",
- "once_cell",
- "tar",
- "ureq",
- "zip",
-]
-
 [[package]]
 name = "opaque-debug"
 version = "0.3.0"
@@ -2598,7 +2584,7 @@ dependencies = [
  "once_cell",
  "percent-encoding",
  "pin-project-lite",
- "rustls",
+ "rustls 0.20.6",
  "rustls-pemfile",
  "serde",
  "serde_json",
@@ -2611,7 +2597,7 @@ dependencies = [
  "wasm-bindgen",
  "wasm-bindgen-futures",
  "web-sys",
- "webpki-roots",
+ "webpki-roots 0.22.5",
  "winreg",
 ]
 
@@ -2728,6 +2714,18 @@ dependencies = [
  "webpki",
 ]
 
+[[package]]
+name = "rustls"
+version = "0.21.7"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "cd8d6c9f025a446bc4d18ad9632e69aec8f287aa84499ee335599fabd20c3fd8"
+dependencies = [
+ "log",
+ "ring",
+ "rustls-webpki",
+ "sct",
+]
+
 [[package]]
 name = "rustls-pemfile"
 version = "1.0.2"
@@ -2737,6 +2735,16 @@ dependencies = [
  "base64 0.21.0",
 ]
 
+[[package]]
+name = "rustls-webpki"
+version = "0.101.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "3c7d5dece342910d9ba34d259310cae3e0154b873b35408b787b59bce53d34fe"
+dependencies = [
+ "ring",
+ "untrusted",
+]
+
 [[package]]
 name = "rustversion"
 version = "1.0.11"
@@ -3262,7 +3270,7 @@ version = "0.23.4"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "c43ee83903113e03984cb9e5cebe6c04a5116269e900e3ddba8f068a62adda59"
 dependencies = [
- "rustls",
+ "rustls 0.20.6",
  "tokio",
  "webpki",
 ]
@@ -3480,19 +3488,17 @@ checksum = "a156c684c91ea7d62626509bce3cb4e1d9ed5c4d978f7b4352658f96a4c26b4a"
 
 [[package]]
 name = "ureq"
-version = "2.5.0"
+version = "2.8.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "b97acb4c28a254fd7a4aeec976c46a7fa404eac4d7c134b30c75144846d7cb8f"
+checksum = "f5ccd538d4a604753ebc2f17cd9946e89b77bf87f6a8e2309667c6f2e87855e3"
 dependencies = [
- "base64 0.13.0",
- "chunked_transfer",
- "flate2",
+ "base64 0.21.0",
  "log",
  "once_cell",
- "rustls",
+ "rustls 0.21.7",
+ "rustls-webpki",
  "url",
- "webpki",
- "webpki-roots",
+ "webpki-roots 0.25.4",
 ]
 
 [[package]]
@@ -3535,6 +3541,31 @@ version = "0.9.4"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "49874b5167b65d7193b8aba1567f5c7d93d001cafc34600cee003eda787e483f"
 
+[[package]]
+name = "voicevox-ort"
+version = "2.0.0-rc.2"
+source = "git+https://github.com/VOICEVOX/ort.git?rev=a2d6ae22327869e896bf4c16828734d09516d2d9#a2d6ae22327869e896bf4c16828734d09516d2d9"
+dependencies = [
+ "half",
+ "js-sys",
+ "ndarray",
+ "thiserror",
+ "tracing",
+ "voicevox-ort-sys",
+ "web-sys",
+]
+
+[[package]]
+name = "voicevox-ort-sys"
+version = "2.0.0-rc.2"
+source = "git+https://github.com/VOICEVOX/ort.git?rev=a2d6ae22327869e896bf4c16828734d09516d2d9#a2d6ae22327869e896bf4c16828734d09516d2d9"
+dependencies = [
+ "flate2",
+ "sha2",
+ "tar",
+ "ureq",
+]
+
 [[package]]
 name = "voicevox_core"
 version = "0.0.0"
@@ -3559,7 +3590,6 @@ dependencies = [
  "nanoid",
  "ndarray",
  "once_cell",
- "onnxruntime",
  "open_jtalk",
  "ouroboros",
  "pretty_assertions",
@@ -3578,6 +3608,7 @@ dependencies = [
  "tokio",
  "tracing",
  "uuid",
+ "voicevox-ort",
  "voicevox_core_macros",
  "windows",
  "zip",
@@ -3797,6 +3828,12 @@ dependencies = [
  "webpki",
 ]
 
+[[package]]
+name = "webpki-roots"
+version = "0.25.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "5f20c57d8d7db6d3b86154206ae5d8fba62dd39573114de97c2cb0578251f8e1"
+
 [[package]]
 name = "which"
 version = "4.3.0"
diff --git a/Cargo.toml b/Cargo.toml
index 69d924a16..7102127d5 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -86,9 +86,9 @@ voicevox_core = { path = "crates/voicevox_core" }
 windows = "0.43.0"
 zip = "0.6.3"
 
-[workspace.dependencies.onnxruntime]
-git = "https://github.com/VOICEVOX/onnxruntime-rs.git"
-rev = "ebb9dcb9b26ee681889b52b6db3b4f642b04a250"
+[workspace.dependencies.voicevox-ort]
+git = "https://github.com/VOICEVOX/ort.git"
+rev = "a2d6ae22327869e896bf4c16828734d09516d2d9"
 
 [workspace.dependencies.open_jtalk]
 git = "https://github.com/VOICEVOX/open_jtalk-rs.git"
diff --git a/crates/voicevox_core/Cargo.toml b/crates/voicevox_core/Cargo.toml
index 5c8dd440d..731862356 100644
--- a/crates/voicevox_core/Cargo.toml
+++ b/crates/voicevox_core/Cargo.toml
@@ -6,7 +6,8 @@ publish.workspace = true
 
 [features]
 default = []
-directml = ["onnxruntime/directml"]
+cuda = ["voicevox-ort/cuda"]
+directml = ["voicevox-ort/directml"]
 
 [dependencies]
 anyhow.workspace = true
@@ -27,7 +28,6 @@ jlabel.workspace = true
 nanoid.workspace = true
 ndarray.workspace = true
 once_cell.workspace = true
-onnxruntime.workspace = true
 open_jtalk.workspace = true
 ouroboros.workspace = true
 rayon.workspace = true
@@ -43,6 +43,7 @@ tokio = { workspace = true, features = ["rt"] } # FIXME: feature-gateする
 tracing.workspace = true
 uuid = { workspace = true, features = ["v4", "serde"] }
 voicevox_core_macros = { path = "../voicevox_core_macros" }
+voicevox-ort = { workspace = true, features = ["ndarray", "download-binaries"] }
 zip.workspace = true
 
 [dev-dependencies]
diff --git a/crates/voicevox_core/src/infer.rs b/crates/voicevox_core/src/infer.rs
index fc8954e7d..c2cad1d7d 100644
--- a/crates/voicevox_core/src/infer.rs
+++ b/crates/voicevox_core/src/infer.rs
@@ -79,16 +79,20 @@ pub(crate) trait InferenceSignature: Sized + Send + 'static {
 pub(crate) trait InferenceInputSignature: Send + 'static {
     type Signature: InferenceSignature<Input = Self>;
     const PARAM_INFOS: &'static [ParamInfo<InputScalarKind>];
-    fn make_run_context<R: InferenceRuntime>(self, sess: &mut R::Session) -> R::RunContext<'_>;
+    fn make_run_context<R: InferenceRuntime>(
+        self,
+        sess: &mut R::Session,
+    ) -> anyhow::Result<R::RunContext<'_>>;
 }
 
 pub(crate) trait InputScalar: Sized {
     const KIND: InputScalarKind;
 
+    // TODO: `Array`ではなく`ArrayView`を取ることができるかもしれない
     fn push_tensor_to_ctx(
         tensor: Array<Self, impl Dimension + 'static>,
         visitor: &mut impl PushInputTensor,
-    );
+    ) -> anyhow::Result<()>;
 }
 
 #[duplicate_item(
@@ -102,8 +106,8 @@ impl InputScalar for T {
     fn push_tensor_to_ctx(
         tensor: Array<Self, impl Dimension + 'static>,
         ctx: &mut impl PushInputTensor,
-    ) {
-        ctx.push(tensor);
+    ) -> anyhow::Result<()> {
+        ctx.push(tensor)
     }
 }
 
@@ -117,8 +121,8 @@ pub(crate) enum InputScalarKind {
 }
 
 pub(crate) trait PushInputTensor {
-    fn push_int64(&mut self, tensor: Array<i64, impl Dimension + 'static>);
-    fn push_float32(&mut self, tensor: Array<f32, impl Dimension + 'static>);
+    fn push_int64(&mut self, tensor: Array<i64, impl Dimension + 'static>) -> anyhow::Result<()>;
+    fn push_float32(&mut self, tensor: Array<f32, impl Dimension + 'static>) -> anyhow::Result<()>;
 }
 
 /// 推論操作の出力シグネチャ。
diff --git a/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs b/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs
index 0556b6d51..f8f376837 100644
--- a/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs
+++ b/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs
@@ -1,18 +1,15 @@
 use std::{fmt::Debug, vec};
 
-use anyhow::anyhow;
+use anyhow::{anyhow, bail, ensure};
 use duplicate::duplicate_item;
 use ndarray::{Array, Dimension};
-use once_cell::sync::Lazy;
-use onnxruntime::{
-    environment::Environment, GraphOptimizationLevel, LoggingLevel, TensorElementDataType,
-    TypeToTensorElementDataType,
+use ort::{
+    CPUExecutionProvider, CUDAExecutionProvider, DirectMLExecutionProvider, ExecutionProvider as _,
+    GraphOptimizationLevel, IntoTensorElementType, TensorElementType, ValueType,
 };
 
 use crate::{devices::SupportedDevices, error::ErrorRepr};
 
-use self::assert_send::AssertSend;
-
 use super::super::{
     DecryptModelError, InferenceRuntime, InferenceSessionOptions, InputScalarKind,
     OutputScalarKind, OutputTensor, ParamInfo, PushInputTensor,
@@ -22,29 +19,28 @@ use super::super::{
 pub(crate) enum Onnxruntime {}
 
 impl InferenceRuntime for Onnxruntime {
-    type Session = AssertSend<onnxruntime::session::Session<'static>>;
+    type Session = ort::Session;
     type RunContext<'a> = OnnxruntimeRunContext<'a>;
 
     fn supported_devices() -> crate::Result<SupportedDevices> {
-        let mut cuda_support = false;
-        let mut dml_support = false;
-        for provider in onnxruntime::session::get_available_providers()
-            .map_err(Into::into)
-            .map_err(ErrorRepr::GetSupportedDevices)?
-            .iter()
-        {
-            match provider.as_str() {
-                "CUDAExecutionProvider" => cuda_support = true,
-                "DmlExecutionProvider" => dml_support = true,
-                _ => {}
-            }
-        }
+        // TODO: `InferenceRuntime::init`と`InitInferenceRuntimeError`を作る
+        build_ort_env_once().unwrap();
+
+        (|| {
+            let cpu = CPUExecutionProvider::default().is_available()?;
+            let cuda = CUDAExecutionProvider::default().is_available()?;
+            let dml = DirectMLExecutionProvider::default().is_available()?;
 
-        Ok(SupportedDevices {
-            cpu: true,
-            cuda: cuda_support,
-            dml: dml_support,
-        })
+            ensure!(cpu, "missing `CPUExecutionProvider`");
+
+            Ok(SupportedDevices {
+                cpu: true,
+                cuda,
+                dml,
+            })
+        })()
+        .map_err(ErrorRepr::GetSupportedDevices)
+        .map_err(Into::into)
     }
 
     fn new_session(
@@ -55,48 +51,52 @@ impl InferenceRuntime for Onnxruntime {
         Vec<ParamInfo<InputScalarKind>>,
         Vec<ParamInfo<OutputScalarKind>>,
     )> {
-        let mut builder = ENVIRONMENT
-            .new_session_builder()?
-            .with_optimization_level(GraphOptimizationLevel::Basic)?
-            .with_intra_op_num_threads(options.cpu_num_threads.into())?
-            .with_inter_op_num_threads(options.cpu_num_threads.into())?;
-
-        if options.use_gpu {
-            #[cfg(feature = "directml")]
-            {
-                use onnxruntime::ExecutionMode;
-
-                builder = builder
-                    .with_disable_mem_pattern()?
-                    .with_execution_mode(ExecutionMode::ORT_SEQUENTIAL)?
-                    .with_append_execution_provider_directml(0)?;
-            }
-
-            #[cfg(not(feature = "directml"))]
-            {
-                builder = builder.with_append_execution_provider_cuda(Default::default())?;
-            }
+        // TODO: `InferenceRuntime::init`と`InitInferenceRuntimeError`を作る
+        build_ort_env_once().unwrap();
+
+        let mut builder = ort::Session::builder()?
+            .with_optimization_level(GraphOptimizationLevel::Level1)?
+            .with_intra_threads(options.cpu_num_threads.into())?;
+
+        if options.use_gpu && cfg!(feature = "directml") {
+            builder = builder
+                .with_parallel_execution(false)?
+                .with_memory_pattern(false)?;
+            DirectMLExecutionProvider::default().register(&builder)?;
+        } else if options.use_gpu && cfg!(feature = "cuda") {
+            CUDAExecutionProvider::default().register(&builder)?;
         }
 
         let model = model()?;
-        let sess = AssertSend::from(builder.with_model_from_memory(model)?);
+        let sess = builder.commit_from_memory(&{ model })?;
 
         let input_param_infos = sess
             .inputs
             .iter()
             .map(|info| {
-                let dt = match info.input_type {
-                    TensorElementDataType::Float => Ok(InputScalarKind::Float32),
-                    TensorElementDataType::Uint8 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_UINT8"),
-                    TensorElementDataType::Int8 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_INT8"),
-                    TensorElementDataType::Uint16 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_UINT16"),
-                    TensorElementDataType::Int16 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_INT16"),
-                    TensorElementDataType::Int32 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_INT32"),
-                    TensorElementDataType::Int64 => Ok(InputScalarKind::Int64),
-                    TensorElementDataType::String => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_STRING"),
-                    TensorElementDataType::Double => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_DOUBLE"),
-                    TensorElementDataType::Uint32 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_UINT32"),
-                    TensorElementDataType::Uint64 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_UINT64"),
+                let ValueType::Tensor { ty, .. } = info.input_type else {
+                    bail!(
+                        "unexpected input value type for `{}`. currently `ONNX_TYPE_TENSOR` and \
+                         `ONNX_TYPE_SPARSETENSOR` is supported",
+                        info.name,
+                    );
+                };
+
+                let dt = match ty {
+                    TensorElementType::Float32 => Ok(InputScalarKind::Float32),
+                    TensorElementType::Uint8 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_UINT8"),
+                    TensorElementType::Int8 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_INT8"),
+                    TensorElementType::Uint16 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_UINT16"),
+                    TensorElementType::Int16 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_INT16"),
+                    TensorElementType::Int32 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_INT32"),
+                    TensorElementType::Int64 => Ok(InputScalarKind::Int64),
+                    TensorElementType::String => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_STRING"),
+                    TensorElementType::Bfloat16 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_BFLOAT16"),
+                    TensorElementType::Float16 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_FLOAT16"),
+                    TensorElementType::Float64 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_DOUBLE"),
+                    TensorElementType::Uint32 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_UINT32"),
+                    TensorElementType::Uint64 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_UINT64"),
+                    TensorElementType::Bool => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_BOOL"),
                 }
                 .map_err(|actual| {
                     anyhow!("unsupported input datatype `{actual}` for `{}`", info.name)
@@ -105,7 +105,7 @@ impl InferenceRuntime for Onnxruntime {
                 Ok(ParamInfo {
                     name: info.name.clone().into(),
                     dt,
-                    ndim: Some(info.dimensions.len()),
+                    ndim: info.input_type.tensor_dimensions().map(Vec::len),
                 })
             })
             .collect::<anyhow::Result<_>>()?;
@@ -114,18 +114,29 @@ impl InferenceRuntime for Onnxruntime {
             .outputs
             .iter()
             .map(|info| {
-                let dt = match info.output_type {
-                    TensorElementDataType::Float => Ok(OutputScalarKind::Float32),
-                    TensorElementDataType::Uint8 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_UINT8"),
-                    TensorElementDataType::Int8 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_INT8"),
-                    TensorElementDataType::Uint16 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_UINT16"),
-                    TensorElementDataType::Int16 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_INT16"),
-                    TensorElementDataType::Int32 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_INT32"),
-                    TensorElementDataType::Int64 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_INT64"),
-                    TensorElementDataType::String => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_STRING"),
-                    TensorElementDataType::Double => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_DOUBLE"),
-                    TensorElementDataType::Uint32 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_UINT32"),
-                    TensorElementDataType::Uint64 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_UINT64"),
+                let ValueType::Tensor { ty, .. } = info.output_type else {
+                    bail!(
+                        "unexpected output value type for `{}`. currently `ONNX_TYPE_TENSOR` and \
+                         `ONNX_TYPE_SPARSETENSOR` is supported",
+                        info.name,
+                    );
+                };
+
+                let dt = match ty {
+                    TensorElementType::Float32 => Ok(OutputScalarKind::Float32),
+                    TensorElementType::Uint8 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_UINT8"),
+                    TensorElementType::Int8 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_INT8"),
+                    TensorElementType::Uint16 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_UINT16"),
+                    TensorElementType::Int16 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_INT16"),
+                    TensorElementType::Int32 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_INT32"),
+                    TensorElementType::Int64 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_INT64"),
+                    TensorElementType::String => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_STRING"),
+                    TensorElementType::Bfloat16 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_BFLOAT16"),
+                    TensorElementType::Float16 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_FLOAT16"),
+                    TensorElementType::Float64 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_DOUBLE"),
+                    TensorElementType::Uint32 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_UINT32"),
+                    TensorElementType::Uint64 => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_UINT64"),
+                    TensorElementType::Bool => Err("ONNX_TENSOR_ELEMENT_DATA_TYPE_BOOL"),
                 }
                 .map_err(|actual| {
                     anyhow!("unsupported output datatype `{actual}` for `{}`", info.name)
@@ -134,73 +145,69 @@ impl InferenceRuntime for Onnxruntime {
                 Ok(ParamInfo {
                     name: info.name.clone().into(),
                     dt,
-                    ndim: Some(info.dimensions.len()),
+                    ndim: info.output_type.tensor_dimensions().map(|d| d.len()),
                 })
             })
             .collect::<anyhow::Result<_>>()?;
 
-        return Ok((sess, input_param_infos, output_param_infos));
-
-        static ENVIRONMENT: Lazy<Environment> = Lazy::new(|| {
-            Environment::builder()
-                .with_name(env!("CARGO_PKG_NAME"))
-                .with_log_level(LOGGING_LEVEL)
-                .build()
-                .unwrap()
-        });
-
-        const LOGGING_LEVEL: LoggingLevel = if cfg!(debug_assertions) {
-            LoggingLevel::Verbose
-        } else {
-            LoggingLevel::Warning
-        };
+        Ok((sess, input_param_infos, output_param_infos))
     }
 
     fn run(
-        OnnxruntimeRunContext { sess, mut inputs }: OnnxruntimeRunContext<'_>,
+        OnnxruntimeRunContext { sess, inputs }: OnnxruntimeRunContext<'_>,
     ) -> anyhow::Result<Vec<OutputTensor>> {
-        // FIXME: 現状では`f32`のみ対応。実行時にsessionからdatatypeが取れるので、別の型の対応も
-        // おそらく可能ではあるが、それが必要になるよりもortクレートへの引越しが先になると思われる
-        // のでこのままにする。
-
-        if !sess
-            .outputs
-            .iter()
-            .all(|info| matches!(info.output_type, TensorElementDataType::Float))
-        {
-            unimplemented!(
-                "currently only `ONNX_TENSOR_ELEMENT_DATA_TYPE_FLOAT` is supported for output",
-            );
-        }
-
-        let outputs = sess.run::<f32>(inputs.iter_mut().map(|t| &mut **t as &mut _).collect())?;
-
-        Ok(outputs
-            .iter()
-            .map(|o| OutputTensor::Float32((*o).clone().into_owned()))
-            .collect())
+        let outputs = sess.run(&*inputs)?;
+
+        (0..outputs.len())
+            .map(|i| {
+                let output = &outputs[i];
+
+                let ValueType::Tensor { ty, .. } = output.dtype()? else {
+                    bail!(
+                        "unexpected output. currently `ONNX_TYPE_TENSOR` and \
+                         `ONNX_TYPE_SPARSETENSOR` is supported",
+                    );
+                };
+
+                match ty {
+                    TensorElementType::Float32 => {
+                        let output = output.try_extract_tensor::<f32>()?;
+                        Ok(OutputTensor::Float32(output.into_owned()))
+                    }
+                    _ => bail!("unexpected output tensor element data type"),
+                }
+            })
+            .collect()
     }
 }
 
+fn build_ort_env_once() -> ort::Result<()> {
+    static ONCE: once_cell::sync::OnceCell<()> = once_cell::sync::OnceCell::new();
+    ONCE.get_or_try_init(|| ort::init().with_name(env!("CARGO_PKG_NAME")).commit())?;
+    Ok(())
+}
+
 pub(crate) struct OnnxruntimeRunContext<'sess> {
-    sess: &'sess mut AssertSend<onnxruntime::session::Session<'static>>,
-    inputs: Vec<Box<dyn onnxruntime::session::AnyArray>>,
+    sess: &'sess ort::Session,
+    inputs: Vec<ort::SessionInputValue<'static>>,
 }
 
 impl OnnxruntimeRunContext<'_> {
     fn push_input(
         &mut self,
-        input: Array<impl TypeToTensorElementDataType + Debug + 'static, impl Dimension + 'static>,
-    ) {
-        self.inputs
-            .push(Box::new(onnxruntime::session::NdArray::new(input)));
+        input: Array<
+            impl IntoTensorElementType + Debug + Clone + 'static,
+            impl Dimension + 'static,
+        >,
+    ) -> anyhow::Result<()> {
+        let input = ort::Value::from_array(input)?.into();
+        self.inputs.push(input);
+        Ok(())
     }
 }
 
-impl<'sess> From<&'sess mut AssertSend<onnxruntime::session::Session<'static>>>
-    for OnnxruntimeRunContext<'sess>
-{
-    fn from(sess: &'sess mut AssertSend<onnxruntime::session::Session<'static>>) -> Self {
+impl<'sess> From<&'sess mut ort::Session> for OnnxruntimeRunContext<'sess> {
+    fn from(sess: &'sess mut ort::Session) -> Self {
         Self {
             sess,
             inputs: vec![],
@@ -214,40 +221,7 @@ impl PushInputTensor for OnnxruntimeRunContext<'_> {
         [ push_int64 ]   [ i64 ];
         [ push_float32 ] [ f32 ];
     )]
-    fn method(&mut self, tensor: Array<T, impl Dimension + 'static>) {
-        self.push_input(tensor);
-    }
-}
-
-// FIXME: 以下のことをちゃんと確認した後、onnxruntime-rs側で`Session`が`Send`であると宣言する。
-// https://github.com/VOICEVOX/voicevox_core/issues/307#issuecomment-1276184614
-mod assert_send {
-    use std::ops::{Deref, DerefMut};
-
-    pub(crate) struct AssertSend<T>(T);
-
-    impl From<onnxruntime::session::Session<'static>>
-        for AssertSend<onnxruntime::session::Session<'static>>
-    {
-        fn from(session: onnxruntime::session::Session<'static>) -> Self {
-            Self(session)
-        }
+    fn method(&mut self, tensor: Array<T, impl Dimension + 'static>) -> anyhow::Result<()> {
+        self.push_input(tensor)
     }
-
-    impl<T> Deref for AssertSend<T> {
-        type Target = T;
-
-        fn deref(&self) -> &Self::Target {
-            &self.0
-        }
-    }
-
-    impl<T> DerefMut for AssertSend<T> {
-        fn deref_mut(&mut self) -> &mut Self::Target {
-            &mut self.0
-        }
-    }
-
-    // SAFETY: `Session` is probably "send"able.
-    unsafe impl<T> Send for AssertSend<T> {}
 }
diff --git a/crates/voicevox_core/src/infer/session_set.rs b/crates/voicevox_core/src/infer/session_set.rs
index 56d570f98..cdd179680 100644
--- a/crates/voicevox_core/src/infer/session_set.rs
+++ b/crates/voicevox_core/src/infer/session_set.rs
@@ -94,9 +94,8 @@ impl<R: InferenceRuntime, I: InferenceInputSignature> InferenceSessionCell<R, I>
         input: I,
     ) -> crate::Result<<I::Signature as InferenceSignature>::Output> {
         let inner = &mut self.inner.lock().unwrap();
-        let ctx = input.make_run_context::<R>(inner);
-        R::run(ctx)
-            .and_then(TryInto::try_into)
-            .map_err(|e| ErrorRepr::InferenceFailed(e).into())
+        (|| R::run(input.make_run_context::<R>(inner)?)?.try_into())()
+            .map_err(ErrorRepr::InferenceFailed)
+            .map_err(Into::into)
     }
 }
diff --git a/crates/voicevox_core_c_api/Cargo.toml b/crates/voicevox_core_c_api/Cargo.toml
index a6314f105..ad3a65fa7 100644
--- a/crates/voicevox_core_c_api/Cargo.toml
+++ b/crates/voicevox_core_c_api/Cargo.toml
@@ -13,6 +13,7 @@ harness = false
 name = "e2e"
 
 [features]
+cuda = ["voicevox_core/cuda"]
 directml = ["voicevox_core/directml"]
 
 [dependencies]
diff --git a/crates/voicevox_core_c_api/src/lib.rs b/crates/voicevox_core_c_api/src/lib.rs
index a5da9b6d3..fbb0bf6bf 100644
--- a/crates/voicevox_core_c_api/src/lib.rs
+++ b/crates/voicevox_core_c_api/src/lib.rs
@@ -59,7 +59,13 @@ fn init_logger_once() {
             .with_env_filter(if env::var_os(EnvFilter::DEFAULT_ENV).is_some() {
                 EnvFilter::from_default_env()
             } else {
-                "error,voicevox_core=info,voicevox_core_c_api=info,onnxruntime=info".into()
+                pub const ORT_LOGGING_LEVEL: &str = if cfg!(debug_assertions) {
+                    "info"
+                } else {
+                    "warn"
+                };
+                format!("error,voicevox_core=info,voicevox_core_c_api=info,ort={ORT_LOGGING_LEVEL}")
+                    .into()
             })
             .with_timer(local_time as fn(&mut Writer<'_>) -> _)
             .with_ansi(ansi)
diff --git a/crates/voicevox_core_c_api/tests/e2e/assert_cdylib.rs b/crates/voicevox_core_c_api/tests/e2e/assert_cdylib.rs
index 1e4958eda..cfbec5c31 100644
--- a/crates/voicevox_core_c_api/tests/e2e/assert_cdylib.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/assert_cdylib.rs
@@ -46,11 +46,7 @@ pub(crate) fn exec<C: TestContext>() -> anyhow::Result<()> {
     // テスト対象が無いときに`cargo build`をスキップしたいが、判定部分がプライベート。
     // そのためスキップするのはCLIオプションに`--ignored`か`--include-ignored`が無いときのみ
     if args.ignored || args.include_ignored {
-        let mut cmd = cmd!(env!("CARGO"), "build", "--release", "--lib");
-        for (k, v) in C::BUILD_ENVS {
-            cmd = cmd.env(k, v);
-        }
-        cmd.run()?;
+        cmd!(env!("CARGO"), "build", "--release", "--lib").run()?;
 
         ensure!(
             C::cdylib_path().exists(),
@@ -102,7 +98,6 @@ pub(crate) fn exec<C: TestContext>() -> anyhow::Result<()> {
 pub(crate) trait TestContext {
     const TARGET_DIR: &'static str;
     const CDYLIB_NAME: &'static str;
-    const BUILD_ENVS: &'static [(&'static str, &'static str)];
     const RUNTIME_ENVS: &'static [(&'static str, &'static str)];
 }
 
diff --git a/crates/voicevox_core_c_api/tests/e2e/main.rs b/crates/voicevox_core_c_api/tests/e2e/main.rs
index 91f5e06e9..43dc3a95e 100644
--- a/crates/voicevox_core_c_api/tests/e2e/main.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/main.rs
@@ -24,16 +24,6 @@ fn main() -> anyhow::Result<()> {
     impl assert_cdylib::TestContext for TestContext {
         const TARGET_DIR: &'static str = "../../target";
         const CDYLIB_NAME: &'static str = "voicevox_core";
-        const BUILD_ENVS: &'static [(&'static str, &'static str)] = &[
-            // 他の単体テストが動いているときにonnxruntime-sysの初回ビルドを行うと、Windows環境だと
-            // `$ORT_OUT_DIR`のハックが問題を起こす。そのためこのハック自体を無効化する
-            //
-            // featuresの差分を出さないように`cargo build`することができればonnxruntime-sysの
-            // ビルド自体がされないのだが、このバイナリから`cargo build`の状況を知るのは無理に近い
-            ("ORT_OUT_DIR", ""),
-            // DirectMLとCUDAは無効化
-            ("ORT_USE_CUDA", "0"),
-        ];
         const RUNTIME_ENVS: &'static [(&'static str, &'static str)] =
             &[("VV_MODELS_ROOT_DIR", VV_MODELS_ROOT_DIR)];
     }
diff --git a/crates/voicevox_core_java_api/Cargo.toml b/crates/voicevox_core_java_api/Cargo.toml
index 887813685..06b2af618 100644
--- a/crates/voicevox_core_java_api/Cargo.toml
+++ b/crates/voicevox_core_java_api/Cargo.toml
@@ -8,6 +8,7 @@ publish.workspace = true
 crate-type = ["cdylib"]
 
 [features]
+cuda = ["voicevox_core/cuda"]
 directml = ["voicevox_core/directml"]
 
 [dependencies]
diff --git a/crates/voicevox_core_java_api/settings.gradle b/crates/voicevox_core_java_api/settings.gradle
index 20a5e2c6a..75f5810ac 100644
--- a/crates/voicevox_core_java_api/settings.gradle
+++ b/crates/voicevox_core_java_api/settings.gradle
@@ -40,5 +40,5 @@ gradle.ext {
   gsonVersion = '2.10.1'
   jakartaValidationVersion = '3.0.2'
   jakartaAnnotationVersion = '2.1.1'
-  onnxruntimeVersion = '1.14.0'
+  onnxruntimeVersion = '1.17.3'
 }
diff --git a/crates/voicevox_core_java_api/src/logger.rs b/crates/voicevox_core_java_api/src/logger.rs
index 4800452ca..30545725e 100644
--- a/crates/voicevox_core_java_api/src/logger.rs
+++ b/crates/voicevox_core_java_api/src/logger.rs
@@ -10,10 +10,11 @@ extern "system" fn Java_jp_hiroshiba_voicevoxcore_Dll_00024LoggerInitializer_ini
             android_logger::Config::default()
                 .with_tag("VoicevoxCore")
                 .with_filter(
-                android_logger::FilterBuilder::new()
-                    .parse("error,voicevox_core=info,voicevox_core_java_api=info,onnxruntime=error")
-                    .build(),
-            ),
+                    android_logger::FilterBuilder::new()
+                        // FIXME: ortも`warn`は出すべき
+                        .parse("error,voicevox_core=info,voicevox_core_java_api=info,ort=error")
+                        .build(),
+                ),
         );
     } else {
         // TODO: Android以外でのログ出力を良い感じにする。（System.Loggerを使う？）
@@ -29,7 +30,8 @@ extern "system" fn Java_jp_hiroshiba_voicevoxcore_Dll_00024LoggerInitializer_ini
             .with_env_filter(if env::var_os(EnvFilter::DEFAULT_ENV).is_some() {
                 EnvFilter::from_default_env()
             } else {
-                "error,voicevox_core=info,voicevox_core_c_api=info,onnxruntime=error".into()
+                // FIXME: `c_api`じゃないし、ortも`warn`は出すべき
+                "error,voicevox_core=info,voicevox_core_c_api=info,ort=error".into()
             })
             .with_timer(local_time as fn(&mut Writer<'_>) -> _)
             .with_ansi(out().is_terminal() && env_allows_ansi())
diff --git a/crates/voicevox_core_macros/src/inference_domain.rs b/crates/voicevox_core_macros/src/inference_domain.rs
index 72bc4d18a..d24a20ab1 100644
--- a/crates/voicevox_core_macros/src/inference_domain.rs
+++ b/crates/voicevox_core_macros/src/inference_domain.rs
@@ -223,22 +223,28 @@ pub(crate) fn derive_inference_input_signature(
             fn make_run_context<R: crate::infer::InferenceRuntime>(
                 self,
                 sess: &mut R::Session,
-            ) -> R::RunContext<'_> {
+            ) -> ::anyhow::Result<R::RunContext<'_>> {
                 let mut ctx = <R::RunContext<'_> as ::std::convert::From<_>>::from(sess);
                 #(
-                    __ArrayExt::push_to_ctx(self.#field_names, &mut ctx);
+                    __ArrayExt::push_to_ctx(self.#field_names, &mut ctx)?;
                 )*
-                return ctx;
+                return ::std::result::Result::Ok(ctx);
 
                 trait __ArrayExt {
-                    fn push_to_ctx(self, ctx: &mut impl crate::infer::PushInputTensor);
+                    fn push_to_ctx(
+                        self,
+                        ctx: &mut impl crate::infer::PushInputTensor,
+                    ) -> ::anyhow::Result<()>;
                 }
 
                 impl<A: crate::infer::InputScalar, D: ::ndarray::Dimension + 'static> __ArrayExt
                     for ::ndarray::Array<A, D>
                 {
-                    fn push_to_ctx(self, ctx: &mut impl crate::infer::PushInputTensor) {
-                        A::push_tensor_to_ctx(self, ctx);
+                    fn push_to_ctx(
+                        self,
+                        ctx: &mut impl crate::infer::PushInputTensor,
+                    ) -> ::anyhow::Result<()> {
+                        A::push_tensor_to_ctx(self, ctx)
                     }
                 }
             }
diff --git a/crates/voicevox_core_python_api/Cargo.toml b/crates/voicevox_core_python_api/Cargo.toml
index be3ecbf27..5ccd1dc41 100644
--- a/crates/voicevox_core_python_api/Cargo.toml
+++ b/crates/voicevox_core_python_api/Cargo.toml
@@ -8,6 +8,7 @@ publish.workspace = true
 crate-type = ["cdylib"]
 
 [features]
+cuda = ["voicevox_core/cuda"]
 directml = ["voicevox_core/directml"]
 
 [dependencies]

From 9c3a94e663263595e9e9df0c0b763620c0e1615c Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Fri, 24 May 2024 08:00:24 +0900
Subject: [PATCH 02/36] =?UTF-8?q?change:=20`style=5Fid=5Fto=5Fmodel=5Finne?=
 =?UTF-8?q?r=5Fid`=20=E2=86=92=20`style=5Fid=5Fto=5Finner=5Fvoice=5Fid`=20?=
 =?UTF-8?q?(#795)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 crates/voicevox_core/src/manifest.rs    | 16 ++++----
 crates/voicevox_core/src/status.rs      | 50 ++++++++++++-------------
 crates/voicevox_core/src/synthesizer.rs | 12 +++---
 crates/voicevox_core/src/voice_model.rs | 24 ++++++------
 model/sample.vvm/manifest.json          |  2 +-
 5 files changed, 52 insertions(+), 52 deletions(-)

diff --git a/crates/voicevox_core/src/manifest.rs b/crates/voicevox_core/src/manifest.rs
index 3b17ae3f1..a22b66e8b 100644
--- a/crates/voicevox_core/src/manifest.rs
+++ b/crates/voicevox_core/src/manifest.rs
@@ -19,18 +19,18 @@ impl Display for ManifestVersion {
 }
 
 /// モデル内IDの実体
-pub type RawModelInnerId = u32;
+pub type RawInnerVoiceId = u32;
 /// モデル内ID
 #[derive(PartialEq, Eq, Clone, Copy, Ord, PartialOrd, Deserialize, Serialize, new, Debug)]
-pub struct ModelInnerId(RawModelInnerId);
+pub struct InnerVoiceId(RawInnerVoiceId);
 
-impl ModelInnerId {
-    pub fn raw_id(self) -> RawModelInnerId {
+impl InnerVoiceId {
+    pub fn raw_id(self) -> RawInnerVoiceId {
         self.0
     }
 }
 
-impl Display for ModelInnerId {
+impl Display for InnerVoiceId {
     fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
         write!(f, "{}", self.raw_id())
     }
@@ -58,12 +58,12 @@ pub(crate) struct TalkManifest {
     pub(crate) predict_intonation_filename: String,
     pub(crate) decode_filename: String,
     #[serde(default)]
-    pub(crate) style_id_to_model_inner_id: StyleIdToModelInnerId,
+    pub(crate) style_id_to_inner_voice_id: StyleIdToInnerVoiceId,
 }
 
 #[serde_as]
 #[derive(Default, Clone, Deref, Deserialize)]
 #[deref(forward)]
-pub(crate) struct StyleIdToModelInnerId(
-    #[serde_as(as = "Arc<BTreeMap<DisplayFromStr, _>>")] Arc<BTreeMap<StyleId, ModelInnerId>>,
+pub(crate) struct StyleIdToInnerVoiceId(
+    #[serde_as(as = "Arc<BTreeMap<DisplayFromStr, _>>")] Arc<BTreeMap<StyleId, InnerVoiceId>>,
 );
diff --git a/crates/voicevox_core/src/status.rs b/crates/voicevox_core/src/status.rs
index a47de689b..6980ab7fc 100644
--- a/crates/voicevox_core/src/status.rs
+++ b/crates/voicevox_core/src/status.rs
@@ -14,9 +14,9 @@ use crate::{
         InferenceDomain, InferenceInputSignature, InferenceRuntime, InferenceSessionOptions,
         InferenceSignature,
     },
-    manifest::{ModelInnerId, StyleIdToModelInnerId},
+    manifest::{InnerVoiceId, StyleIdToInnerVoiceId},
     metas::{self, SpeakerMeta, StyleId, StyleMeta, VoiceModelMeta},
-    voice_model::{ModelBytesWithInnerIdsByDomain, VoiceModelHeader, VoiceModelId},
+    voice_model::{ModelBytesWithInnerVoiceIdsByDomain, VoiceModelHeader, VoiceModelId},
     Result,
 };
 
@@ -36,7 +36,7 @@ impl<R: InferenceRuntime> Status<R> {
     pub(crate) fn insert_model(
         &self,
         model_header: &VoiceModelHeader,
-        model_contents: &InferenceDomainMap<ModelBytesWithInnerIdsByDomain>,
+        model_contents: &InferenceDomainMap<ModelBytesWithInnerVoiceIdsByDomain>,
     ) -> Result<()> {
         self.loaded_models
             .lock()
@@ -66,14 +66,14 @@ impl<R: InferenceRuntime> Status<R> {
         self.loaded_models.lock().unwrap().metas()
     }
 
-    /// あるスタイルに対応する`VoiceModelId`と`ModelInnerId`の組を返す。
+    /// あるスタイルに対応する`VoiceModelId`と`InnerVoiceId`の組を返す。
     ///
-    /// `StyleId` → `ModelInnerId`のマッピングが存在しない場合は、`ModelInnerId`としては
+    /// `StyleId` → `InnerVoiceId`のマッピングが存在しない場合は、`InnerVoiceId`としては
     /// `style_id`と同じ値を返す。
     pub(crate) fn ids_for<D: InferenceDomainExt>(
         &self,
         style_id: StyleId,
-    ) -> Result<(VoiceModelId, ModelInnerId)> {
+    ) -> Result<(VoiceModelId, InnerVoiceId)> {
         self.loaded_models.lock().unwrap().ids_for::<D>(style_id)
     }
 
@@ -122,7 +122,7 @@ struct LoadedModels<R: InferenceRuntime>(IndexMap<VoiceModelId, LoadedModel<R>>)
 
 struct LoadedModel<R: InferenceRuntime> {
     metas: VoiceModelMeta,
-    session_sets_with_inner_ids: InferenceDomainMap<SessionSetsWithInnerIdsByDomain<R>>,
+    session_sets_with_inner_ids: InferenceDomainMap<SessionSetsWithInnerVoiceIdsByDomain<R>>,
 }
 
 impl<R: InferenceRuntime> LoadedModels<R> {
@@ -133,7 +133,7 @@ impl<R: InferenceRuntime> LoadedModels<R> {
     fn ids_for<D: InferenceDomainExt>(
         &self,
         style_id: StyleId,
-    ) -> Result<(VoiceModelId, ModelInnerId)> {
+    ) -> Result<(VoiceModelId, InnerVoiceId)> {
         let (
             model_id,
             LoadedModel {
@@ -153,13 +153,13 @@ impl<R: InferenceRuntime> LoadedModels<R> {
                 style_types: D::style_types(),
             })?;
 
-        let model_inner_id = session_sets_with_inner_ids
+        let inner_voice_id = session_sets_with_inner_ids
             .get::<D>()
             .as_ref()
-            .and_then(|(model_inner_ids, _)| model_inner_ids.get(&style_id).copied())
-            .unwrap_or_else(|| ModelInnerId::new(style_id.raw_id()));
+            .and_then(|(inner_voice_ids, _)| inner_voice_ids.get(&style_id).copied())
+            .unwrap_or_else(|| InnerVoiceId::new(style_id.raw_id()));
 
-        Ok((model_id.clone(), model_inner_id))
+        Ok((model_id.clone(), inner_voice_id))
     }
 
     /// # Panics
@@ -250,7 +250,7 @@ impl<R: InferenceRuntime> LoadedModels<R> {
     fn insert(
         &mut self,
         model_header: &VoiceModelHeader,
-        session_sets_with_inner_ids: InferenceDomainMap<SessionSetsWithInnerIdsByDomain<R>>,
+        session_sets_with_inner_ids: InferenceDomainMap<SessionSetsWithInnerVoiceIdsByDomain<R>>,
     ) -> Result<()> {
         self.ensure_acceptable(model_header)?;
 
@@ -286,8 +286,8 @@ impl<R: InferenceRuntime> LoadedModels<R> {
 
 pub(crate) trait InferenceDomainExt: InferenceDomain {
     fn visit<R: InferenceRuntime>(
-        map: &InferenceDomainMap<SessionSetsWithInnerIdsByDomain<R>>,
-    ) -> Option<&(StyleIdToModelInnerId, InferenceSessionSet<R, Self>)>;
+        map: &InferenceDomainMap<SessionSetsWithInnerVoiceIdsByDomain<R>>,
+    ) -> Option<&(StyleIdToInnerVoiceId, InferenceSessionSet<R, Self>)>;
 }
 
 #[duplicate_item(
@@ -296,25 +296,25 @@ pub(crate) trait InferenceDomainExt: InferenceDomain {
 )]
 impl InferenceDomainExt for T {
     fn visit<R: InferenceRuntime>(
-        map: &InferenceDomainMap<SessionSetsWithInnerIdsByDomain<R>>,
-    ) -> Option<&(StyleIdToModelInnerId, InferenceSessionSet<R, Self>)> {
+        map: &InferenceDomainMap<SessionSetsWithInnerVoiceIdsByDomain<R>>,
+    ) -> Option<&(StyleIdToInnerVoiceId, InferenceSessionSet<R, Self>)> {
         map.field.as_ref()
     }
 }
 
-impl<R: InferenceRuntime> InferenceDomainMap<SessionSetsWithInnerIdsByDomain<R>> {
+impl<R: InferenceRuntime> InferenceDomainMap<SessionSetsWithInnerVoiceIdsByDomain<R>> {
     fn get<D: InferenceDomainExt>(
         &self,
-    ) -> Option<&(StyleIdToModelInnerId, InferenceSessionSet<R, D>)> {
+    ) -> Option<&(StyleIdToInnerVoiceId, InferenceSessionSet<R, D>)> {
         D::visit(self)
     }
 }
 
-impl InferenceDomainMap<ModelBytesWithInnerIdsByDomain> {
+impl InferenceDomainMap<ModelBytesWithInnerVoiceIdsByDomain> {
     fn create_session_sets<R: InferenceRuntime>(
         &self,
         session_options: &InferenceDomainMap<SessionOptionsByDomain>,
-    ) -> anyhow::Result<InferenceDomainMap<SessionSetsWithInnerIdsByDomain<R>>> {
+    ) -> anyhow::Result<InferenceDomainMap<SessionSetsWithInnerVoiceIdsByDomain<R>>> {
         duplicate! {
             [
                 field;
@@ -323,9 +323,9 @@ impl InferenceDomainMap<ModelBytesWithInnerIdsByDomain> {
             let field = self
                 .field
                 .as_ref()
-                .map(|(model_inner_ids, model_bytes)| {
+                .map(|(inner_voice_ids, model_bytes)| {
                     let session_set = InferenceSessionSet::new(model_bytes, &session_options.field)?;
-                    Ok::<_, anyhow::Error>((model_inner_ids.clone(), session_set))
+                    Ok::<_, anyhow::Error>((inner_voice_ids.clone(), session_set))
                 })
                 .transpose()?;
         }
@@ -336,8 +336,8 @@ impl InferenceDomainMap<ModelBytesWithInnerIdsByDomain> {
 
 type SessionOptionsByDomain = (EnumMap<TalkOperation, InferenceSessionOptions>,);
 
-type SessionSetsWithInnerIdsByDomain<R> =
-    (Option<(StyleIdToModelInnerId, InferenceSessionSet<R, TalkDomain>)>,);
+type SessionSetsWithInnerVoiceIdsByDomain<R> =
+    (Option<(StyleIdToInnerVoiceId, InferenceSessionSet<R, TalkDomain>)>,);
 
 #[cfg(test)]
 mod tests {
diff --git a/crates/voicevox_core/src/synthesizer.rs b/crates/voicevox_core/src/synthesizer.rs
index 5e4894415..06555ea28 100644
--- a/crates/voicevox_core/src/synthesizer.rs
+++ b/crates/voicevox_core/src/synthesizer.rs
@@ -836,7 +836,7 @@ pub(crate) mod blocking {
 
     impl<O> PerformInference for self::Synthesizer<O> {
         fn predict_duration(&self, phoneme_vector: &[i64], style_id: StyleId) -> Result<Vec<f32>> {
-            let (model_id, model_inner_id) = self.status.ids_for::<TalkDomain>(style_id)?;
+            let (model_id, inner_voice_id) = self.status.ids_for::<TalkDomain>(style_id)?;
 
             let PredictDurationOutput {
                 phoneme_length: output,
@@ -844,7 +844,7 @@ pub(crate) mod blocking {
                 &model_id,
                 PredictDurationInput {
                     phoneme_list: ndarray::arr1(phoneme_vector),
-                    speaker_id: ndarray::arr1(&[model_inner_id.raw_id().into()]),
+                    speaker_id: ndarray::arr1(&[inner_voice_id.raw_id().into()]),
                 },
             )?;
             let mut output = output.into_raw_vec();
@@ -871,7 +871,7 @@ pub(crate) mod blocking {
             end_accent_phrase_vector: &[i64],
             style_id: StyleId,
         ) -> Result<Vec<f32>> {
-            let (model_id, model_inner_id) = self.status.ids_for::<TalkDomain>(style_id)?;
+            let (model_id, inner_voice_id) = self.status.ids_for::<TalkDomain>(style_id)?;
 
             let PredictIntonationOutput { f0_list: output } = self.status.run_session(
                 &model_id,
@@ -883,7 +883,7 @@ pub(crate) mod blocking {
                     end_accent_list: ndarray::arr1(end_accent_vector),
                     start_accent_phrase_list: ndarray::arr1(start_accent_phrase_vector),
                     end_accent_phrase_list: ndarray::arr1(end_accent_phrase_vector),
-                    speaker_id: ndarray::arr1(&[model_inner_id.raw_id().into()]),
+                    speaker_id: ndarray::arr1(&[inner_voice_id.raw_id().into()]),
                 },
             )?;
 
@@ -898,7 +898,7 @@ pub(crate) mod blocking {
             phoneme_vector: &[f32],
             style_id: StyleId,
         ) -> Result<Vec<f32>> {
-            let (model_id, model_inner_id) = self.status.ids_for::<TalkDomain>(style_id)?;
+            let (model_id, inner_voice_id) = self.status.ids_for::<TalkDomain>(style_id)?;
 
             // 音が途切れてしまうのを避けるworkaround処理が入っている
             // TODO: 改善したらここのpadding処理を取り除く
@@ -925,7 +925,7 @@ pub(crate) mod blocking {
                     phoneme: ndarray::arr1(&phoneme_with_padding)
                         .into_shape([length_with_padding, phoneme_size])
                         .unwrap(),
-                    speaker_id: ndarray::arr1(&[model_inner_id.raw_id().into()]),
+                    speaker_id: ndarray::arr1(&[inner_voice_id.raw_id().into()]),
                 },
             )?;
 
diff --git a/crates/voicevox_core/src/voice_model.rs b/crates/voicevox_core/src/voice_model.rs
index 364c8db0a..358d0153c 100644
--- a/crates/voicevox_core/src/voice_model.rs
+++ b/crates/voicevox_core/src/voice_model.rs
@@ -16,7 +16,7 @@ use crate::{
         domains::{TalkDomain, TalkOperation},
         InferenceDomain,
     },
-    manifest::{Manifest, ManifestDomains, StyleIdToModelInnerId},
+    manifest::{Manifest, ManifestDomains, StyleIdToInnerVoiceId},
     SpeakerMeta, StyleMeta, StyleType, VoiceModelMeta,
 };
 use std::path::{Path, PathBuf};
@@ -26,8 +26,8 @@ use std::path::{Path, PathBuf};
 /// [`VoiceModelId`]: VoiceModelId
 pub type RawVoiceModelId = String;
 
-pub(crate) type ModelBytesWithInnerIdsByDomain =
-    (Option<(StyleIdToModelInnerId, EnumMap<TalkOperation, Vec<u8>>)>,);
+pub(crate) type ModelBytesWithInnerVoiceIdsByDomain =
+    (Option<(StyleIdToInnerVoiceId, EnumMap<TalkOperation, Vec<u8>>)>,);
 
 /// 音声モデルID。
 #[derive(
@@ -164,7 +164,7 @@ pub(crate) mod blocking {
         VoiceModelMeta,
     };
 
-    use super::{ModelBytesWithInnerIdsByDomain, VoiceModelHeader, VoiceModelId};
+    use super::{ModelBytesWithInnerVoiceIdsByDomain, VoiceModelHeader, VoiceModelId};
 
     /// 音声モデル。
     ///
@@ -177,7 +177,7 @@ pub(crate) mod blocking {
     impl self::VoiceModel {
         pub(crate) fn read_inference_models(
             &self,
-        ) -> LoadModelResult<InferenceDomainMap<ModelBytesWithInnerIdsByDomain>> {
+        ) -> LoadModelResult<InferenceDomainMap<ModelBytesWithInnerVoiceIdsByDomain>> {
             let reader = BlockingVvmEntryReader::open(&self.header.path)?;
 
             let talk = self
@@ -191,7 +191,7 @@ pub(crate) mod blocking {
                          predict_duration_filename,
                          predict_intonation_filename,
                          decode_filename,
-                         style_id_to_model_inner_id,
+                         style_id_to_inner_voice_id,
                      }| {
                         let model_bytes = [
                             predict_duration_filename,
@@ -206,7 +206,7 @@ pub(crate) mod blocking {
 
                         let model_bytes = EnumMap::from_array(model_bytes);
 
-                        Ok((style_id_to_model_inner_id.clone(), model_bytes))
+                        Ok((style_id_to_inner_voice_id.clone(), model_bytes))
                     },
                 )
                 .transpose()?;
@@ -307,7 +307,7 @@ pub(crate) mod tokio {
         Result, VoiceModelMeta,
     };
 
-    use super::{ModelBytesWithInnerIdsByDomain, VoiceModelHeader, VoiceModelId};
+    use super::{ModelBytesWithInnerVoiceIdsByDomain, VoiceModelHeader, VoiceModelId};
 
     /// 音声モデル。
     ///
@@ -320,7 +320,7 @@ pub(crate) mod tokio {
     impl self::VoiceModel {
         pub(crate) async fn read_inference_models(
             &self,
-        ) -> LoadModelResult<InferenceDomainMap<ModelBytesWithInnerIdsByDomain>> {
+        ) -> LoadModelResult<InferenceDomainMap<ModelBytesWithInnerVoiceIdsByDomain>> {
             let reader = AsyncVvmEntryReader::open(&self.header.path).await?;
 
             let talk = OptionFuture::from(self.header.manifest.domains().talk.as_ref().map(
@@ -328,7 +328,7 @@ pub(crate) mod tokio {
                      predict_duration_filename,
                      predict_intonation_filename,
                      decode_filename,
-                     style_id_to_model_inner_id,
+                     style_id_to_inner_voice_id,
                  }| async {
                     let (
                         decode_model_result,
@@ -347,7 +347,7 @@ pub(crate) mod tokio {
                         decode_model_result?,
                     ]);
 
-                    Ok((style_id_to_model_inner_id.clone(), model_bytes))
+                    Ok((style_id_to_inner_voice_id.clone(), model_bytes))
                 },
             ))
             .await
@@ -505,7 +505,7 @@ mod tests {
         predict_duration_filename: "".to_owned(),
         predict_intonation_filename: "".to_owned(),
         decode_filename: "".to_owned(),
-        style_id_to_model_inner_id: Default::default(),
+        style_id_to_inner_voice_id: Default::default(),
     });
 
     #[fixture]
diff --git a/model/sample.vvm/manifest.json b/model/sample.vvm/manifest.json
index 2c6721d08..0b82d0c3f 100644
--- a/model/sample.vvm/manifest.json
+++ b/model/sample.vvm/manifest.json
@@ -5,7 +5,7 @@
     "predict_duration_filename": "predict_duration.onnx",
     "predict_intonation_filename": "predict_intonation.onnx",
     "decode_filename": "decode.onnx",
-    "style_id_to_model_inner_id": {
+    "style_id_to_inner_voice_id": {
       "302": 2,
       "303": 3
     }

From 484bd6247a8d2500104e1fc0882a9e9a8a22d2dc Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Fri, 24 May 2024 22:27:50 +0900
Subject: [PATCH 03/36] =?UTF-8?q?change:=20VVM=E3=81=ABUUID=E3=82=92?=
 =?UTF-8?q?=E5=89=B2=E3=82=8A=E6=8C=AF=E3=82=8A=E3=80=81=E3=81=9D=E3=82=8C?=
 =?UTF-8?q?=E3=82=92`VoiceModelId`=E3=81=A8=E3=81=99=E3=82=8B=20(#796)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* change: VVMにUUIDを割り振り、それを`VoiceModelId`とする

* 不要となったコメントを削除

* UUIDを分解する部分を修正し、テストも追加

以下のためuuidもアップデートする。
<https://github.com/uuid-rs/uuid/issues/741>
---
 Cargo.lock                                    | 17 ++----
 Cargo.toml                                    |  3 +-
 crates/voicevox_core/Cargo.toml               |  1 -
 .../voicevox_core/src/__internal/interop.rs   |  5 +-
 crates/voicevox_core/src/manifest.rs          |  5 +-
 crates/voicevox_core/src/status.rs            | 35 +++++------
 crates/voicevox_core/src/synthesizer.rs       | 14 ++---
 crates/voicevox_core/src/voice_model.rs       | 43 +++++++-------
 crates/voicevox_core_c_api/Cargo.toml         |  1 +
 .../include/voicevox_core.h                   |  6 +-
 crates/voicevox_core_c_api/src/c_impls.rs     |  8 ++-
 .../src/compatible_engine.rs                  |  7 +--
 crates/voicevox_core_c_api/src/helpers.rs     | 11 +++-
 crates/voicevox_core_c_api/src/lib.rs         | 41 +++++--------
 crates/voicevox_core_java_api/Cargo.toml      |  3 +
 .../hiroshiba/voicevoxcore/Synthesizer.java   |  9 +--
 .../jp/hiroshiba/voicevoxcore/VoiceModel.java |  5 +-
 crates/voicevox_core_java_api/src/common.rs   | 55 +++++++++++++++++-
 .../voicevox_core_java_api/src/synthesizer.rs | 14 ++---
 .../voicevox_core_java_api/src/voice_model.rs |  6 +-
 .../python/voicevox_core/_models.py           |  5 +-
 .../python/voicevox_core/_rust/asyncio.pyi    |  4 +-
 .../python/voicevox_core/_rust/blocking.pyi   |  4 +-
 .../voicevox_core_python_api/src/convert.rs   |  1 +
 crates/voicevox_core_python_api/src/lib.rs    | 58 ++++++++++---------
 model/sample.vvm/manifest.json                |  1 +
 26 files changed, 209 insertions(+), 153 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index 0f9a78469..d3846b8a0 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -1822,15 +1822,6 @@ dependencies = [
  "windows-sys 0.42.0",
 ]
 
-[[package]]
-name = "nanoid"
-version = "0.4.0"
-source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "3ffa00dec017b5b1a8b7cf5e2c008bfda1aa7e0697ac1508b491fdf2622fb4d8"
-dependencies = [
- "rand",
-]
-
 [[package]]
 name = "ndarray"
 version = "0.15.6"
@@ -3521,9 +3512,9 @@ checksum = "711b9620af191e0cdc7468a8d14e709c3dcdb115b36f838e601583af800a370a"
 
 [[package]]
 name = "uuid"
-version = "1.4.0"
+version = "1.8.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "d023da39d1fde5a8a3fe1f3e01ca9632ada0a63e9797de55a879d6e2236277be"
+checksum = "a183cf7feeba97b4dd1c0d46788634f6221d87fa961b305bed08c851829efcc0"
 dependencies = [
  "getrandom",
  "serde",
@@ -3587,7 +3578,6 @@ dependencies = [
  "indexmap 2.0.0",
  "itertools 0.10.5",
  "jlabel",
- "nanoid",
  "ndarray",
  "once_cell",
  "open_jtalk",
@@ -3662,8 +3652,11 @@ dependencies = [
  "android_logger",
  "chrono",
  "derive_more",
+ "easy-ext",
  "jni",
  "once_cell",
+ "pretty_assertions",
+ "rstest",
  "serde_json",
  "tracing",
  "tracing-subscriber",
diff --git a/Cargo.toml b/Cargo.toml
index 7102127d5..4ea3d3757 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -47,7 +47,6 @@ libc = "0.2.134"
 libloading = "0.7.3"
 libtest-mimic = "0.6.0"
 log = "0.4.17"
-nanoid = "0.4.0"
 ndarray = "0.15.6"
 ndarray-stats = "0.5.1"
 octocrab = { version = "0.19.0", default-features = false }
@@ -81,7 +80,7 @@ tracing = "0.1.37"
 tracing-subscriber = "0.3.16"
 typetag = "0.2.5"
 url = "2.3.0"
-uuid = "1.4.0"
+uuid = "1.6.1"
 voicevox_core = { path = "crates/voicevox_core" }
 windows = "0.43.0"
 zip = "0.6.3"
diff --git a/crates/voicevox_core/Cargo.toml b/crates/voicevox_core/Cargo.toml
index 731862356..9957c1373 100644
--- a/crates/voicevox_core/Cargo.toml
+++ b/crates/voicevox_core/Cargo.toml
@@ -25,7 +25,6 @@ futures.workspace = true
 indexmap = { workspace = true, features = ["serde"] }
 itertools.workspace = true
 jlabel.workspace = true
-nanoid.workspace = true
 ndarray.workspace = true
 once_cell.workspace = true
 open_jtalk.workspace = true
diff --git a/crates/voicevox_core/src/__internal/interop.rs b/crates/voicevox_core/src/__internal/interop.rs
index fe46d10bc..677f5515a 100644
--- a/crates/voicevox_core/src/__internal/interop.rs
+++ b/crates/voicevox_core/src/__internal/interop.rs
@@ -1 +1,4 @@
-pub use crate::{metas::merge as merge_metas, synthesizer::blocking::PerformInference};
+pub use crate::{
+    metas::merge as merge_metas, synthesizer::blocking::PerformInference,
+    voice_model::blocking::IdRef,
+};
diff --git a/crates/voicevox_core/src/manifest.rs b/crates/voicevox_core/src/manifest.rs
index a22b66e8b..8464a48ab 100644
--- a/crates/voicevox_core/src/manifest.rs
+++ b/crates/voicevox_core/src/manifest.rs
@@ -6,7 +6,7 @@ use derive_new::new;
 use serde::{Deserialize, Serialize};
 use serde_with::{serde_as, DisplayFromStr};
 
-use crate::StyleId;
+use crate::{StyleId, VoiceModelId};
 
 pub type RawManifestVersion = String;
 #[derive(Deserialize, Clone, Debug, PartialEq, new)]
@@ -38,10 +38,9 @@ impl Display for InnerVoiceId {
 
 #[derive(Deserialize, Getters, Clone)]
 pub struct Manifest {
-    // FIXME: UUIDにする
-    // https://github.com/VOICEVOX/voicevox_core/issues/581
     #[allow(dead_code)]
     manifest_version: ManifestVersion,
+    pub(crate) id: VoiceModelId,
     metas_filename: String,
     #[serde(flatten)]
     domains: ManifestDomains,
diff --git a/crates/voicevox_core/src/status.rs b/crates/voicevox_core/src/status.rs
index 6980ab7fc..f590e18f4 100644
--- a/crates/voicevox_core/src/status.rs
+++ b/crates/voicevox_core/src/status.rs
@@ -58,7 +58,7 @@ impl<R: InferenceRuntime> Status<R> {
         Ok(())
     }
 
-    pub(crate) fn unload_model(&self, voice_model_id: &VoiceModelId) -> Result<()> {
+    pub(crate) fn unload_model(&self, voice_model_id: VoiceModelId) -> Result<()> {
         self.loaded_models.lock().unwrap().remove(voice_model_id)
     }
 
@@ -77,7 +77,7 @@ impl<R: InferenceRuntime> Status<R> {
         self.loaded_models.lock().unwrap().ids_for::<D>(style_id)
     }
 
-    pub(crate) fn is_loaded_model(&self, voice_model_id: &VoiceModelId) -> bool {
+    pub(crate) fn is_loaded_model(&self, voice_model_id: VoiceModelId) -> bool {
         self.loaded_models
             .lock()
             .unwrap()
@@ -101,7 +101,7 @@ impl<R: InferenceRuntime> Status<R> {
     /// `self`が`model_id`を含んでいないとき、パニックする。
     pub(crate) fn run_session<I>(
         &self,
-        model_id: &VoiceModelId,
+        model_id: VoiceModelId,
         input: I,
     ) -> Result<<I::Signature as InferenceSignature>::Output>
     where
@@ -159,7 +159,7 @@ impl<R: InferenceRuntime> LoadedModels<R> {
             .and_then(|(inner_voice_ids, _)| inner_voice_ids.get(&style_id).copied())
             .unwrap_or_else(|| InnerVoiceId::new(style_id.raw_id()));
 
-        Ok((model_id.clone(), inner_voice_id))
+        Ok((*model_id, inner_voice_id))
     }
 
     /// # Panics
@@ -168,12 +168,12 @@ impl<R: InferenceRuntime> LoadedModels<R> {
     ///
     /// - `self`が`model_id`を含んでいないとき
     /// - 対応する`InferenceDomain`が欠けているとき
-    fn get<I>(&self, model_id: &VoiceModelId) -> InferenceSessionCell<R, I>
+    fn get<I>(&self, model_id: VoiceModelId) -> InferenceSessionCell<R, I>
     where
         I: InferenceInputSignature,
         <I::Signature as InferenceSignature>::Domain: InferenceDomainExt,
     {
-        let (_, session_set) = self.0[model_id]
+        let (_, session_set) = self.0[&model_id]
             .session_sets_with_inner_ids
             .get::<<I::Signature as InferenceSignature>::Domain>()
             .as_ref()
@@ -190,8 +190,8 @@ impl<R: InferenceRuntime> LoadedModels<R> {
         session_set.get()
     }
 
-    fn contains_voice_model(&self, model_id: &VoiceModelId) -> bool {
-        self.0.contains_key(model_id)
+    fn contains_voice_model(&self, model_id: VoiceModelId) -> bool {
+        self.0.contains_key(&model_id)
     }
 
     fn contains_style(&self, style_id: StyleId) -> bool {
@@ -216,9 +216,9 @@ impl<R: InferenceRuntime> LoadedModels<R> {
             source: None,
         };
 
-        if self.0.contains_key(&model_header.id) {
+        if self.0.contains_key(&model_header.manifest.id) {
             return Err(error(LoadModelErrorKind::ModelAlreadyLoaded {
-                id: model_header.id.clone(),
+                id: model_header.manifest.id,
             }));
         }
 
@@ -255,7 +255,7 @@ impl<R: InferenceRuntime> LoadedModels<R> {
         self.ensure_acceptable(model_header)?;
 
         let prev = self.0.insert(
-            model_header.id.clone(),
+            model_header.manifest.id,
             LoadedModel {
                 metas: model_header.metas.clone(),
                 session_sets_with_inner_ids,
@@ -265,12 +265,9 @@ impl<R: InferenceRuntime> LoadedModels<R> {
         Ok(())
     }
 
-    fn remove(&mut self, model_id: &VoiceModelId) -> Result<()> {
-        if self.0.remove(model_id).is_none() {
-            return Err(ErrorRepr::ModelNotFound {
-                model_id: model_id.clone(),
-            }
-            .into());
+    fn remove(&mut self, model_id: VoiceModelId) -> Result<()> {
+        if self.0.remove(&model_id).is_none() {
+            return Err(ErrorRepr::ModelNotFound { model_id }.into());
         }
         Ok(())
     }
@@ -415,13 +412,13 @@ mod tests {
         let model_header = vvm.header();
         let model_contents = &vvm.read_inference_models().await.unwrap();
         assert!(
-            !status.is_loaded_model(&model_header.id),
+            !status.is_loaded_model(model_header.manifest.id),
             "model should  not be loaded"
         );
         let result = status.insert_model(model_header, model_contents);
         assert_debug_fmt_eq!(Ok(()), result);
         assert!(
-            status.is_loaded_model(&model_header.id),
+            status.is_loaded_model(model_header.manifest.id),
             "model should be loaded",
         );
     }
diff --git a/crates/voicevox_core/src/synthesizer.rs b/crates/voicevox_core/src/synthesizer.rs
index 06555ea28..4b26eb56b 100644
--- a/crates/voicevox_core/src/synthesizer.rs
+++ b/crates/voicevox_core/src/synthesizer.rs
@@ -207,12 +207,12 @@ pub(crate) mod blocking {
         }
 
         /// 音声モデルの読み込みを解除する。
-        pub fn unload_voice_model(&self, voice_model_id: &VoiceModelId) -> Result<()> {
+        pub fn unload_voice_model(&self, voice_model_id: VoiceModelId) -> Result<()> {
             self.status.unload_model(voice_model_id)
         }
 
         /// 指定したIDの音声モデルが読み込まれているか判定する。
-        pub fn is_loaded_voice_model(&self, voice_model_id: &VoiceModelId) -> bool {
+        pub fn is_loaded_voice_model(&self, voice_model_id: VoiceModelId) -> bool {
             self.status.is_loaded_model(voice_model_id)
         }
 
@@ -841,7 +841,7 @@ pub(crate) mod blocking {
             let PredictDurationOutput {
                 phoneme_length: output,
             } = self.status.run_session(
-                &model_id,
+                model_id,
                 PredictDurationInput {
                     phoneme_list: ndarray::arr1(phoneme_vector),
                     speaker_id: ndarray::arr1(&[inner_voice_id.raw_id().into()]),
@@ -874,7 +874,7 @@ pub(crate) mod blocking {
             let (model_id, inner_voice_id) = self.status.ids_for::<TalkDomain>(style_id)?;
 
             let PredictIntonationOutput { f0_list: output } = self.status.run_session(
-                &model_id,
+                model_id,
                 PredictIntonationInput {
                     length: ndarray::arr0(length as i64),
                     vowel_phoneme_list: ndarray::arr1(vowel_phoneme_vector),
@@ -917,7 +917,7 @@ pub(crate) mod blocking {
             );
 
             let DecodeOutput { wave: output } = self.status.run_session(
-                &model_id,
+                model_id,
                 DecodeInput {
                     f0: ndarray::arr1(&f0_with_padding)
                         .into_shape([length_with_padding, 1])
@@ -1150,11 +1150,11 @@ pub(crate) mod tokio {
             self.0.status.insert_model(model.header(), model_bytes)
         }
 
-        pub fn unload_voice_model(&self, voice_model_id: &VoiceModelId) -> Result<()> {
+        pub fn unload_voice_model(&self, voice_model_id: VoiceModelId) -> Result<()> {
             self.0.unload_voice_model(voice_model_id)
         }
 
-        pub fn is_loaded_voice_model(&self, voice_model_id: &VoiceModelId) -> bool {
+        pub fn is_loaded_voice_model(&self, voice_model_id: VoiceModelId) -> bool {
             self.0.is_loaded_voice_model(voice_model_id)
         }
 
diff --git a/crates/voicevox_core/src/voice_model.rs b/crates/voicevox_core/src/voice_model.rs
index 358d0153c..f5e862854 100644
--- a/crates/voicevox_core/src/voice_model.rs
+++ b/crates/voicevox_core/src/voice_model.rs
@@ -4,11 +4,13 @@
 
 use anyhow::anyhow;
 use derive_getters::Getters;
+use derive_more::From;
 use derive_new::new;
 use easy_ext::ext;
 use enum_map::EnumMap;
 use itertools::Itertools as _;
 use serde::Deserialize;
+use uuid::Uuid;
 
 use crate::{
     error::{LoadModelError, LoadModelErrorKind, LoadModelResult},
@@ -24,7 +26,7 @@ use std::path::{Path, PathBuf};
 /// [`VoiceModelId`]の実体。
 ///
 /// [`VoiceModelId`]: VoiceModelId
-pub type RawVoiceModelId = String;
+pub type RawVoiceModelId = Uuid;
 
 pub(crate) type ModelBytesWithInnerVoiceIdsByDomain =
     (Option<(StyleIdToInnerVoiceId, EnumMap<TalkOperation, Vec<u8>>)>,);
@@ -34,6 +36,7 @@ pub(crate) type ModelBytesWithInnerVoiceIdsByDomain =
     PartialEq,
     Eq,
     Clone,
+    Copy,
     Ord,
     Hash,
     PartialOrd,
@@ -42,7 +45,9 @@ pub(crate) type ModelBytesWithInnerVoiceIdsByDomain =
     Getters,
     derive_more::Display,
     Debug,
+    From,
 )]
+#[serde(transparent)]
 pub struct VoiceModelId {
     raw_voice_model_id: RawVoiceModelId,
 }
@@ -53,9 +58,7 @@ pub struct VoiceModelId {
 /// モデルの`[u8]`と分けて`Status`に渡す。
 #[derive(Clone)]
 pub(crate) struct VoiceModelHeader {
-    /// ID。
-    pub(crate) id: VoiceModelId,
-    manifest: Manifest,
+    pub(crate) manifest: Manifest,
     /// メタ情報。
     ///
     /// `manifest`が対応していない`StyleType`のスタイルは含まれるべきではない。
@@ -64,12 +67,7 @@ pub(crate) struct VoiceModelHeader {
 }
 
 impl VoiceModelHeader {
-    fn new(
-        id: VoiceModelId,
-        manifest: Manifest,
-        metas: &[u8],
-        path: &Path,
-    ) -> LoadModelResult<Self> {
+    fn new(manifest: Manifest, metas: &[u8], path: &Path) -> LoadModelResult<Self> {
         let metas =
             serde_json::from_slice::<VoiceModelMeta>(metas).map_err(|source| LoadModelError {
                 path: path.to_owned(),
@@ -94,7 +92,6 @@ impl VoiceModelHeader {
             })?;
 
         Ok(Self {
-            id,
             manifest,
             metas,
             path: path.to_owned(),
@@ -151,8 +148,8 @@ pub(crate) mod blocking {
         path::Path,
     };
 
+    use easy_ext::ext;
     use enum_map::EnumMap;
-    use nanoid::nanoid;
     use ouroboros::self_referencing;
     use rayon::iter::{IntoParallelIterator as _, ParallelIterator as _};
     use serde::de::DeserializeOwned;
@@ -220,14 +217,13 @@ pub(crate) mod blocking {
             let reader = BlockingVvmEntryReader::open(path)?;
             let manifest = reader.read_vvm_json::<Manifest>("manifest.json")?;
             let metas = &reader.read_vvm_entry(manifest.metas_filename())?;
-            let id = VoiceModelId::new(nanoid!());
-            let header = VoiceModelHeader::new(id, manifest, metas, path)?;
+            let header = VoiceModelHeader::new(manifest, metas, path)?;
             Ok(Self { header })
         }
 
         /// ID。
-        pub fn id(&self) -> &VoiceModelId {
-            &self.header.id
+        pub fn id(&self) -> VoiceModelId {
+            self.header.manifest.id
         }
 
         /// メタ情報。
@@ -289,6 +285,13 @@ pub(crate) mod blocking {
             })
         }
     }
+
+    #[ext(IdRef)]
+    pub impl VoiceModel {
+        fn id_ref(&self) -> &VoiceModelId {
+            &self.header.manifest.id
+        }
+    }
 }
 
 pub(crate) mod tokio {
@@ -297,7 +300,6 @@ pub(crate) mod tokio {
     use derive_new::new;
     use enum_map::EnumMap;
     use futures::future::{join3, OptionFuture};
-    use nanoid::nanoid;
     use serde::de::DeserializeOwned;
 
     use crate::{
@@ -360,14 +362,13 @@ pub(crate) mod tokio {
             let reader = AsyncVvmEntryReader::open(path.as_ref()).await?;
             let manifest = reader.read_vvm_json::<Manifest>("manifest.json").await?;
             let metas = &reader.read_vvm_entry(manifest.metas_filename()).await?;
-            let id = VoiceModelId::new(nanoid!());
-            let header = VoiceModelHeader::new(id, manifest, metas, path.as_ref())?;
+            let header = VoiceModelHeader::new(manifest, metas, path.as_ref())?;
             Ok(Self { header })
         }
 
         /// ID。
-        pub fn id(&self) -> &VoiceModelId {
-            &self.header.id
+        pub fn id(&self) -> VoiceModelId {
+            self.header.manifest.id
         }
 
         /// メタ情報。
diff --git a/crates/voicevox_core_c_api/Cargo.toml b/crates/voicevox_core_c_api/Cargo.toml
index ad3a65fa7..f10e2a6f4 100644
--- a/crates/voicevox_core_c_api/Cargo.toml
+++ b/crates/voicevox_core_c_api/Cargo.toml
@@ -24,6 +24,7 @@ chrono = { workspace = true, default-features = false, features = ["clock"] }
 colorchoice.workspace = true
 cstr.workspace = true
 derive-getters.workspace = true
+easy-ext.workspace = true
 futures.workspace = true
 itertools.workspace = true
 libc.workspace = true
diff --git a/crates/voicevox_core_c_api/include/voicevox_core.h b/crates/voicevox_core_c_api/include/voicevox_core.h
index 592ec8abb..da921c869 100644
--- a/crates/voicevox_core_c_api/include/voicevox_core.h
+++ b/crates/voicevox_core_c_api/include/voicevox_core.h
@@ -277,7 +277,7 @@ typedef struct VoicevoxInitializeOptions {
 /**
  * 音声モデルID。
  */
-typedef const char *VoicevoxVoiceModelId;
+typedef const uint8_t (*VoicevoxVoiceModelId)[16];
 
 /**
  * スタイルID。
@@ -554,7 +554,7 @@ VoicevoxResultCode voicevox_synthesizer_load_voice_model(const struct VoicevoxSy
  *
  * \safety{
  * - `synthesizer`は ::voicevox_synthesizer_new で得たものでなければならず、また ::voicevox_synthesizer_delete で解放されていてはいけない。
- * - `model_id`はヌル終端文字列を指し、かつ<a href="#voicevox-core-safety">読み込みについて有効</a>でなければならない。
+ * - `model_id`は<a href="#voicevox-core-safety">読み込みについて有効</a>でなければならない。
  * }
  */
 #ifdef _WIN32
@@ -589,7 +589,7 @@ bool voicevox_synthesizer_is_gpu_mode(const struct VoicevoxSynthesizer *synthesi
  *
  * \safety{
  * - `synthesizer`は ::voicevox_synthesizer_new で得たものでなければならず、また ::voicevox_synthesizer_delete で解放されていてはいけない。
- * - `model_id`はヌル終端文字列を指し、かつ<a href="#voicevox-core-safety">読み込みについて有効</a>でなければならない。
+ * - `model_id`は<a href="#voicevox-core-safety">読み込みについて有効</a>でなければならない。
  * }
  */
 #ifdef _WIN32
diff --git a/crates/voicevox_core_c_api/src/c_impls.rs b/crates/voicevox_core_c_api/src/c_impls.rs
index 4e73bf0fb..fe4afcf65 100644
--- a/crates/voicevox_core_c_api/src/c_impls.rs
+++ b/crates/voicevox_core_c_api/src/c_impls.rs
@@ -5,6 +5,9 @@ use voicevox_core::{InitializeOptions, Result, VoiceModelId};
 
 use crate::{helpers::CApiResult, OpenJtalkRc, VoicevoxSynthesizer, VoicevoxVoiceModel};
 
+// FIXME: 中身(Rust API)を直接操作するかラッパーメソッド越しにするのかが混在していて、一貫性を
+// 欠いている
+
 impl OpenJtalkRc {
     pub(crate) fn new(open_jtalk_dic_dir: impl AsRef<Utf8Path>) -> Result<Self> {
         Ok(Self {
@@ -28,7 +31,7 @@ impl VoicevoxSynthesizer {
         Ok(())
     }
 
-    pub(crate) fn unload_voice_model(&self, model_id: &VoiceModelId) -> Result<()> {
+    pub(crate) fn unload_voice_model(&self, model_id: VoiceModelId) -> Result<()> {
         self.synthesizer.unload_voice_model(model_id)?;
         Ok(())
     }
@@ -42,8 +45,7 @@ impl VoicevoxSynthesizer {
 impl VoicevoxVoiceModel {
     pub(crate) fn from_path(path: impl AsRef<Path>) -> Result<Self> {
         let model = voicevox_core::blocking::VoiceModel::from_path(path)?;
-        let id = CString::new(model.id().raw_voice_model_id().as_str()).unwrap();
         let metas = CString::new(serde_json::to_string(model.metas()).unwrap()).unwrap();
-        Ok(Self { model, id, metas })
+        Ok(Self { model, metas })
     }
 }
diff --git a/crates/voicevox_core_c_api/src/compatible_engine.rs b/crates/voicevox_core_c_api/src/compatible_engine.rs
index 6755910f5..ae4d21a93 100644
--- a/crates/voicevox_core_c_api/src/compatible_engine.rs
+++ b/crates/voicevox_core_c_api/src/compatible_engine.rs
@@ -37,10 +37,7 @@ struct VoiceModelSet {
 
 static VOICE_MODEL_SET: Lazy<VoiceModelSet> = Lazy::new(|| {
     let all_vvms = get_all_models();
-    let model_map: BTreeMap<_, _> = all_vvms
-        .iter()
-        .map(|vvm| (vvm.id().clone(), vvm.clone()))
-        .collect();
+    let model_map: BTreeMap<_, _> = all_vvms.iter().map(|vvm| (vvm.id(), vvm.clone())).collect();
     let metas = voicevox_core::__internal::interop::merge_metas(
         all_vvms.iter().flat_map(|vvm| vvm.metas()),
     );
@@ -48,7 +45,7 @@ static VOICE_MODEL_SET: Lazy<VoiceModelSet> = Lazy::new(|| {
     for vvm in all_vvms.iter() {
         for meta in vvm.metas().iter() {
             for style in meta.styles().iter() {
-                style_model_map.insert(*style.id(), vvm.id().clone());
+                style_model_map.insert(*style.id(), vvm.id());
             }
         }
     }
diff --git a/crates/voicevox_core_c_api/src/helpers.rs b/crates/voicevox_core_c_api/src/helpers.rs
index 1c163a0d0..ac0cab286 100644
--- a/crates/voicevox_core_c_api/src/helpers.rs
+++ b/crates/voicevox_core_c_api/src/helpers.rs
@@ -1,5 +1,7 @@
+use easy_ext::ext;
 use std::{error::Error as _, ffi::CStr, fmt::Debug, iter};
-use voicevox_core::{AudioQueryModel, UserDictWord};
+use uuid::Uuid;
+use voicevox_core::{AudioQueryModel, UserDictWord, VoiceModelId};
 
 use thiserror::Error;
 use tracing::error;
@@ -163,6 +165,13 @@ impl Default for VoicevoxSynthesisOptions {
     }
 }
 
+#[ext(UuidBytesExt)]
+pub(crate) impl uuid::Bytes {
+    fn to_model_id(self) -> VoiceModelId {
+        Uuid::from_bytes(self).into()
+    }
+}
+
 impl VoicevoxUserDictWord {
     pub(crate) unsafe fn try_into_word(&self) -> CApiResult<voicevox_core::UserDictWord> {
         Ok(UserDictWord::new(
diff --git a/crates/voicevox_core_c_api/src/lib.rs b/crates/voicevox_core_c_api/src/lib.rs
index fbb0bf6bf..08a54b11a 100644
--- a/crates/voicevox_core_c_api/src/lib.rs
+++ b/crates/voicevox_core_c_api/src/lib.rs
@@ -12,7 +12,7 @@ mod slice_owner;
 use self::drop_check::C_STRING_DROP_CHECKER;
 use self::helpers::{
     accent_phrases_to_json, audio_query_model_to_json, ensure_utf8, into_result_code_with_error,
-    CApiError,
+    CApiError, UuidBytesExt as _,
 };
 use self::result_code::VoicevoxResultCode;
 use self::slice_owner::U8_SLICE_OWNER;
@@ -30,7 +30,8 @@ use std::sync::{Arc, Once};
 use tracing_subscriber::fmt::format::Writer;
 use tracing_subscriber::EnvFilter;
 use uuid::Uuid;
-use voicevox_core::{AccentPhraseModel, AudioQueryModel, TtsOptions, UserDictWord, VoiceModelId};
+use voicevox_core::__internal::interop::IdRef as _;
+use voicevox_core::{AccentPhraseModel, AudioQueryModel, TtsOptions, UserDictWord};
 use voicevox_core::{StyleId, SupportedDevices, SynthesisOptions};
 
 fn init_logger_once() {
@@ -238,12 +239,11 @@ pub extern "C" fn voicevox_get_version() -> *const c_char {
 #[derive(Getters)]
 pub struct VoicevoxVoiceModel {
     model: voicevox_core::blocking::VoiceModel,
-    id: CString,
     metas: CString,
 }
 
 /// 音声モデルID。
-pub type VoicevoxVoiceModelId = *const c_char;
+pub type VoicevoxVoiceModelId<'a> = &'a [u8; 16];
 
 /// スタイルID。
 ///
@@ -285,9 +285,9 @@ pub unsafe extern "C" fn voicevox_voice_model_new_from_path(
 /// - `model`は ::voicevox_voice_model_new_from_path で得たものでなければならず、また ::voicevox_voice_model_delete で解放されていてはいけない。
 /// }
 #[no_mangle]
-pub extern "C" fn voicevox_voice_model_id(model: &VoicevoxVoiceModel) -> VoicevoxVoiceModelId {
+pub extern "C" fn voicevox_voice_model_id(model: &VoicevoxVoiceModel) -> VoicevoxVoiceModelId<'_> {
     init_logger_once();
-    model.id().as_ptr()
+    model.model.id_ref().raw_voice_model_id().as_bytes()
 }
 
 /// ::VoicevoxVoiceModel からメタ情報を取得する。
@@ -399,20 +399,16 @@ pub extern "C" fn voicevox_synthesizer_load_voice_model(
 ///
 /// \safety{
 /// - `synthesizer`は ::voicevox_synthesizer_new で得たものでなければならず、また ::voicevox_synthesizer_delete で解放されていてはいけない。
-/// - `model_id`はヌル終端文字列を指し、かつ<a href="#voicevox-core-safety">読み込みについて有効</a>でなければならない。
+/// - `model_id`は<a href="#voicevox-core-safety">読み込みについて有効</a>でなければならない。
 /// }
 #[no_mangle]
-pub unsafe extern "C" fn voicevox_synthesizer_unload_voice_model(
+pub extern "C" fn voicevox_synthesizer_unload_voice_model(
     synthesizer: &VoicevoxSynthesizer,
-    model_id: VoicevoxVoiceModelId,
+    model_id: VoicevoxVoiceModelId<'_>,
 ) -> VoicevoxResultCode {
     init_logger_once();
-    into_result_code_with_error((|| {
-        let raw_model_id = ensure_utf8(unsafe { CStr::from_ptr(model_id) })?;
-        synthesizer
-            .unload_voice_model(&VoiceModelId::new(raw_model_id.to_string()))
-            .map_err(Into::into)
-    })())
+    let model_id = model_id.to_model_id();
+    into_result_code_with_error(synthesizer.unload_voice_model(model_id).map_err(Into::into))
 }
 
 /// ハードウェアアクセラレーションがGPUモードか判定する。
@@ -439,21 +435,16 @@ pub extern "C" fn voicevox_synthesizer_is_gpu_mode(synthesizer: &VoicevoxSynthes
 ///
 /// \safety{
 /// - `synthesizer`は ::voicevox_synthesizer_new で得たものでなければならず、また ::voicevox_synthesizer_delete で解放されていてはいけない。
-/// - `model_id`はヌル終端文字列を指し、かつ<a href="#voicevox-core-safety">読み込みについて有効</a>でなければならない。
+/// - `model_id`は<a href="#voicevox-core-safety">読み込みについて有効</a>でなければならない。
 /// }
 #[no_mangle]
-pub unsafe extern "C" fn voicevox_synthesizer_is_loaded_voice_model(
+pub extern "C" fn voicevox_synthesizer_is_loaded_voice_model(
     synthesizer: &VoicevoxSynthesizer,
-    model_id: VoicevoxVoiceModelId,
+    model_id: VoicevoxVoiceModelId<'_>,
 ) -> bool {
     init_logger_once();
-    let Ok(raw_model_id) = ensure_utf8(unsafe { CStr::from_ptr(model_id) }) else {
-        // 与えられたIDがUTF-8ではない場合、それに対応する`VoicdModel`は確実に存在しない
-        return false;
-    };
-    synthesizer
-        .synthesizer()
-        .is_loaded_voice_model(&VoiceModelId::new(raw_model_id.into()))
+    let model_id = model_id.to_model_id();
+    synthesizer.synthesizer().is_loaded_voice_model(model_id)
 }
 
 /// 今読み込んでいる音声モデルのメタ情報を、JSONで取得する。
diff --git a/crates/voicevox_core_java_api/Cargo.toml b/crates/voicevox_core_java_api/Cargo.toml
index 06b2af618..b39a98b2a 100644
--- a/crates/voicevox_core_java_api/Cargo.toml
+++ b/crates/voicevox_core_java_api/Cargo.toml
@@ -15,8 +15,11 @@ directml = ["voicevox_core/directml"]
 android_logger.workspace = true
 chrono = { workspace = true, default-features = false, features = ["clock"] }
 derive_more.workspace = true
+easy-ext.workspace = true
 jni.workspace = true
 once_cell.workspace = true
+pretty_assertions = "1.3.0"
+rstest.workspace = true
 serde_json = { workspace = true, features = ["preserve_order"] }
 tracing = { workspace = true, features = ["log"] }
 tracing-subscriber = { workspace = true, features = ["env-filter"] }
diff --git a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/Synthesizer.java b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/Synthesizer.java
index a3fe0de6c..6ec6d9108 100644
--- a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/Synthesizer.java
+++ b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/Synthesizer.java
@@ -5,6 +5,7 @@
 import java.util.ArrayList;
 import java.util.Arrays;
 import java.util.List;
+import java.util.UUID;
 import jp.hiroshiba.voicevoxcore.exceptions.InferenceFailedException;
 import jp.hiroshiba.voicevoxcore.exceptions.InvalidModelDataException;
 
@@ -65,7 +66,7 @@ public void loadVoiceModel(VoiceModel voiceModel) throws InvalidModelDataExcepti
    *
    * @param voiceModelId 読み込みを解除する音声モデルのID。
    */
-  public void unloadVoiceModel(String voiceModelId) {
+  public void unloadVoiceModel(UUID voiceModelId) {
     rsUnloadVoiceModel(voiceModelId);
   }
 
@@ -75,7 +76,7 @@ public void unloadVoiceModel(String voiceModelId) {
    * @param voiceModelId 音声モデルのID。
    * @return 指定した音声モデルのIDが読み込まれているかどうか。
    */
-  public boolean isLoadedVoiceModel(String voiceModelId) {
+  public boolean isLoadedVoiceModel(UUID voiceModelId) {
     return rsIsLoadedVoiceModel(voiceModelId);
   }
 
@@ -274,9 +275,9 @@ public TtsConfigurator tts(String text, int styleId) {
 
   private native void rsLoadVoiceModel(VoiceModel voiceModel) throws InvalidModelDataException;
 
-  private native void rsUnloadVoiceModel(String voiceModelId);
+  private native void rsUnloadVoiceModel(UUID voiceModelId);
 
-  private native boolean rsIsLoadedVoiceModel(String voiceModelId);
+  private native boolean rsIsLoadedVoiceModel(UUID voiceModelId);
 
   @Nonnull
   private native String rsAudioQueryFromKana(String kana, int styleId)
diff --git a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/VoiceModel.java b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/VoiceModel.java
index 576629515..d8c002f0f 100644
--- a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/VoiceModel.java
+++ b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/VoiceModel.java
@@ -5,13 +5,14 @@
 import com.google.gson.annotations.SerializedName;
 import jakarta.annotation.Nonnull;
 import jakarta.annotation.Nullable;
+import java.util.UUID;
 
 /** 音声モデル。 */
 public class VoiceModel extends Dll {
   private long handle;
 
   /** ID。 */
-  @Nonnull public final String id;
+  @Nonnull public final UUID id;
 
   /** メタ情報。 */
   @Nonnull public final SpeakerMeta[] metas;
@@ -36,7 +37,7 @@ protected void finalize() throws Throwable {
   private native void rsFromPath(String modelPath);
 
   @Nonnull
-  private native String rsGetId();
+  private native UUID rsGetId();
 
   @Nonnull
   private native String rsGetMetasJson();
diff --git a/crates/voicevox_core_java_api/src/common.rs b/crates/voicevox_core_java_api/src/common.rs
index bdb37f4ff..6e13cee89 100644
--- a/crates/voicevox_core_java_api/src/common.rs
+++ b/crates/voicevox_core_java_api/src/common.rs
@@ -1,7 +1,12 @@
 use std::{error::Error as _, iter};
 
 use derive_more::From;
-use jni::{objects::JThrowable, JNIEnv};
+use easy_ext::ext;
+use jni::{
+    objects::{JObject, JThrowable},
+    JNIEnv,
+};
+use uuid::Uuid;
 
 #[macro_export]
 macro_rules! object {
@@ -168,3 +173,51 @@ pub(crate) enum JavaApiError {
 
     DeJson(serde_json::Error),
 }
+
+#[ext(JNIEnvExt)]
+pub(crate) impl JNIEnv<'_> {
+    fn new_uuid(&mut self, uuid: Uuid) -> jni::errors::Result<JObject<'_>> {
+        let (msbs, lsbs) = split_uuid(uuid);
+        self.new_object("java/util/UUID", "(JJ)V", &[msbs.into(), lsbs.into()])
+    }
+
+    fn get_uuid(&mut self, obj: &JObject<'_>) -> jni::errors::Result<Uuid> {
+        let mut get_bits = |method_name| self.call_method(obj, method_name, "()J", &[])?.j();
+        let msbs = get_bits("getMostSignificantBits")?;
+        let lsbs = get_bits("getLeastSignificantBits")?;
+        Ok(construct_uuid(msbs, lsbs))
+    }
+}
+
+fn split_uuid(uuid: Uuid) -> (i64, i64) {
+    let uuid = uuid.as_u128();
+    let msbs = (uuid >> 64) as _;
+    let lsbs = uuid as _;
+    (msbs, lsbs)
+}
+
+fn construct_uuid(msbs: i64, lsbs: i64) -> Uuid {
+    return Uuid::from_u128((to_u128(msbs) << 64) + to_u128(lsbs));
+
+    fn to_u128(bits: i64) -> u128 {
+        (bits as u64).into()
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use pretty_assertions::assert_eq;
+    use rstest::rstest;
+    use uuid::{uuid, Uuid};
+
+    #[rstest]
+    #[case(uuid!("a1a2a3a4-b1b2-c1c2-d1d2-e1e2e3e4e5e6"))]
+    #[case(uuid!("00000000-0000-0000-0000-000000000000"))]
+    #[case(uuid!("00000000-0000-0000-ffff-ffffffffffff"))]
+    #[case(uuid!("ffffffff-ffff-ffff-0000-000000000000"))]
+    #[case(uuid!("ffffffff-ffff-ffff-ffff-ffffffffffff"))]
+    fn uuid_conversion_works(#[case] uuid: Uuid) {
+        let (msbs, lsbs) = super::split_uuid(uuid);
+        assert_eq!(uuid, super::construct_uuid(msbs, lsbs));
+    }
+}
diff --git a/crates/voicevox_core_java_api/src/synthesizer.rs b/crates/voicevox_core_java_api/src/synthesizer.rs
index fee5bc132..dc5dc971d 100644
--- a/crates/voicevox_core_java_api/src/synthesizer.rs
+++ b/crates/voicevox_core_java_api/src/synthesizer.rs
@@ -1,5 +1,5 @@
 use crate::{
-    common::{throw_if_err, JavaApiError},
+    common::{throw_if_err, JNIEnvExt as _, JavaApiError},
     enum_object, object, object_type,
 };
 
@@ -115,10 +115,10 @@ unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_Synthesizer_rsLoadVoice
 unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_Synthesizer_rsUnloadVoiceModel<'local>(
     env: JNIEnv<'local>,
     this: JObject<'local>,
-    model_id: JString<'local>,
+    model_id: JObject<'local>,
 ) {
     throw_if_err(env, (), |env| {
-        let model_id: String = env.get_string(&model_id)?.into();
+        let model_id = env.get_uuid(&model_id)?.into();
 
         let internal = env
             .get_rust_field::<_, _, Arc<voicevox_core::blocking::Synthesizer<voicevox_core::blocking::OpenJtalk>>>(
@@ -126,7 +126,7 @@ unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_Synthesizer_rsUnloadVoi
             )?
             .clone();
 
-        internal.unload_voice_model(&voicevox_core::VoiceModelId::new(model_id))?;
+        internal.unload_voice_model(model_id)?;
 
         Ok(())
     })
@@ -138,10 +138,10 @@ unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_Synthesizer_rsIsLoadedV
 >(
     env: JNIEnv<'local>,
     this: JObject<'local>,
-    model_id: JString<'local>,
+    model_id: JObject<'local>,
 ) -> jboolean {
     throw_if_err(env, false, |env| {
-        let model_id: String = env.get_string(&model_id)?.into();
+        let model_id = env.get_uuid(&model_id)?.into();
 
         let internal = env
             .get_rust_field::<_, _, Arc<voicevox_core::blocking::Synthesizer<voicevox_core::blocking::OpenJtalk>>>(
@@ -149,7 +149,7 @@ unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_Synthesizer_rsIsLoadedV
             )?
             .clone();
 
-        let is_loaded = internal.is_loaded_voice_model(&voicevox_core::VoiceModelId::new(model_id));
+        let is_loaded = internal.is_loaded_voice_model(model_id);
 
         Ok(is_loaded)
     })
diff --git a/crates/voicevox_core_java_api/src/voice_model.rs b/crates/voicevox_core_java_api/src/voice_model.rs
index 42a20544a..546ab9bf6 100644
--- a/crates/voicevox_core_java_api/src/voice_model.rs
+++ b/crates/voicevox_core_java_api/src/voice_model.rs
@@ -1,6 +1,6 @@
 use std::{borrow::Cow, sync::Arc};
 
-use crate::common::throw_if_err;
+use crate::common::{throw_if_err, JNIEnvExt as _};
 use jni::{
     objects::{JObject, JString},
     sys::jobject,
@@ -35,9 +35,7 @@ unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_VoiceModel_rsGetId<'loc
             .get_rust_field::<_, _, Arc<voicevox_core::blocking::VoiceModel>>(&this, "handle")?
             .clone();
 
-        let id = internal.id().raw_voice_model_id();
-
-        let id = env.new_string(id)?;
+        let id = env.new_uuid(*internal.id().raw_voice_model_id())?;
 
         Ok(id.into_raw())
     })
diff --git a/crates/voicevox_core_python_api/python/voicevox_core/_models.py b/crates/voicevox_core_python_api/python/voicevox_core/_models.py
index 21a2016fe..f7929fae2 100644
--- a/crates/voicevox_core_python_api/python/voicevox_core/_models.py
+++ b/crates/voicevox_core_python_api/python/voicevox_core/_models.py
@@ -1,6 +1,7 @@
 import dataclasses
 from enum import Enum
 from typing import List, NewType, Optional
+from uuid import UUID
 
 import pydantic
 
@@ -24,13 +25,13 @@
 x : str
 """
 
-VoiceModelId = NewType("VoiceModelId", str)
+VoiceModelId = NewType("VoiceModelId", UUID)
 """
 音声モデルID。
 
 Parameters
 ----------
-x : str
+x : UUID
 """
 
 
diff --git a/crates/voicevox_core_python_api/python/voicevox_core/_rust/asyncio.pyi b/crates/voicevox_core_python_api/python/voicevox_core/_rust/asyncio.pyi
index d8e9f6fe2..468d885ee 100644
--- a/crates/voicevox_core_python_api/python/voicevox_core/_rust/asyncio.pyi
+++ b/crates/voicevox_core_python_api/python/voicevox_core/_rust/asyncio.pyi
@@ -109,7 +109,7 @@ class Synthesizer:
             読み込むモデルのスタイルID。
         """
         ...
-    def unload_voice_model(self, voice_model_id: Union[VoiceModelId, str]) -> None:
+    def unload_voice_model(self, voice_model_id: Union[VoiceModelId, UUID]) -> None:
         """
         音声モデルの読み込みを解除する。
 
@@ -119,7 +119,7 @@ class Synthesizer:
             音声モデルID。
         """
         ...
-    def is_loaded_voice_model(self, voice_model_id: Union[VoiceModelId, str]) -> bool:
+    def is_loaded_voice_model(self, voice_model_id: Union[VoiceModelId, UUID]) -> bool:
         """
         指定したvoice_model_idのモデルが読み込まれているか判定する。
 
diff --git a/crates/voicevox_core_python_api/python/voicevox_core/_rust/blocking.pyi b/crates/voicevox_core_python_api/python/voicevox_core/_rust/blocking.pyi
index 5584d68bb..fd09eb8cd 100644
--- a/crates/voicevox_core_python_api/python/voicevox_core/_rust/blocking.pyi
+++ b/crates/voicevox_core_python_api/python/voicevox_core/_rust/blocking.pyi
@@ -104,7 +104,7 @@ class Synthesizer:
             読み込むモデルのスタイルID。
         """
         ...
-    def unload_voice_model(self, voice_model_id: Union[VoiceModelId, str]) -> None:
+    def unload_voice_model(self, voice_model_id: Union[VoiceModelId, UUID]) -> None:
         """
         音声モデルの読み込みを解除する。
 
@@ -114,7 +114,7 @@ class Synthesizer:
             音声モデルID。
         """
         ...
-    def is_loaded_voice_model(self, voice_model_id: Union[VoiceModelId, str]) -> bool:
+    def is_loaded_voice_model(self, voice_model_id: Union[VoiceModelId, UUID]) -> bool:
         """
         指定したvoice_model_idのモデルが読み込まれているか判定する。
 
diff --git a/crates/voicevox_core_python_api/src/convert.rs b/crates/voicevox_core_python_api/src/convert.rs
index 3cee4186b..f40b2d449 100644
--- a/crates/voicevox_core_python_api/src/convert.rs
+++ b/crates/voicevox_core_python_api/src/convert.rs
@@ -149,6 +149,7 @@ pub(crate) fn to_rust_uuid(ob: &PyAny) -> PyResult<Uuid> {
     let uuid = ob.getattr("hex")?.extract::<String>()?;
     uuid.parse::<Uuid>().into_py_value_result()
 }
+// FIXME: the `to_object` call is probably unnecessary?
 pub(crate) fn to_py_uuid(py: Python<'_>, uuid: Uuid) -> PyResult<PyObject> {
     let uuid = uuid.hyphenated().to_string();
     let uuid = py.import("uuid")?.call_method1("UUID", (uuid,))?;
diff --git a/crates/voicevox_core_python_api/src/lib.rs b/crates/voicevox_core_python_api/src/lib.rs
index 492d18f0e..e43fa4476 100644
--- a/crates/voicevox_core_python_api/src/lib.rs
+++ b/crates/voicevox_core_python_api/src/lib.rs
@@ -154,13 +154,13 @@ mod blocking {
     use camino::Utf8PathBuf;
     use pyo3::{
         pyclass, pymethods,
-        types::{IntoPyDict as _, PyBytes, PyDict, PyList, PyString},
+        types::{IntoPyDict as _, PyBytes, PyDict, PyList},
         PyAny, PyObject, PyRef, PyResult, Python,
     };
     use uuid::Uuid;
     use voicevox_core::{
         AccelerationMode, AudioQueryModel, InitializeOptions, StyleId, SynthesisOptions,
-        TtsOptions, UserDictWord, VoiceModelId,
+        TtsOptions, UserDictWord,
     };
 
     use crate::{convert::VoicevoxCoreResultExt as _, Closable};
@@ -180,8 +180,9 @@ mod blocking {
         }
 
         #[getter]
-        fn id(&self) -> &str {
-            self.model.id().raw_voice_model_id()
+        fn id(&self, py: Python<'_>) -> PyResult<PyObject> {
+            let id = *self.model.id().raw_voice_model_id();
+            crate::convert::to_py_uuid(py, id)
         }
 
         #[getter]
@@ -289,23 +290,25 @@ mod blocking {
                 .into_py_result(py)
         }
 
-        fn unload_voice_model(&mut self, voice_model_id: &str, py: Python<'_>) -> PyResult<()> {
+        fn unload_voice_model(
+            &mut self,
+            #[pyo3(from_py_with = "crate::convert::to_rust_uuid")] voice_model_id: Uuid,
+            py: Python<'_>,
+        ) -> PyResult<()> {
             self.synthesizer
                 .get()?
-                .unload_voice_model(&VoiceModelId::new(voice_model_id.to_string()))
+                .unload_voice_model(voice_model_id.into())
                 .into_py_result(py)
         }
 
-        // C APIの挙動と一貫性を持たせる。
-        fn is_loaded_voice_model(&self, voice_model_id: &PyString) -> PyResult<bool> {
-            let Ok(voice_model_id) = voice_model_id.to_str() else {
-                // 与えられたIDがUTF-8ではない場合、それに対応する`VoicdModel`は確実に存在しない
-                return Ok(false);
-            };
+        fn is_loaded_voice_model(
+            &self,
+            #[pyo3(from_py_with = "crate::convert::to_rust_uuid")] voice_model_id: Uuid,
+        ) -> PyResult<bool> {
             Ok(self
                 .synthesizer
                 .get()?
-                .is_loaded_voice_model(&VoiceModelId::new(voice_model_id.to_string())))
+                .is_loaded_voice_model(voice_model_id.into()))
         }
 
         fn audio_query_from_kana<'py>(
@@ -579,13 +582,13 @@ mod asyncio {
     use camino::Utf8PathBuf;
     use pyo3::{
         pyclass, pymethods,
-        types::{IntoPyDict as _, PyBytes, PyDict, PyList, PyString},
+        types::{IntoPyDict as _, PyBytes, PyDict, PyList},
         PyAny, PyObject, PyRef, PyResult, Python, ToPyObject as _,
     };
     use uuid::Uuid;
     use voicevox_core::{
         AccelerationMode, AudioQueryModel, InitializeOptions, StyleId, SynthesisOptions,
-        TtsOptions, UserDictWord, VoiceModelId,
+        TtsOptions, UserDictWord,
     };
 
     use crate::{convert::VoicevoxCoreResultExt as _, Closable};
@@ -608,8 +611,9 @@ mod asyncio {
         }
 
         #[getter]
-        fn id(&self) -> &str {
-            self.model.id().raw_voice_model_id()
+        fn id(&self, py: Python<'_>) -> PyResult<PyObject> {
+            let id = *self.model.id().raw_voice_model_id();
+            crate::convert::to_py_uuid(py, id)
         }
 
         #[getter]
@@ -725,23 +729,25 @@ mod asyncio {
             })
         }
 
-        fn unload_voice_model(&mut self, voice_model_id: &str, py: Python<'_>) -> PyResult<()> {
+        fn unload_voice_model(
+            &mut self,
+            #[pyo3(from_py_with = "crate::convert::to_rust_uuid")] voice_model_id: Uuid,
+            py: Python<'_>,
+        ) -> PyResult<()> {
             self.synthesizer
                 .get()?
-                .unload_voice_model(&VoiceModelId::new(voice_model_id.to_string()))
+                .unload_voice_model(voice_model_id.into())
                 .into_py_result(py)
         }
 
-        // C APIの挙動と一貫性を持たせる。
-        fn is_loaded_voice_model(&self, voice_model_id: &PyString) -> PyResult<bool> {
-            let Ok(voice_model_id) = voice_model_id.to_str() else {
-                // 与えられたIDがUTF-8ではない場合、それに対応する`VoicdModel`は確実に存在しない
-                return Ok(false);
-            };
+        fn is_loaded_voice_model(
+            &self,
+            #[pyo3(from_py_with = "crate::convert::to_rust_uuid")] voice_model_id: Uuid,
+        ) -> PyResult<bool> {
             Ok(self
                 .synthesizer
                 .get()?
-                .is_loaded_voice_model(&VoiceModelId::new(voice_model_id.to_string())))
+                .is_loaded_voice_model(voice_model_id.into()))
         }
 
         fn audio_query_from_kana<'py>(
diff --git a/model/sample.vvm/manifest.json b/model/sample.vvm/manifest.json
index 0b82d0c3f..cdc765ec5 100644
--- a/model/sample.vvm/manifest.json
+++ b/model/sample.vvm/manifest.json
@@ -1,5 +1,6 @@
 {
   "manifest_version": "0.0.0",
+  "id": "018fa5b1-146c-71e9-b523-6f6dabcf05fe",
   "metas_filename": "metas.json",
   "talk": {
     "predict_duration_filename": "predict_duration.onnx",

From be8d0c065fb8a0da442062e605d3b7b583398ecc Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Sat, 25 May 2024 02:40:40 +0900
Subject: [PATCH 04/36] =?UTF-8?q?change:=20`manifest=5Fversion`=E3=82=92`v?=
 =?UTF-8?q?vm=5Fformat=5Fversion`=E3=81=AB=20(#794)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* change: `manifest_version`を`vvm_format_version`に

* エラーメッセージを変更

* エラーメッセージを変更

* 文字列ではなく整数にする
---
 crates/voicevox_core/src/manifest.rs | 82 +++++++++++++++++++++++++---
 model/sample.vvm/manifest.json       |  2 +-
 2 files changed, 74 insertions(+), 10 deletions(-)

diff --git a/crates/voicevox_core/src/manifest.rs b/crates/voicevox_core/src/manifest.rs
index 8464a48ab..0808a6414 100644
--- a/crates/voicevox_core/src/manifest.rs
+++ b/crates/voicevox_core/src/manifest.rs
@@ -1,20 +1,49 @@
-use std::{collections::BTreeMap, fmt::Display, sync::Arc};
+use std::{
+    collections::BTreeMap,
+    fmt::{self, Display},
+    sync::Arc,
+};
 
 use derive_getters::Getters;
 use derive_more::Deref;
 use derive_new::new;
-use serde::{Deserialize, Serialize};
+use serde::{de, Deserialize, Deserializer, Serialize};
 use serde_with::{serde_as, DisplayFromStr};
 
 use crate::{StyleId, VoiceModelId};
 
-pub type RawManifestVersion = String;
-#[derive(Deserialize, Clone, Debug, PartialEq, new)]
-pub struct ManifestVersion(RawManifestVersion);
+/// Marker for `vvm_format_version: 1`; deserializing it doubles as the check that a
+/// manifest declares a format version this code understands.
+#[derive(Clone)]
+struct FormatVersionV1;
 
-impl Display for ManifestVersion {
-    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
-        write!(f, "{}", self.0)
+impl<'de> Deserialize<'de> for FormatVersionV1 {
+    /// Accepts the unsigned integer `1`; any other unsigned integer is a custom error.
+    fn deserialize<D: Deserializer<'de>>(deserializer: D) -> Result<Self, D::Error> {
+        struct Visitor;
+
+        impl<'de> de::Visitor<'de> for Visitor {
+            type Value = FormatVersionV1;
+
+            // Description serde puts in its error when the input has another data type.
+            fn expecting(&self, formatter: &mut fmt::Formatter<'_>) -> fmt::Result {
+                formatter.write_str("an unsigned integer")
+            }
+
+            fn visit_u64<E: de::Error>(self, v: u64) -> Result<Self::Value, E> {
+                if v == 1 {
+                    return Ok(FormatVersionV1);
+                }
+                // Unknown version: the message hints that a newer release may support it.
+                Err(E::custom(format!(
+                    "未知の形式です（`vvm_format_version={v}`）。新しいバージョンのVOICEVOX \
+                     COREであれば対応しているかもしれません",
+                )))
+            }
+        }
+
+        // Let the input's own data type decide which `visit_*` method gets called.
+        deserializer.deserialize_any(Visitor)
     }
 }
 
@@ -39,7 +68,7 @@ impl Display for InnerVoiceId {
 #[derive(Deserialize, Getters, Clone)]
 pub struct Manifest {
     #[allow(dead_code)]
-    manifest_version: ManifestVersion,
+    vvm_format_version: FormatVersionV1,
     pub(crate) id: VoiceModelId,
     metas_filename: String,
     #[serde(flatten)]
@@ -66,3 +95,38 @@ pub(crate) struct TalkManifest {
 pub(crate) struct StyleIdToInnerVoiceId(
     #[serde_as(as = "Arc<BTreeMap<DisplayFromStr, _>>")] Arc<BTreeMap<StyleId, InnerVoiceId>>,
 );
+
+#[cfg(test)]
+mod tests {
+    use rstest::rstest;
+    use serde::Deserialize;
+
+    use super::FormatVersionV1;
+
+    // `vvm_format_version` 1 must deserialize; 2 must fail with the "unknown format"
+    // message followed by the position that `serde_json` appends to it.
+    #[rstest]
+    #[case("{\"vvm_format_version\":1}", Ok(()))]
+    #[case(
+        "{\"vvm_format_version\":2}",
+        Err(
+            "未知の形式です（`vvm_format_version=2`）。新しいバージョンのVOICEVOX COREであれば対応\
+             しているかもしれません at line 1 column 23",
+        )
+    )]
+    fn vvm_format_version_works(
+        #[case] input: &str,
+        #[case] expected: Result<(), &str>,
+    ) -> anyhow::Result<()> {
+        #[derive(Deserialize)]
+        struct ManifestPart {
+            #[allow(dead_code)]
+            vvm_format_version: FormatVersionV1,
+        }
+
+        let outcome = serde_json::from_str::<ManifestPart>(input).map_err(|e| e.to_string());
+        let outcome = outcome.as_ref().map(|_| ()).map_err(String::as_str);
+        assert_eq!(expected, outcome);
+        Ok(())
+    }
+}
diff --git a/model/sample.vvm/manifest.json b/model/sample.vvm/manifest.json
index cdc765ec5..db2ca92c1 100644
--- a/model/sample.vvm/manifest.json
+++ b/model/sample.vvm/manifest.json
@@ -1,5 +1,5 @@
 {
-  "manifest_version": "0.0.0",
+  "vvm_format_version": 1,
   "id": "018fa5b1-146c-71e9-b523-6f6dabcf05fe",
   "metas_filename": "metas.json",
   "talk": {

From 4cd19cce53ae2e0ee14adeb93180f3c6e530ba3a Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Sat, 25 May 2024 22:18:28 +0900
Subject: [PATCH 05/36] =?UTF-8?q?chore:=20#796=20=E3=81=AB=E5=AF=BE?=
 =?UTF-8?q?=E3=81=99=E3=82=8BJava=E3=81=AE=E3=83=86=E3=82=B9=E3=83=88?=
 =?UTF-8?q?=E3=82=92=E8=BF=BD=E5=8A=A0=20(#797)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* chore: #796 に対するJavaのテストを追加

* テスト名を変更
---
 .../voicevoxcore/VoiceModelTest.java          | 36 +++++++++++++++++++
 1 file changed, 36 insertions(+)
 create mode 100644 crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/VoiceModelTest.java

diff --git a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/VoiceModelTest.java b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/VoiceModelTest.java
new file mode 100644
index 000000000..5a720b07f
--- /dev/null
+++ b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/VoiceModelTest.java
@@ -0,0 +1,36 @@
+package jp.hiroshiba.voicevoxcore;
+
+import static org.junit.jupiter.api.Assertions.assertEquals;
+
+import com.google.gson.Gson;
+import com.google.gson.annotations.Expose;
+import com.google.gson.annotations.SerializedName;
+import jakarta.annotation.Nonnull;
+import java.io.File;
+import java.io.IOException;
+import java.nio.file.Files;
+import java.nio.file.Path;
+import java.util.UUID;
+import org.junit.jupiter.api.Test;
+
+class VoiceModelTest extends TestUtils {
+  @Test
+  void idShouldBePreservedAsIs() throws IOException {
+    assertEquals(UUID.fromString(Manifest.readJson().id), loadModel().id);
+  }
+
+  // Gson view of the sample model's manifest.json; only the `id` field is mapped.
+  private static class Manifest {
+    @SerializedName("id")
+    @Expose
+    @Nonnull
+    String id;
+
+    // Decodes as UTF-8 (JSON's standard encoding) rather than the platform default charset.
+    static Manifest readJson() throws IOException {
+      Path path = new File("../../../model/sample.vvm/manifest.json").toPath();
+      String json = new String(Files.readAllBytes(path), java.nio.charset.StandardCharsets.UTF_8);
+      return new Gson().fromJson(json, Manifest.class);
+    }
+  }
+}

From 264460ddf810843a9d54fea5413499359265bdb7 Mon Sep 17 00:00:00 2001
From: Han Yeong-woo <han@yeongwoo.dev>
Date: Tue, 4 Jun 2024 22:08:49 +0900
Subject: [PATCH 06/36] Bump actions (#798)

---
 .github/workflows/build_and_deploy.yml        | 34 +++++++++----------
 .../workflows/build_and_deploy_downloader.yml |  4 +--
 .github/workflows/cargo-deny.yml              |  2 +-
 .github/workflows/download_test.yml           |  2 +-
 .github/workflows/generate_document.yml       | 10 +++---
 .github/workflows/java_lint.yml               |  2 +-
 .github/workflows/labeler.yml                 |  2 +-
 .github/workflows/python_lint.yml             |  4 +--
 .github/workflows/test.yml                    | 34 +++++++++----------
 .github/workflows/typos.yml                   |  4 +--
 _typos.toml                                   |  5 +++
 11 files changed, 54 insertions(+), 49 deletions(-)

diff --git a/.github/workflows/build_and_deploy.yml b/.github/workflows/build_and_deploy.yml
index 01ddfc434..aecd7dca8 100644
--- a/.github/workflows/build_and_deploy.yml
+++ b/.github/workflows/build_and_deploy.yml
@@ -178,9 +178,9 @@ jobs:
     env:
       ASSET_NAME: voicevox_core-${{ matrix.artifact_name }}-${{ needs.config.outputs.version }}
     steps:
-      - uses: actions/checkout@v3 # 製品版ではない場合
+      - uses: actions/checkout@v4 # 製品版ではない場合
         if: ${{ !inputs.is_production }}
-      - uses: actions/checkout@v3 # 製品版の場合
+      - uses: actions/checkout@v4 # 製品版の場合
         if: inputs.is_production
         with:
           fetch-depth: 0 # 全履歴取得
@@ -196,7 +196,7 @@ jobs:
           ) > /dev/null 2>&1
       - name: Set up Python 3.8
         if: matrix.whl_local_version
-        uses: actions/setup-python@v4
+        uses: actions/setup-python@v5
         with:
           python-version: "3.8"
           architecture: ${{ contains(matrix.artifact_name,'x86') && 'x86' || 'x64' }}
@@ -220,7 +220,7 @@ jobs:
           echo "AR_${{ matrix.target }}=llvm-ar" >> "$GITHUB_ENV"
       - name: Checkout VOICEVOX RESOURCE
         if: inputs.is_production
-        uses: actions/checkout@v3
+        uses: actions/checkout@v4
         with:
           repository: VOICEVOX/voicevox_resource
           ref: ${{ env.VOICEVOX_RESOURCE_VERSION }}
@@ -316,7 +316,7 @@ jobs:
           7z a "../${{ env.ASSET_NAME }}.zip" "${{ env.ASSET_NAME }}"
       - name: Upload to Release
         if: fromJson(needs.config.outputs.deploy) && !contains(matrix.target, 'ios')
-        uses: softprops/action-gh-release@v1
+        uses: softprops/action-gh-release@v2
         with:
           prerelease: true
           tag_name: ${{ env.VERSION }}
@@ -325,7 +325,7 @@ jobs:
           target_commitish: ${{ github.sha }}
       - name: Upload Python whl to Release
         if: fromJson(needs.config.outputs.deploy) && matrix.whl_local_version
-        uses: softprops/action-gh-release@v1
+        uses: softprops/action-gh-release@v2
         with:
           prerelease: true
           tag_name: ${{ env.VERSION }}
@@ -349,7 +349,7 @@ jobs:
       IOS_AARCH64_PATH: artifact/voicevox_core-aarch64-apple-ios
       ASSET_NAME: voicevox_core-ios-xcframework-cpu-${{ needs.config.outputs.version }}
     steps:
-      - uses: actions/checkout@v3
+      - uses: actions/checkout@v4
       - uses: actions/download-artifact@v4
         with:
           name: voicevox_core-x86_64-apple-ios
@@ -363,10 +363,10 @@ jobs:
           name: voicevox_core-aarch64-apple-ios
           path: ${{ env.IOS_AARCH64_PATH }}
       - name: Create xcframework
-        id: create-xcframework 
+        id: create-xcframework
         run: |
           build_util/make_ios_xcframework.bash
-          echo "output_asset_path=${OUTPUT_ASSET_PATH}" >> "$GITHUB_OUTPUT" 
+          echo "output_asset_path=${OUTPUT_ASSET_PATH}" >> "$GITHUB_OUTPUT"
         env:
           OUTPUT_ASSET_PATH: artifact/voicevox_core-ios-xcframework-cpu
       - name: Archive artifact
@@ -375,7 +375,7 @@ jobs:
           7z a "../../${{ env.ASSET_NAME }}.zip" "voicevox_core.xcframework"
       - name: Upload to Release
         if: fromJson(needs.config.outputs.deploy)
-        uses: softprops/action-gh-release@v1
+        uses: softprops/action-gh-release@v2
         with:
           prerelease: true
           tag_name: ${{ env.VERSION }}
@@ -389,10 +389,10 @@ jobs:
     env:
       ASSET_NAME: model-${{ needs.config.outputs.version }}
     steps:
-      - uses: actions/checkout@v3
+      - uses: actions/checkout@v4
       - name: Checkout VOICEVOX FAT RESOURCE
         if: inputs.is_production
-        uses: actions/checkout@v3
+        uses: actions/checkout@v4
         with:
           repository: VOICEVOX/voicevox_fat_resource
           ref: ${{ env.VOICEVOX_FAT_RESOURCE_VERSION }}
@@ -412,7 +412,7 @@ jobs:
           7z a "../${{ env.ASSET_NAME }}.zip" "${{ env.ASSET_NAME }}"
       - name: Upload to Release
         if: fromJson(needs.config.outputs.deploy)
-        uses: softprops/action-gh-release@v1
+        uses: softprops/action-gh-release@v2
         with:
           prerelease: true
           tag_name: ${{ env.VERSION }}
@@ -425,7 +425,7 @@ jobs:
     if: ${{ !(github.event_name != 'release' && github.event_name != 'workflow_dispatch') }} # !env.IS_SIMPLE_TEST と同じ
     needs: [config, build_and_deploy]
     steps:
-      - uses: actions/checkout@v3
+      - uses: actions/checkout@v4
       - name: Set up Rust
         uses: ./.github/actions/rust-toolchain-from-file
       - name: Set up Java
@@ -446,13 +446,13 @@ jobs:
           cargo set-version "$VERSION" -p voicevox_core_java_api
 
       - name: "Download artifact (android-arm64-cpu)"
-        uses: actions/download-artifact@v3
+        uses: actions/download-artifact@v4
         with:
           name: voicevox_core_java_api-android-arm64-cpu
           path: artifact/android-arm64-cpu
 
       - name: "Download artifact (android-x86_64-cpu)"
-        uses: actions/download-artifact@v3
+        uses: actions/download-artifact@v4
         with:
           name: voicevox_core_java_api-android-x86_64-cpu
           path: artifact/android-x86_64-cpu
@@ -486,7 +486,7 @@ jobs:
 
       - name: Upload to Release
         if: fromJson(needs.config.outputs.deploy)
-        uses: softprops/action-gh-release@v1
+        uses: softprops/action-gh-release@v2
         with:
           prerelease: true
           tag_name: ${{ env.VERSION }}
diff --git a/.github/workflows/build_and_deploy_downloader.yml b/.github/workflows/build_and_deploy_downloader.yml
index 9daeadea4..d1b9f4a21 100644
--- a/.github/workflows/build_and_deploy_downloader.yml
+++ b/.github/workflows/build_and_deploy_downloader.yml
@@ -69,7 +69,7 @@ jobs:
     runs-on: ${{ matrix.os }}
 
     steps:
-      - uses: actions/checkout@v3
+      - uses: actions/checkout@v4
 
       - name: Install cross compiler for aarch64-unknown-linux-gnu
         if: matrix.target == 'aarch64-unknown-linux-gnu'
@@ -104,7 +104,7 @@ jobs:
 
       - name: Upload to Release
         if: env.VERSION != '0.0.0'
-        uses: softprops/action-gh-release@v1
+        uses: softprops/action-gh-release@v2
         with:
           prerelease: true
           tag_name: ${{ env.VERSION }}
diff --git a/.github/workflows/cargo-deny.yml b/.github/workflows/cargo-deny.yml
index cf600f535..cf2ae2e3d 100644
--- a/.github/workflows/cargo-deny.yml
+++ b/.github/workflows/cargo-deny.yml
@@ -9,7 +9,7 @@ jobs:
   cargo-deny:
     runs-on: ubuntu-20.04
     steps:
-      - uses: actions/checkout@v3
+      - uses: actions/checkout@v4
       - name: Install cargo-binstall
         uses: taiki-e/install-action@cargo-binstall
       - name: Install cargo-deny
diff --git a/.github/workflows/download_test.yml b/.github/workflows/download_test.yml
index 2a1190e40..9f953534a 100644
--- a/.github/workflows/download_test.yml
+++ b/.github/workflows/download_test.yml
@@ -184,7 +184,7 @@ jobs:
     runs-on: ${{ matrix.os }}
     name: ${{ matrix.name }}-${{ matrix.os }}
     steps:
-      - uses: actions/checkout@v3
+      - uses: actions/checkout@v4
       - name: Set up Rust
         uses: ./.github/actions/rust-toolchain-from-file
       - name: Get prerelease latest version
diff --git a/.github/workflows/generate_document.yml b/.github/workflows/generate_document.yml
index 37c39a1dd..531e800c3 100644
--- a/.github/workflows/generate_document.yml
+++ b/.github/workflows/generate_document.yml
@@ -11,13 +11,13 @@ jobs:
   generate_api_document:
     runs-on: ubuntu-latest
     steps:
-      - uses: actions/checkout@v3
+      - uses: actions/checkout@v4
         with:
           submodules: true
       - name: Set up Rust
         uses: ./.github/actions/rust-toolchain-from-file
       - name: Set up Python
-        uses: actions/setup-python@v4
+        uses: actions/setup-python@v5
         with:
           python-version: "3.8"
       - name: Setup Java
@@ -42,7 +42,7 @@ jobs:
       - name: cp crates/voicevox_core_c_api/include/voicevox_core.h
         run: cp crates/voicevox_core_c_api/include/voicevox_core.h docs/apis/c_api/doxygen/
       - name: Generate doxygen document
-        uses: mattnotmitt/doxygen-action@v1.9.4
+        uses: mattnotmitt/doxygen-action@v1.9.8
         with:
           working-directory: "docs/apis/c_api/doxygen"
       - name: Build voicevox_core_python_api
@@ -60,7 +60,7 @@ jobs:
           mkdir -p public/apis/java_api
           cp -r crates/voicevox_core_java_api/lib/build/docs/javadoc/* public/apis/java_api
       - name: Uplaod api document
-        uses: actions/upload-pages-artifact@v1
+        uses: actions/upload-pages-artifact@v3
         if: ${{ github.ref_name == 'main' }}
         with:
           path: public
@@ -78,4 +78,4 @@ jobs:
     steps:
       - name: Deploy to GitHub pages
         id: api
-        uses: actions/deploy-pages@v1
+        uses: actions/deploy-pages@v4
diff --git a/.github/workflows/java_lint.yml b/.github/workflows/java_lint.yml
index ad408e3a7..6b7ff9e46 100644
--- a/.github/workflows/java_lint.yml
+++ b/.github/workflows/java_lint.yml
@@ -21,7 +21,7 @@ jobs:
   java-lint:
     runs-on: ubuntu-latest
     steps:
-      - uses: actions/checkout@v3
+      - uses: actions/checkout@v4
       - uses: actions/setup-java@v4
         with:
           java-version: "11"
diff --git a/.github/workflows/labeler.yml b/.github/workflows/labeler.yml
index 25d78ec6a..3299f1586 100644
--- a/.github/workflows/labeler.yml
+++ b/.github/workflows/labeler.yml
@@ -10,7 +10,7 @@ jobs:
   triage:
     runs-on: ubuntu-latest
     steps:
-    - uses: github/issue-labeler@v2.5
+    - uses: github/issue-labeler@v3.4
       with:
         repo-token: "${{ secrets.GITHUB_TOKEN }}"
         configuration-path: .github/labeler.yml
diff --git a/.github/workflows/python_lint.yml b/.github/workflows/python_lint.yml
index 22449c391..486119e2c 100644
--- a/.github/workflows/python_lint.yml
+++ b/.github/workflows/python_lint.yml
@@ -21,8 +21,8 @@ jobs:
   python:
     runs-on: ubuntu-latest
     steps:
-      - uses: actions/checkout@v3
-      - uses: actions/setup-python@v4
+      - uses: actions/checkout@v4
+      - uses: actions/setup-python@v5
         with:
           python-version: "3.8"
       - name: Install Poetry
diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml
index d0639d045..cace94823 100644
--- a/.github/workflows/test.yml
+++ b/.github/workflows/test.yml
@@ -18,7 +18,7 @@ jobs:
   shellcheck:
     runs-on: ubuntu-22.04
     steps:
-      - uses: actions/checkout@v3
+      - uses: actions/checkout@v4
       - name: Update ShellCheck
         run: |
           sudo apt-get update
@@ -29,7 +29,7 @@ jobs:
   actionlint:
     runs-on: ubuntu-22.04
     steps:
-      - uses: actions/checkout@v3
+      - uses: actions/checkout@v4
       # ShellCheckとPyflakesをインストールしておくと、shell: bashとshell: pythonのコードを検査してくれるようになる
       #
       # 参考:
@@ -40,7 +40,7 @@ jobs:
           sudo apt-get update
           sudo apt-get install -y shellcheck
       - name: Set up Python 3.8
-        uses: actions/setup-python@v4
+        uses: actions/setup-python@v5
         with:
           python-version: "3.8"
       - name: Install Pyflakes
@@ -53,7 +53,7 @@ jobs:
   validate-cargo-lock:
     runs-on: ubuntu-22.04
     steps:
-      - uses: actions/checkout@v3
+      - uses: actions/checkout@v4
       - name: Set up Rust
         uses: ./.github/actions/rust-toolchain-from-file
       - name: Validate Cargo.lock
@@ -62,13 +62,13 @@ jobs:
   rust-lint:
     runs-on: windows-latest
     steps:
-      - uses: actions/checkout@v3
+      - uses: actions/checkout@v4
       - name: Set up Rust
         uses: ./.github/actions/rust-toolchain-from-file
         with:
           components: clippy,rustfmt
       - name: Set up Python 3.8
-        uses: actions/setup-python@v4
+        uses: actions/setup-python@v5
         with:
           python-version: "3.8"
       - uses: Swatinem/rust-cache@v2
@@ -79,7 +79,7 @@ jobs:
   rust-unit-test:
     runs-on: windows-latest
     steps:
-      - uses: actions/checkout@v3
+      - uses: actions/checkout@v4
       - name: Set up Rust
         uses: ./.github/actions/rust-toolchain-from-file
       - uses: Swatinem/rust-cache@v2
@@ -124,9 +124,9 @@ jobs:
         include: ${{ fromJson(needs.rust-integration-test-strategy-matrix.outputs.includes) }}
     runs-on: ${{ matrix.os }}
     steps:
-      - uses: actions/checkout@v3
+      - uses: actions/checkout@v4
       - name: Set up Python 3.8
-        uses: actions/setup-python@v4
+        uses: actions/setup-python@v5
         with:
           python-version: "3.8"
       - name: Set up Rust
@@ -140,7 +140,7 @@ jobs:
   c-header:
     runs-on: ubuntu-latest
     steps:
-      - uses: actions/checkout@v3
+      - uses: actions/checkout@v4
       - name: Set up Rust
         uses: ./.github/actions/rust-toolchain-from-file
       - name: Install cargo-binstall
@@ -187,7 +187,7 @@ jobs:
             artifact_name: linux-x64-cpu-cpp-shared
     runs-on: ${{ matrix.os }}
     steps:
-      - uses: actions/checkout@v3
+      - uses: actions/checkout@v4
       - name: Set up Rust
         uses: ./.github/actions/rust-toolchain-from-file
       - name: Install cargo-binstall
@@ -203,7 +203,7 @@ jobs:
           cp -v target/debug/libonnxruntime.*.dylib example/cpp/unix/voicevox_core/ || true
 
       - if: startsWith(matrix.os, 'mac')
-        uses: jwlawson/actions-setup-cmake@v1.13
+        uses: jwlawson/actions-setup-cmake@v2
       - name: Install build dependencies
         if: startsWith(matrix.os, 'ubuntu')
         run: |
@@ -229,7 +229,7 @@ jobs:
         shell: pwsh
 
     steps:
-      - uses: actions/checkout@v3
+      - uses: actions/checkout@v4
       - name: Set up Rust
         uses: ./.github/actions/rust-toolchain-from-file
       - name: Install cargo-binstall
@@ -243,7 +243,7 @@ jobs:
           cp target/debug/voicevox_core.dll.lib example/cpp/windows/simple_tts/lib/x64/voicevox_core.lib
 
       - name: Add MSBuild to PATH
-        uses: microsoft/setup-msbuild@v1.0.2
+        uses: microsoft/setup-msbuild@v2
       - name: Restore NuGet packages
         working-directory: ${{env.GITHUB_WORKSPACE}}
         run: nuget restore ${{env.SOLUTION_FILE_PATH}}
@@ -266,9 +266,9 @@ jobs:
         shell: bash
         working-directory: ./crates/voicevox_core_python_api
     steps:
-      - uses: actions/checkout@v3
+      - uses: actions/checkout@v4
       - name: Set up Python 3.8
-        uses: actions/setup-python@v4
+        uses: actions/setup-python@v5
         with:
           python-version: "3.8"
       - name: Set up Rust
@@ -301,7 +301,7 @@ jobs:
           - os: ubuntu-latest
     runs-on: ${{ matrix.os }}
     steps:
-      - uses: actions/checkout@v3
+      - uses: actions/checkout@v4
       - name: Set up Rust
         uses: ./.github/actions/rust-toolchain-from-file
       - name: Set up Java
diff --git a/.github/workflows/typos.yml b/.github/workflows/typos.yml
index a42e05dcf..f7ac45241 100644
--- a/.github/workflows/typos.yml
+++ b/.github/workflows/typos.yml
@@ -16,7 +16,7 @@ jobs:
     runs-on: ubuntu-latest
 
     steps:
-      - uses: actions/checkout@v3
+      - uses: actions/checkout@v4
 
       - name: typos-action
-        uses: crate-ci/typos@v1.12.12
+        uses: crate-ci/typos@v1.21.0
diff --git a/_typos.toml b/_typos.toml
index b70ddc608..4c3b0f48b 100644
--- a/_typos.toml
+++ b/_typos.toml
@@ -1,6 +1,11 @@
 # Files for typos
 # Instruction:  https://github.com/marketplace/actions/typos-action#getting-started
 
+[default]
+extend-ignore-identifiers-re = [
+    "\\bPNGs\\b", # https://github.com/crate-ci/typos/issues/745
+]
+
 [default.extend-identifiers]
 NdArray="NdArray" # onnxruntime::session::NdArray
 

From 7cdea5e9150a33d98163150503eb00244adf627e Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Sat, 15 Jun 2024 23:46:11 +0900
Subject: [PATCH 07/36] =?UTF-8?q?fix:=20`voicevox=5Fuser=5Fdict=5Fadd=5Fwo?=
 =?UTF-8?q?rd`=E3=81=8C=E3=82=B9=E3=82=BF=E3=83=83=E3=82=AF=E3=82=92?=
 =?UTF-8?q?=E7=A0=B4=E5=A3=8A=E3=81=99=E3=82=8B=E3=81=AE=E3=82=92=E4=BF=AE?=
 =?UTF-8?q?=E6=AD=A3=20(#800)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 crates/voicevox_core_c_api/src/lib.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/crates/voicevox_core_c_api/src/lib.rs b/crates/voicevox_core_c_api/src/lib.rs
index 08a54b11a..eb2e4698e 100644
--- a/crates/voicevox_core_c_api/src/lib.rs
+++ b/crates/voicevox_core_c_api/src/lib.rs
@@ -1161,7 +1161,7 @@ pub unsafe extern "C" fn voicevox_user_dict_add_word(
     into_result_code_with_error((|| {
         let word = word.read_unaligned().try_into_word()?;
         let uuid = user_dict.dict.add_word(word)?;
-        output_word_uuid.as_ptr().copy_from(uuid.as_bytes(), 16);
+        output_word_uuid.as_ptr().write_unaligned(uuid.into_bytes());
 
         Ok(())
     })())

From ca1a982f3d0257cfb9f431abe8f230fcd37abab4 Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Sun, 16 Jun 2024 00:56:03 +0900
Subject: [PATCH 08/36] chore(deps): update dependency rust to v1.79.0 (#799)

Co-authored-by: renovate[bot] <29139614+renovate[bot]@users.noreply.github.com>
---
 rust-toolchain | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/rust-toolchain b/rust-toolchain
index 54227249d..b3a8c61e6 100644
--- a/rust-toolchain
+++ b/rust-toolchain
@@ -1 +1 @@
-1.78.0
+1.79.0

From d3b559cc0dc56b298c4a4e67453c8af9449e935c Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Tue, 25 Jun 2024 04:17:02 +0900
Subject: [PATCH 09/36] =?UTF-8?q?change:=20macOS=2011=E3=81=AE=E3=82=B5?=
 =?UTF-8?q?=E3=83=9D=E3=83=BC=E3=83=88=E3=82=92=E5=88=87=E3=82=8B=20(#801)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 .github/workflows/build_and_deploy.yml            | 4 ++--
 .github/workflows/build_and_deploy_downloader.yml | 4 ++--
 .github/workflows/test.yml                        | 4 ++--
 3 files changed, 6 insertions(+), 6 deletions(-)

diff --git a/.github/workflows/build_and_deploy.yml b/.github/workflows/build_and_deploy.yml
index aecd7dca8..8ac31c592 100644
--- a/.github/workflows/build_and_deploy.yml
+++ b/.github/workflows/build_and_deploy.yml
@@ -123,7 +123,7 @@ jobs:
               "can_skip_in_simple_test": true
             },
             {
-              "os": "macos-11",
+              "os": "macos-12",
               "features": "",
               "target": "aarch64-apple-darwin",
               "artifact_name": "osx-arm64-cpu",
@@ -131,7 +131,7 @@ jobs:
               "can_skip_in_simple_test": false
             },
             {
-              "os": "macos-11",
+              "os": "macos-12",
               "features": "",
               "target": "x86_64-apple-darwin",
               "artifact_name": "osx-x64-cpu",
diff --git a/.github/workflows/build_and_deploy_downloader.yml b/.github/workflows/build_and_deploy_downloader.yml
index d1b9f4a21..20fd4d63a 100644
--- a/.github/workflows/build_and_deploy_downloader.yml
+++ b/.github/workflows/build_and_deploy_downloader.yml
@@ -60,11 +60,11 @@ jobs:
 
           - name: download-osx-x64
             target: x86_64-apple-darwin
-            os: macos-11
+            os: macos-12
 
           - name: download-osx-arm64
             target: aarch64-apple-darwin
-            os: macos-11
+            os: macos-12
 
     runs-on: ${{ matrix.os }}
 
diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml
index cace94823..14bfbddd0 100644
--- a/.github/workflows/test.yml
+++ b/.github/workflows/test.yml
@@ -103,8 +103,8 @@ jobs:
             { "os": "windows-2022", "features": "", "can_skip_in_simple_test": true },
             { "os": "windows-2019", "features": "directml", "can_skip_in_simple_test": false },
             { "os": "windows-2022", "features": "directml", "can_skip_in_simple_test": true },
-            { "os": "macos-11", "features": "", "can_skip_in_simple_test": false },
-            { "os": "macos-12", "features": "", "can_skip_in_simple_test": true },
+            { "os": "macos-12", "features": "", "can_skip_in_simple_test": false },
+            { "os": "macos-13", "features": "", "can_skip_in_simple_test": true },
             { "os": "ubuntu-20.04", "features": "", "can_skip_in_simple_test": false },
             { "os": "ubuntu-22.04", "features": "", "can_skip_in_simple_test": true }
           ]'

From a728d7eb6dcb975a8fa4f8b1b14ce693d7815213 Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Thu, 4 Jul 2024 16:31:36 +0900
Subject: [PATCH 10/36] =?UTF-8?q?add:=20Rust=20API=E3=81=AEAPI=E3=83=89?=
 =?UTF-8?q?=E3=82=AD=E3=83=A5=E3=83=A1=E3=83=B3=E3=83=88=E3=82=92=E3=83=87?=
 =?UTF-8?q?=E3=83=97=E3=83=AD=E3=82=A4=E3=81=99=E3=82=8B=E3=82=88=E3=81=86?=
 =?UTF-8?q?=E3=81=AB=E3=81=99=E3=82=8B=20(#803)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 .github/workflows/generate_document.yml | 22 ++++++++++++++++++++--
 docs/apis/index.html                    |  1 +
 2 files changed, 21 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/generate_document.yml b/.github/workflows/generate_document.yml
index 531e800c3..039800df1 100644
--- a/.github/workflows/generate_document.yml
+++ b/.github/workflows/generate_document.yml
@@ -16,6 +16,20 @@ jobs:
           submodules: true
       - name: Set up Rust
         uses: ./.github/actions/rust-toolchain-from-file
+      - name: Extract the Rust version used on Docs.rs
+        id: docsrs-rust-version
+        run: |
+          page=$(curl -f https://docs.rs/about/builds)
+          date=$(
+            sed -n \
+              's:^.*<code>rustc 1\.[0-9]\+\.[0-9]\+-nightly ([0-9a-f]\{9\} \([0-9]\{4\}-[0-9]\{2\}-[0-9]\{2\}\))</code>.*$:\1:p' \
+              <<< "$page"
+          )
+          echo "rust-toolchain=nightly-$date" >> "$GITHUB_OUTPUT"
+      - name: Set up nightly Rust
+        uses: dtolnay/rust-toolchain@master
+        with:
+          toolchain: ${{ steps.docsrs-rust-version.outputs.rust-toolchain }}
       - name: Set up Python
         uses: actions/setup-python@v5
         with:
@@ -25,8 +39,8 @@ jobs:
         with:
           java-version: "11"
           distribution: "adopt"
-      - name: Install cargo-binstall
-        uses: taiki-e/install-action@cargo-binstall
+      - name: Install cargo-docs-rs
+        uses: dtolnay/install@cargo-docs-rs
       - name: Create a venv
         uses: ./.github/actions/create-venv
       - name: Install python dependencies
@@ -39,6 +53,10 @@ jobs:
         run: mkdir -p public/apis/c_api
       - name: cp docs/apis/index.html
         run: cp docs/apis/index.html public/apis/
+      - name: Generate rustdoc
+        run: |
+          cargo +${{ steps.docsrs-rust-version.outputs.rust-toolchain }} docs-rs -p voicevox_core
+          mv target/x86_64-unknown-linux-gnu/doc public/apis/rust_api
       - name: cp crates/voicevox_core_c_api/include/voicevox_core.h
         run: cp crates/voicevox_core_c_api/include/voicevox_core.h docs/apis/c_api/doxygen/
       - name: Generate doxygen document
diff --git a/docs/apis/index.html b/docs/apis/index.html
index 639602f9f..d1f5d09b2 100644
--- a/docs/apis/index.html
+++ b/docs/apis/index.html
@@ -6,6 +6,7 @@
   <body>
     <!-- TODO: まともなページを用意する -->
     <ul>
+      <li><a href="./rust_api/voicevox_core">Rust API</a></li>
       <li><a href="./c_api">C API</a></li>
       <li><a href="./python_api">Python API</a></li>
       <li><a href="./java_api">Java API</a></li>

From 537d9b23225780af207a4f1f59ed65d9a34b4af6 Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Fri, 5 Jul 2024 07:15:15 +0900
Subject: [PATCH 11/36] =?UTF-8?q?change:=20`Onnxruntime`=E5=9E=8B=E3=82=92?=
 =?UTF-8?q?=E8=BF=BD=E5=8A=A0=E3=81=97=E3=80=81=E3=81=9D=E3=81=93=E3=81=8B?=
 =?UTF-8?q?=E3=82=89`dlopen`/`LoadLibrary*`=E3=82=92=E8=A1=8C=E3=81=86=20(?=
 =?UTF-8?q?#802)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* change: `Onnxruntime`型を追加し、そこから`dlopen`/`LoadLibrary*`を行う

* KotlinのexampleにFIXMEを追加

* "ONNX Runtimeを表す" → "AIエンジンの"

* ドキュメントとコメントを追加

* フィーチャをリネーム

* fixup! フィーチャをリネーム

* fixup! フィーチャをリネーム

* fixup! フィーチャをリネーム

* fixup! フィーチャをリネーム

* fixup! フィーチャをリネーム

* voicevox-ortを更新

* `sed`のし損ねを修正

* ドキュメントやコメントを更新

* C APIに定数のgetterを追加

* voicevox-ortを更新

* "filename"を"ファイル名（モジュール名）もしくはファイルパス"に

* C APIのドキュメントに"Availability"のセクションを追加

* フィーチャに関するドキュメントを更新

https://github.com/VOICEVOX/voicevox_core/pull/802#issuecomment-2198751933

* C APIのビルドに関するドキュメントのヘッダファイル周りを更新

* voicevox-ortを更新

* `JavaStr`を`CStr::to_str`しない

* fixup! `JavaStr`を`CStr::to_str`しない

* 不要な依存を削除

* `link-onnxruntime`で`cargo test`が通るようにする

* fixup! `link-onnxruntime`で`cargo test`が通るようにする

* fixup! `link-onnxruntime`で`cargo test`が通るようにする
---
 .github/workflows/build_and_deploy.yml        |  40 +-
 .github/workflows/generate_document.yml       |   4 +-
 .github/workflows/test.yml                    |  21 +-
 Cargo.lock                                    | 124 +++++-
 Cargo.toml                                    |  11 +-
 README.md                                     |  12 +-
 crates/test_util/Cargo.toml                   |   2 +
 crates/test_util/build.rs                     |  34 ++
 crates/test_util/src/lib.rs                   |   3 +
 crates/voicevox_core/Cargo.toml               |  16 +-
 .../src/__internal/doctest_fixtures.rs        |  12 +-
 crates/voicevox_core/src/blocking.rs          |  11 +-
 crates/voicevox_core/src/devices.rs           |  32 --
 crates/voicevox_core/src/error.rs             |  10 +
 crates/voicevox_core/src/infer.rs             |   4 +-
 crates/voicevox_core/src/infer/runtimes.rs    |   4 +-
 .../src/infer/runtimes/onnxruntime.rs         | 385 +++++++++++++++++-
 crates/voicevox_core/src/infer/session_set.rs |   3 +-
 crates/voicevox_core/src/lib.rs               |  62 +++
 crates/voicevox_core/src/status.rs            |  36 +-
 crates/voicevox_core/src/synthesizer.rs       | 122 ++++--
 crates/voicevox_core/src/tokio.rs             |  11 +-
 crates/voicevox_core_c_api/Cargo.toml         |   5 +
 crates/voicevox_core_c_api/build.rs           |   1 +
 crates/voicevox_core_c_api/cbindgen.toml      |  30 +-
 .../include/voicevox_core.h                   | 200 ++++++++-
 crates/voicevox_core_c_api/src/c_impls.rs     |  70 +++-
 .../src/compatible_engine.rs                  |  25 +-
 crates/voicevox_core_c_api/src/helpers.rs     |  19 +-
 crates/voicevox_core_c_api/src/lib.rs         | 210 +++++++++-
 crates/voicevox_core_c_api/src/result_code.rs |   5 +
 .../tests/e2e/assert_cdylib.rs                |  12 +-
 .../voicevox_core_c_api/tests/e2e/log_mask.rs |   7 +
 crates/voicevox_core_c_api/tests/e2e/main.rs  |   1 +
 .../tests/e2e/snapshots.toml                  |  32 +-
 .../tests/e2e/testcases/compatible_engine.rs  |  13 +-
 ...ble_engine_load_model_before_initialize.rs |   1 +
 .../tests/e2e/testcases/global_info.rs        |  22 +-
 .../tests/e2e/testcases/simple_tts.rs         |  11 +
 .../testcases/synthesizer_new_output_json.rs  |  11 +
 .../e2e/testcases/tts_via_audio_query.rs      |  11 +
 .../tests/e2e/testcases/user_dict_load.rs     |  11 +
 .../e2e/testcases/user_dict_manipulate.rs     |   1 +
 crates/voicevox_core_java_api/Cargo.toml      |   3 +-
 .../jp/hiroshiba/voicevoxcore/GlobalInfo.java |  18 +-
 .../hiroshiba/voicevoxcore/Onnxruntime.java   | 132 ++++++
 .../hiroshiba/voicevoxcore/Synthesizer.java   |  29 +-
 .../InitInferenceRuntimeException.java        |  14 +
 .../jp/hiroshiba/voicevoxcore/InfoTest.java   |   5 +-
 .../voicevoxcore/SynthesizerTest.java         |  17 +-
 .../jp/hiroshiba/voicevoxcore/TestUtils.java  |  10 +
 .../hiroshiba/voicevoxcore/UserDictTest.java  |   3 +-
 crates/voicevox_core_java_api/src/common.rs   |   1 +
 crates/voicevox_core_java_api/src/info.rs     |  11 -
 crates/voicevox_core_java_api/src/lib.rs      |   1 +
 .../voicevox_core_java_api/src/onnxruntime.rs |  56 +++
 .../voicevox_core_java_api/src/synthesizer.rs |  10 +-
 crates/voicevox_core_python_api/Cargo.toml    |   3 +-
 .../python/test/conftest.py                   |   8 +
 .../python/test/test_asyncio_metas.py         |   7 +-
 .../test/test_asyncio_user_dict_load.py       |   5 +-
 .../python/test/test_blocking_metas.py        |   7 +-
 .../test/test_blocking_user_dict_load.py      |   5 +-
 ...est_pseudo_raii_for_asyncio_synthesizer.py |  11 +-
 ...st_pseudo_raii_for_blocking_synthesizer.py |  11 +-
 .../python/test/test_type_stub_consts.py      |  50 +++
 .../python/voicevox_core/__init__.py          |   4 +-
 .../python/voicevox_core/_load_dlls.py        |   1 +
 .../python/voicevox_core/_rust/__init__.pyi   |  22 +-
 .../python/voicevox_core/_rust/asyncio.pyi    |  75 ++++
 .../python/voicevox_core/_rust/blocking.pyi   |  75 ++++
 .../python/voicevox_core/asyncio.py           |   4 +-
 .../python/voicevox_core/blocking.py          |   4 +-
 .../voicevox_core_python_api/src/convert.rs   |   9 +-
 crates/voicevox_core_python_api/src/lib.rs    | 171 +++++++-
 docs/apis/c_api/doxygen/Doxyfile              |   3 +-
 docs/feature-options.md                       |  26 ++
 docs/usage.md                                 |   6 +-
 example/cpp/unix/simple_tts.cpp               |  11 +-
 example/cpp/windows/simple_tts/simple_tts.cpp |  11 +-
 example/kotlin/README.md                      |   9 +-
 example/kotlin/app/src/main/kotlin/app/App.kt |   9 +-
 example/python/run-asyncio.py                 |  31 +-
 example/python/run.py                         |  31 +-
 84 files changed, 2253 insertions(+), 323 deletions(-)
 create mode 100644 crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/Onnxruntime.java
 create mode 100644 crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/exceptions/InitInferenceRuntimeException.java
 create mode 100644 crates/voicevox_core_java_api/src/onnxruntime.rs
 create mode 100644 crates/voicevox_core_python_api/python/test/test_type_stub_consts.py
 create mode 100644 docs/feature-options.md

diff --git a/.github/workflows/build_and_deploy.yml b/.github/workflows/build_and_deploy.yml
index 8ac31c592..e9b5e9eb5 100644
--- a/.github/workflows/build_and_deploy.yml
+++ b/.github/workflows/build_and_deploy.yml
@@ -41,7 +41,14 @@ defaults:
     shell: bash
 
 jobs:
-  config: # 全 jobs で利用する定数の定義。実行対象の条件をフィルタリングする。
+  # 全 jobs で利用する定数の定義。実行対象の条件をフィルタリングする。
+  #
+  # c_release_format = plain-cdylib | ios-xcframework
+  #
+  #     `plain-cdylib`の場合、動的ライブラリとその付属物をZIPに固めたものをC APIとしてリリースする。
+  #     `ios-xcframework`の場合はiOS用のXCFrameworkをC APIとしてリリースする。また、ONNX Runtimeの
+  #     リンク方法に関わるCargoフィーチャも`c_release_format`によって選択される。
+  config:
     runs-on: ubuntu-latest
     outputs:
       includes: ${{ steps.strategy_matrix.outputs.includes }}
@@ -57,6 +64,7 @@ jobs:
               "features": "",
               "target": "x86_64-pc-windows-msvc",
               "artifact_name": "windows-x64-cpu",
+              "c_release_format": "plain-cdylib",
               "whl_local_version": "cpu",
               "can_skip_in_simple_test": true
             },
@@ -65,6 +73,7 @@ jobs:
               "features": "directml",
               "target": "x86_64-pc-windows-msvc",
               "artifact_name": "windows-x64-directml",
+              "c_release_format": "plain-cdylib",
               "whl_local_version": "directml",
               "can_skip_in_simple_test": false
             },
@@ -73,6 +82,7 @@ jobs:
               "features": "cuda",
               "target": "x86_64-pc-windows-msvc",
               "artifact_name": "windows-x64-cuda",
+              "c_release_format": "plain-cdylib",
               "whl_local_version": "cuda",
               "can_skip_in_simple_test": true
             },
@@ -81,6 +91,7 @@ jobs:
               "features": "",
               "target": "i686-pc-windows-msvc",
               "artifact_name": "windows-x86-cpu",
+              "c_release_format": "plain-cdylib",
               "whl_local_version": "cpu",
               "can_skip_in_simple_test": true
             },
@@ -89,6 +100,7 @@ jobs:
               "features": "",
               "target": "x86_64-unknown-linux-gnu",
               "artifact_name": "linux-x64-cpu",
+              "c_release_format": "plain-cdylib",
               "whl_local_version": "cpu",
               "can_skip_in_simple_test": true
             },
@@ -97,6 +109,7 @@ jobs:
               "features": "cuda",
               "target": "x86_64-unknown-linux-gnu",
               "artifact_name": "linux-x64-gpu",
+              "c_release_format": "plain-cdylib",
               "whl_local_version": "cuda",
               "can_skip_in_simple_test": false
             },
@@ -105,6 +118,7 @@ jobs:
               "features": "",
               "target": "aarch64-unknown-linux-gnu",
               "artifact_name": "linux-arm64-cpu",
+              "c_release_format": "plain-cdylib",
               "whl_local_version": "cpu",
               "can_skip_in_simple_test": true
             },
@@ -113,6 +127,7 @@ jobs:
               "features": "",
               "target": "aarch64-linux-android",
               "artifact_name": "android-arm64-cpu",
+              "c_release_format": "plain-cdylib",
               "can_skip_in_simple_test": true
             },
             {
@@ -120,6 +135,7 @@ jobs:
               "features": "",
               "target": "x86_64-linux-android",
               "artifact_name": "android-x86_64-cpu",
+              "c_release_format": "plain-cdylib",
               "can_skip_in_simple_test": true
             },
             {
@@ -127,6 +143,7 @@ jobs:
               "features": "",
               "target": "aarch64-apple-darwin",
               "artifact_name": "osx-arm64-cpu",
+              "c_release_format": "plain-cdylib",
               "whl_local_version": "cpu",
               "can_skip_in_simple_test": false
             },
@@ -135,6 +152,7 @@ jobs:
               "features": "",
               "target": "x86_64-apple-darwin",
               "artifact_name": "osx-x64-cpu",
+              "c_release_format": "plain-cdylib",
               "whl_local_version": "cpu",
               "can_skip_in_simple_test": true
             },
@@ -143,6 +161,7 @@ jobs:
               "features": "",
               "target": "aarch64-apple-ios",
               "artifact_name": "ios-arm64-cpu",
+              "c_release_format": "ios-xcframework",
               "can_skip_in_simple_test": true
             },
             {
@@ -150,6 +169,7 @@ jobs:
               "features": "",
               "target": "aarch64-apple-ios-sim",
               "artifact_name": "ios-arm64-cpu-sim",
+              "c_release_format": "ios-xcframework",
               "can_skip_in_simple_test": true
             },
             {
@@ -157,6 +177,7 @@ jobs:
               "features": "",
               "target": "x86_64-apple-ios",
               "artifact_name": "ios-x64-cpu",
+              "c_release_format": "ios-xcframework",
               "can_skip_in_simple_test": true
             }
           ]'
@@ -244,8 +265,12 @@ jobs:
       - name: build voicevox_core_c_api
         shell: bash
         run: |
+          case ${{ matrix.c_release_format }} in
+            plain-cdylib) linking=load-onnxruntime ;;
+            ios-xcframework) linking=link-onnxruntime ;;
+          esac
           function build() {
-            cargo build -p voicevox_core_c_api -vv --features ${{ matrix.features }}, --target ${{ matrix.target }} --release
+            cargo build -p voicevox_core_c_api -vv --features "$linking",${{ matrix.features }} --target ${{ matrix.target }} --release
           }
           if ${{ !inputs.is_production }}; then
             build
@@ -285,7 +310,12 @@ jobs:
       - name: Organize artifact
         run: |
           mkdir -p "artifact/${{ env.ASSET_NAME }}"
-          cp -v crates/voicevox_core_c_api/include/voicevox_core.h "artifact/${{ env.ASSET_NAME }}"
+          case ${{ matrix.c_release_format }} in
+            plain-cdylib) feature=VOICEVOX_LOAD_ONNXRUNTIME ;;
+            ios-xcframework) feature=VOICEVOX_LINK_ONNXRUNTIME ;;
+          esac
+          sed 's:^//\(#define '"$feature"'\)$:\1:' crates/voicevox_core_c_api/include/voicevox_core.h \
+            > "artifact/${{ env.ASSET_NAME }}/voicevox_core.h"
           cp -v target/${{ matrix.target }}/release/*voicevox_core.{dll,so,dylib} "artifact/${{ env.ASSET_NAME }}" || true
           cp -v target/${{ matrix.target }}/release/voicevox_core.dll.lib "artifact/${{ env.ASSET_NAME }}/voicevox_core.lib" || true
           cp -v -n target/${{ matrix.target }}/release/{,lib}onnxruntime*.{dll,so.*,so,dylib} "artifact/${{ env.ASSET_NAME }}" || true
@@ -305,7 +335,7 @@ jobs:
           ESIGNERCKA_PASSWORD: ${{ secrets.ESIGNERCKA_PASSWORD }}
           ESIGNERCKA_TOTP_SECRET: ${{ secrets.ESIGNERCKA_TOTP_SECRET }}
       - name: Upload artifact to build XCFramework
-        if: contains(matrix.target, 'ios')
+        if: matrix.c_release_format == 'ios-xcframework'
         uses: actions/upload-artifact@v4
         with:
           name: voicevox_core-${{ matrix.target }}
@@ -315,7 +345,7 @@ jobs:
           cd artifact
           7z a "../${{ env.ASSET_NAME }}.zip" "${{ env.ASSET_NAME }}"
       - name: Upload to Release
-        if: fromJson(needs.config.outputs.deploy) && !contains(matrix.target, 'ios')
+        if: fromJson(needs.config.outputs.deploy) && matrix.c_release_format == 'plain-cdylib'
         uses: softprops/action-gh-release@v2
         with:
           prerelease: true
diff --git a/.github/workflows/generate_document.yml b/.github/workflows/generate_document.yml
index 039800df1..c4af6b80b 100644
--- a/.github/workflows/generate_document.yml
+++ b/.github/workflows/generate_document.yml
@@ -64,9 +64,7 @@ jobs:
         with:
           working-directory: "docs/apis/c_api/doxygen"
       - name: Build voicevox_core_python_api
-        run: |
-          cargo build -p voicevox_core_c_api -vv
-          maturin develop --manifest-path ./crates/voicevox_core_python_api/Cargo.toml --locked
+        run: maturin develop --manifest-path ./crates/voicevox_core_python_api/Cargo.toml --locked
       # https://github.com/readthedocs/sphinx-autoapi/issues/405
       - name: Workaround to make Sphinx recognize `_rust` as a module
         run: touch ./crates/voicevox_core_python_api/python/voicevox_core/_rust/__init__.py
diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml
index 14bfbddd0..8550fbfca 100644
--- a/.github/workflows/test.yml
+++ b/.github/workflows/test.yml
@@ -72,8 +72,10 @@ jobs:
         with:
           python-version: "3.8"
       - uses: Swatinem/rust-cache@v2
-      - run: cargo clippy -vv --all-features --tests -- -D clippy::all -D warnings --no-deps
-      - run: cargo clippy -vv --all-features -- -D clippy::all -D warnings --no-deps
+      - run: cargo clippy -vv --features directml,cuda --tests -- -D clippy::all -D warnings --no-deps
+      - run: cargo clippy -vv --features directml,cuda -- -D clippy::all -D warnings --no-deps
+      - run: cargo clippy -vv -p voicevox_core -p voicevox_core_c_api --features link-onnxruntime,directml,cuda --tests -- -D clippy::all -D warnings --no-deps
+      - run: cargo clippy -vv -p voicevox_core -p voicevox_core_c_api --features link-onnxruntime,directml,cuda -- -D clippy::all -D warnings --no-deps
       - run: cargo fmt -- --check
 
   rust-unit-test:
@@ -134,7 +136,7 @@ jobs:
       - uses: Swatinem/rust-cache@v2
         with:
           key: "cargo-integration-test-cache-${{ matrix.features }}-${{ matrix.os }}"
-      - name: Run cargo integration test
+      - name: Run cargo integration test (load-onnxruntime)
         run: RUST_BACKTRACE=full cargo test --test "*" -vv --features ,${{ matrix.features }} -- --include-ignored
 
   c-header:
@@ -193,11 +195,13 @@ jobs:
       - name: Install cargo-binstall
         uses: taiki-e/install-action@cargo-binstall
       - name: build voicevox_core_c_api
-        run: cargo build -p voicevox_core_c_api -vv
+        run: cargo build -p voicevox_core_c_api --features load-onnxruntime -vv
       - name: 必要なfileをunix用exampleのディレクトリに移動させる
         run: |
           mkdir -p example/cpp/unix/voicevox_core/
-          cp -v crates/voicevox_core_c_api/include/voicevox_core.h example/cpp/unix/voicevox_core/
+          sed 's:^//\(#define VOICEVOX_LOAD_ONNXRUNTIME\)$:\1:' \
+            crates/voicevox_core_c_api/include/voicevox_core.h \
+            > example/cpp/unix/voicevox_core/voicevox_core.h
           cp -v target/debug/libvoicevox_core.{so,dylib} example/cpp/unix/voicevox_core/ || true
           cp -v target/debug/libonnxruntime.so.* example/cpp/unix/voicevox_core/ || true
           cp -v target/debug/libonnxruntime.*.dylib example/cpp/unix/voicevox_core/ || true
@@ -235,11 +239,14 @@ jobs:
       - name: Install cargo-binstall
         uses: taiki-e/install-action@cargo-binstall
       - name: build voicevox_core_c_api
-        run: cargo build -p voicevox_core_c_api -vv
+        run: cargo build -p voicevox_core_c_api --features load-onnxruntime -vv
       - name: 必要なfileをexampleのディレクトリに移動させる
+        shell: bash
         run: |
           mkdir -p example/cpp/windows/simple_tts/lib/x64
-          cp -v crates/voicevox_core_c_api/include/voicevox_core.h example/cpp/windows/simple_tts/
+          sed 's:^//\(#define VOICEVOX_LOAD_ONNXRUNTIME\)$:\1:' \
+            crates/voicevox_core_c_api/include/voicevox_core.h \
+            > example/cpp/windows/simple_tts/voicevox_core.h
           cp target/debug/voicevox_core.dll.lib example/cpp/windows/simple_tts/lib/x64/voicevox_core.lib
 
       - name: Add MSBuild to PATH
diff --git a/Cargo.lock b/Cargo.lock
index d3846b8a0..a612d57e6 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -362,6 +362,32 @@ name = "camino"
 version = "1.1.6"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "c59e92b5a388f549b863a7bea62612c09f24c8393560709a54558a9abdfb3b9c"
+dependencies = [
+ "serde",
+]
+
+[[package]]
+name = "cargo-platform"
+version = "0.1.8"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "24b1f0365a6c6bb4020cd05806fd0d33c44d38046b8bd7f0e40814b9763cabfc"
+dependencies = [
+ "serde",
+]
+
+[[package]]
+name = "cargo_metadata"
+version = "0.18.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "2d886547e41f740c616ae73108f6eb70afe6d940c7bc697cb30f13daec073037"
+dependencies = [
+ "camino",
+ "cargo-platform",
+ "semver",
+ "serde",
+ "serde_json",
+ "thiserror",
+]
 
 [[package]]
 name = "cbindgen"
@@ -443,7 +469,7 @@ checksum = "77ed9a53e5d4d9c573ae844bfac6872b159cb1d1585a83b29e7a64b7eef7332a"
 dependencies = [
  "glob",
  "libc",
- "libloading",
+ "libloading 0.7.3",
 ]
 
 [[package]]
@@ -599,6 +625,26 @@ dependencies = [
  "windows-sys 0.42.0",
 ]
 
+[[package]]
+name = "const_format"
+version = "0.2.32"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e3a214c7af3d04997541b18d432afaff4c455e79e2029079647e72fc2bd27673"
+dependencies = [
+ "const_format_proc_macros",
+]
+
+[[package]]
+name = "const_format_proc_macros"
+version = "0.2.32"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c7f6ff08fd20f4f299298a28e2dfa8a8ba1036e6cd2460ac1de7b425d76f2500"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "unicode-xid",
+]
+
 [[package]]
 name = "constant_time_eq"
 version = "0.1.5"
@@ -1100,10 +1146,11 @@ dependencies = [
 
 [[package]]
 name = "fs-err"
-version = "2.9.0"
+version = "2.11.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "0845fa252299212f0389d64ba26f34fa32cfe41588355f21ed507c59a0f64541"
+checksum = "88a41f105fe1d5b6b34b2055e3dc59bb79b46b48b2040b9e6c7b4b5de097aa41"
 dependencies = [
+ "autocfg",
  "tokio",
 ]
 
@@ -1675,6 +1722,16 @@ dependencies = [
  "winapi",
 ]
 
+[[package]]
+name = "libloading"
+version = "0.8.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0c2a198fb6b0eada2a8df47933734e6d35d350665a33a3593d7164fa52c75c19"
+dependencies = [
+ "cfg-if",
+ "windows-targets 0.48.0",
+]
+
 [[package]]
 name = "libm"
 version = "0.2.6"
@@ -1990,9 +2047,9 @@ dependencies = [
 
 [[package]]
 name = "once_cell"
-version = "1.18.0"
+version = "1.19.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "dd8b5dd2ae5ed71462c540258bedcb51965123ad7e7ccf4b9a8cafaa4a63576d"
+checksum = "3fdb12b2476b595f9358c5161aa467c2438859caa136dec86c26fdd2efe17b92"
 
 [[package]]
 name = "opaque-debug"
@@ -2502,6 +2559,26 @@ dependencies = [
  "bitflags 1.3.2",
 ]
 
+[[package]]
+name = "ref-cast"
+version = "1.0.23"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ccf0a6f84d5f1d581da8b41b47ec8600871962f2a528115b542b362d4b744931"
+dependencies = [
+ "ref-cast-impl",
+]
+
+[[package]]
+name = "ref-cast-impl"
+version = "1.0.23"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "bcc303e793d3734489387d205e9b186fac9c6cfacedd98cbb2e8a5943595f3e6"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.48",
+]
+
 [[package]]
 name = "regex"
 version = "1.10.0"
@@ -2793,21 +2870,24 @@ name = "semver"
 version = "1.0.14"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "e25dfac463d778e353db5be2449d1cce89bd6fd23c9f1ea21310ce6e5a1b29c4"
+dependencies = [
+ "serde",
+]
 
 [[package]]
 name = "serde"
-version = "1.0.164"
+version = "1.0.203"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "9e8c8cf938e98f769bc164923b06dce91cea1751522f46f8466461af04c9027d"
+checksum = "7253ab4de971e72fb7be983802300c30b5a7f0c2e56fab8abfc6a214307c0094"
 dependencies = [
  "serde_derive",
 ]
 
 [[package]]
 name = "serde_derive"
-version = "1.0.164"
+version = "1.0.203"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "d9735b638ccc51c28bf6914d90a2e9725b377144fc612c49a611fddd1b631d68"
+checksum = "500cbc0ebeb6f46627f50f3f5811ccf6bf00643be300b4c3eabc0ef55dc5b5ba"
 dependencies = [
  "proc-macro2",
  "quote",
@@ -3136,16 +3216,18 @@ dependencies = [
  "anyhow",
  "bindgen 0.69.4",
  "camino",
+ "cargo_metadata",
  "flate2",
  "fs-err",
  "indoc",
- "libloading",
+ "libloading 0.7.3",
  "once_cell",
  "reqwest",
  "serde",
  "serde_json",
  "tar",
  "tokio",
+ "voicevox-ort",
  "zip",
 ]
 
@@ -3465,6 +3547,12 @@ version = "0.1.10"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "c0edd1e5b14653f783770bce4a4dabb4a5108a5370a5f5d8cfe8710c361f6c8b"
 
+[[package]]
+name = "unicode-xid"
+version = "0.2.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f962df74c8c05a667b5ee8bcf162993134c104e96440b663c8daa176dc772d8c"
+
 [[package]]
 name = "unindent"
 version = "0.2.3"
@@ -3535,11 +3623,14 @@ checksum = "49874b5167b65d7193b8aba1567f5c7d93d001cafc34600cee003eda787e483f"
 [[package]]
 name = "voicevox-ort"
 version = "2.0.0-rc.2"
-source = "git+https://github.com/VOICEVOX/ort.git?rev=a2d6ae22327869e896bf4c16828734d09516d2d9#a2d6ae22327869e896bf4c16828734d09516d2d9"
+source = "git+https://github.com/VOICEVOX/ort.git?rev=07c047c449b959d8f76593046e139bae520d59c3#07c047c449b959d8f76593046e139bae520d59c3"
 dependencies = [
+ "anyhow",
  "half",
  "js-sys",
+ "libloading 0.8.3",
  "ndarray",
+ "once_cell",
  "thiserror",
  "tracing",
  "voicevox-ort-sys",
@@ -3549,7 +3640,7 @@ dependencies = [
 [[package]]
 name = "voicevox-ort-sys"
 version = "2.0.0-rc.2"
-source = "git+https://github.com/VOICEVOX/ort.git?rev=a2d6ae22327869e896bf4c16828734d09516d2d9#a2d6ae22327869e896bf4c16828734d09516d2d9"
+source = "git+https://github.com/VOICEVOX/ort.git?rev=07c047c449b959d8f76593046e139bae520d59c3#07c047c449b959d8f76593046e139bae520d59c3"
 dependencies = [
  "flate2",
  "sha2",
@@ -3564,6 +3655,7 @@ dependencies = [
  "anyhow",
  "async_zip",
  "camino",
+ "const_format",
  "derive-getters",
  "derive-new",
  "derive_more",
@@ -3584,6 +3676,7 @@ dependencies = [
  "ouroboros",
  "pretty_assertions",
  "rayon",
+ "ref-cast",
  "regex",
  "rstest",
  "rstest_reuse",
@@ -3616,6 +3709,7 @@ dependencies = [
  "chrono",
  "clap 4.0.10",
  "colorchoice",
+ "const_format",
  "cstr",
  "derive-getters",
  "duct",
@@ -3624,12 +3718,13 @@ dependencies = [
  "inventory",
  "itertools 0.10.5",
  "libc",
- "libloading",
+ "libloading 0.7.3",
  "libtest-mimic",
  "ndarray",
  "ndarray-stats",
  "once_cell",
  "process_path",
+ "ref-cast",
  "regex",
  "serde",
  "serde_json",
@@ -3642,6 +3737,7 @@ dependencies = [
  "tracing-subscriber",
  "typetag",
  "uuid",
+ "voicevox-ort",
  "voicevox_core",
 ]
 
@@ -3652,6 +3748,7 @@ dependencies = [
  "android_logger",
  "chrono",
  "derive_more",
+ "duplicate",
  "easy-ext",
  "jni",
  "once_cell",
@@ -3681,6 +3778,7 @@ dependencies = [
  "camino",
  "easy-ext",
  "log",
+ "once_cell",
  "pyo3",
  "pyo3-asyncio",
  "pyo3-log",
diff --git a/Cargo.toml b/Cargo.toml
index 4ea3d3757..b467c583e 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -13,11 +13,13 @@ bindgen = "0.69.4"
 binstall-tar = "0.4.39"
 bytes = "1.1.0"
 camino = "1.1.6"
+cargo_metadata = "0.18.1"
 cbindgen = "0.24.3"
 chrono = { version = "0.4.26", default-features = false }
 clap = "4.0.10"
 color-eyre = "0.6.2"
 colorchoice = "1.0.0"
+const_format = "0.2.32"
 cstr = "0.2.11" # https://github.com/dtolnay/syn/issues/1502
 derive-getters = "0.2.0"
 derive-new = "0.5.9"
@@ -29,7 +31,7 @@ educe = "0.4.23"
 enum-map = "3.0.0-beta.1"
 eyre = "0.6.8"
 flate2 = "1.0.25"
-fs-err = "2.9.0"
+fs-err = "2.11.0"
 futures = "0.3.26"
 futures-core = "0.3.25"
 futures-util = "0.3.25"
@@ -50,7 +52,7 @@ log = "0.4.17"
 ndarray = "0.15.6"
 ndarray-stats = "0.5.1"
 octocrab = { version = "0.19.0", default-features = false }
-once_cell = "1.18.0"
+once_cell = "1.19.0"
 ouroboros = "0.18.0"
 parse-display = "0.8.2"
 pretty_assertions = "1.3.0"
@@ -60,11 +62,12 @@ pyo3-asyncio = "0.20.0"
 pyo3-log = "0.9.0"
 quote = "1.0.33"
 rayon = "1.6.1"
+ref-cast = "1.0.23"
 regex = "1.10.0"
 reqwest = { version = "0.11.13", default-features = false }
 rstest = "0.15.0"
 rstest_reuse = "0.6.0"
-serde = "1.0.145"
+serde = "1.0.203"
 serde_json = "1.0.85"
 serde_with = "3.3.0"
 smallvec = "1.13.1"
@@ -87,7 +90,7 @@ zip = "0.6.3"
 
 [workspace.dependencies.voicevox-ort]
 git = "https://github.com/VOICEVOX/ort.git"
-rev = "a2d6ae22327869e896bf4c16828734d09516d2d9"
+rev = "07c047c449b959d8f76593046e139bae520d59c3"
 
 [workspace.dependencies.open_jtalk]
 git = "https://github.com/VOICEVOX/open_jtalk-rs.git"
diff --git a/README.md b/README.md
index 4024e9721..ae60f587b 100644
--- a/README.md
+++ b/README.md
@@ -150,10 +150,18 @@ model フォルダにある onnx モデルはダミーのため、ノイズの
 
 ```bash
 # DLLをビルド
-cargo build --release -p voicevox_core_c_api
+cargo build --release -p voicevox_core_c_api --features load-onnxruntime
 ```
 
-DLL 用のヘッダファイルは [crates/voicevox_core_c_api/include/voicevox_core.h](https://github.com/VOICEVOX/voicevox_core/tree/main/crates/voicevox_core_c_api/include/voicevox_core.h) にあります。
+DLL 用のヘッダファイルの雛形は [crates/voicevox_core_c_api/include/voicevox_core.h](https://github.com/VOICEVOX/voicevox_core/tree/main/crates/voicevox_core_c_api/include/voicevox_core.h) にあります。
+詳しくは[feature-options.md](./docs/feature-options.md)を参照してください。
+
+```bash
+# ヘッダファイルを加工し、マクロ`VOICEVOX_LOAD_ONNXRUNTIME`を定義
+sed 's:^//\(#define VOICEVOX_LOAD_ONNXRUNTIME\)$:\1:' \
+  crates/voicevox_core_c_api/include/voicevox_core.h \
+  > ./voicevox_core.h
+```
 
 ## コアライブラリのテスト
 
diff --git a/crates/test_util/Cargo.toml b/crates/test_util/Cargo.toml
index d113b57ce..fe0c2f6dd 100644
--- a/crates/test_util/Cargo.toml
+++ b/crates/test_util/Cargo.toml
@@ -13,6 +13,7 @@ anyhow.workspace = true
 tokio = { workspace = true, features = ["macros", "rt-multi-thread"] }
 bindgen.workspace = true
 camino.workspace = true
+cargo_metadata.workspace = true
 flate2.workspace = true
 fs-err.workspace = true
 indoc.workspace = true
@@ -20,6 +21,7 @@ serde = { workspace = true, features = ["derive"] }
 serde_json = { workspace = true, features = ["preserve_order"] }
 reqwest = { workspace = true, features = ["rustls-tls"] }
 tar.workspace = true
+voicevox-ort.workspace = true
 zip.workspace = true
 
 [lints.rust]
diff --git a/crates/test_util/build.rs b/crates/test_util/build.rs
index 79e3bc90e..3cdc88d78 100644
--- a/crates/test_util/build.rs
+++ b/crates/test_util/build.rs
@@ -6,6 +6,7 @@ use std::{
 
 use anyhow::{anyhow, ensure};
 use camino::{Utf8Path, Utf8PathBuf};
+use cargo_metadata::MetadataCommand;
 use flate2::read::GzDecoder;
 use indoc::formatdoc;
 use tar::Archive;
@@ -27,6 +28,8 @@ async fn main() -> anyhow::Result<()> {
         ensure!(dic_dir.exists(), "`{dic_dir}` does not exist");
     }
 
+    copy_onnxruntime(out_dir.as_ref(), dist)?;
+
     create_sample_voice_model_file(out_dir, dist)?;
 
     generate_example_data_json(dist.as_ref())?;
@@ -92,6 +95,35 @@ fn create_sample_voice_model_file(out_dir: &Utf8Path, dist: &Utf8Path) -> anyhow
     Ok(())
 }
 
+fn copy_onnxruntime(out_dir: &Path, dist: &Utf8Path) -> anyhow::Result<()> {
+    use std::env::consts::{DLL_PREFIX, DLL_SUFFIX};
+
+    let cargo_metadata::Metadata {
+        target_directory, ..
+    } = MetadataCommand::new()
+        .manifest_path(Path::new(env!("CARGO_MANIFEST_DIR")).join("Cargo.toml"))
+        .exec()?;
+
+    const VERSION: &str = ort::downloaded_version!();
+    let filename = &if cfg!(target_os = "linux") {
+        format!("libonnxruntime.so.{VERSION}")
+    } else if cfg!(any(target_os = "macos", target_os = "ios")) {
+        format!("libonnxruntime.{VERSION}.dylib")
+    } else {
+        format!("{DLL_PREFIX}onnxruntime{DLL_SUFFIX}")
+    };
+    let src = &target_directory.join("debug").join(filename);
+    let dst_dir = &dist.join("lib");
+    let dst = &dst_dir.join(filename);
+    fs_err::create_dir_all(dst_dir)?;
+    fs_err::copy(src, dst)?;
+    println!("cargo:rerun-if-changed={src}");
+
+    fs_err::write(out_dir.join("onnxruntime-dylib-path.txt"), dst.as_str())?;
+
+    Ok(())
+}
+
 /// OpenJTalkの辞書をダウンロードして展開する。
 async fn download_open_jtalk_dict(dist: &Path) -> anyhow::Result<()> {
     let download_url = format!(
@@ -187,6 +219,8 @@ fn generate_c_api_rs_bindings(out_dir: &Utf8Path) -> anyhow::Result<()> {
     bindgen::Builder::default()
         .header(C_BINDINGS_PATH)
         .header(ADDITIONAL_C_BINDINGS_PATH)
+        // we test for `--features load-onnxruntime`
+        .clang_arg("-DVOICEVOX_LOAD_ONNXRUNTIME=")
         .parse_callbacks(Box::new(bindgen::CargoCallbacks::new()))
         .dynamic_library_name("CApi")
         .generate()?
diff --git a/crates/test_util/src/lib.rs b/crates/test_util/src/lib.rs
index f234d7f76..6473e438e 100644
--- a/crates/test_util/src/lib.rs
+++ b/crates/test_util/src/lib.rs
@@ -23,6 +23,9 @@ pub use self::typing::{
     DecodeExampleData, DurationExampleData, ExampleData, IntonationExampleData,
 };
 
+pub const ONNXRUNTIME_DYLIB_PATH: &str =
+    include_str!(concat!(env!("OUT_DIR"), "/onnxruntime-dylib-path.txt"));
+
 pub const OPEN_JTALK_DIC_DIR: &str = concat!(
     env!("CARGO_MANIFEST_DIR"),
     "/data/open_jtalk_dic_utf_8-1.11"
diff --git a/crates/voicevox_core/Cargo.toml b/crates/voicevox_core/Cargo.toml
index 9957c1373..527fa7494 100644
--- a/crates/voicevox_core/Cargo.toml
+++ b/crates/voicevox_core/Cargo.toml
@@ -4,8 +4,18 @@ version.workspace = true
 edition.workspace = true
 publish.workspace = true
 
+[package.metadata.docs.rs]
+features = ["load-onnxruntime", "link-onnxruntime"]
+rustdoc-args = ["--cfg", "docsrs"]
+
 [features]
 default = []
+
+# ONNX Runtimeのリンク方法を決めるフィーチャ（rustdocを参照）。
+load-onnxruntime = ["voicevox-ort/load-dynamic"]
+link-onnxruntime = []
+
+# GPUを利用可能にするフィーチャ（rustdocを参照）。
 cuda = ["voicevox-ort/cuda"]
 directml = ["voicevox-ort/directml"]
 
@@ -13,6 +23,7 @@ directml = ["voicevox-ort/directml"]
 anyhow.workspace = true
 async_zip = { workspace = true, features = ["deflate"] }
 camino.workspace = true
+const_format.workspace = true
 derive-getters.workspace = true
 derive-new.workspace = true
 derive_more.workspace = true
@@ -30,6 +41,7 @@ once_cell.workspace = true
 open_jtalk.workspace = true
 ouroboros.workspace = true
 rayon.workspace = true
+ref-cast.workspace = true
 regex.workspace = true
 serde = { workspace = true, features = ["derive", "rc"] }
 serde_json = { workspace = true, features = ["preserve_order"] }
@@ -41,8 +53,8 @@ thiserror.workspace = true
 tokio = { workspace = true, features = ["rt"] } # FIXME: feature-gateする
 tracing.workspace = true
 uuid = { workspace = true, features = ["v4", "serde"] }
+voicevox-ort = { workspace = true, features = ["download-binaries", "__init-for-voicevox"] }
 voicevox_core_macros = { path = "../voicevox_core_macros" }
-voicevox-ort = { workspace = true, features = ["ndarray", "download-binaries"] }
 zip.workspace = true
 
 [dev-dependencies]
@@ -51,7 +63,7 @@ pretty_assertions.workspace = true
 rstest.workspace = true
 rstest_reuse.workspace = true
 test_util.workspace = true
-tokio = { workspace = true, features = ["rt", "macros"] }
+tokio = { workspace = true, features = ["rt-multi-thread", "macros"] }
 
 [target."cfg(windows)".dependencies]
 humansize.workspace = true
diff --git a/crates/voicevox_core/src/__internal/doctest_fixtures.rs b/crates/voicevox_core/src/__internal/doctest_fixtures.rs
index f314845fe..8f45cba73 100644
--- a/crates/voicevox_core/src/__internal/doctest_fixtures.rs
+++ b/crates/voicevox_core/src/__internal/doctest_fixtures.rs
@@ -1,4 +1,4 @@
-use std::path::Path;
+use std::{ffi::OsString, path::Path};
 
 use camino::Utf8Path;
 
@@ -6,9 +6,19 @@ use crate::{AccelerationMode, InitializeOptions};
 
 pub async fn synthesizer_with_sample_voice_model(
     voice_model_path: impl AsRef<Path>,
+    #[cfg_attr(feature = "link-onnxruntime", allow(unused_variables))] onnxruntime_dylib_path: impl Into<
+        OsString,
+    >,
     open_jtalk_dic_dir: impl AsRef<Utf8Path>,
 ) -> anyhow::Result<crate::tokio::Synthesizer<crate::tokio::OpenJtalk>> {
     let syntesizer = crate::tokio::Synthesizer::new(
+        #[cfg(feature = "load-onnxruntime")]
+        crate::tokio::Onnxruntime::load_once()
+            .filename(onnxruntime_dylib_path)
+            .exec()
+            .await?,
+        #[cfg(feature = "link-onnxruntime")]
+        crate::tokio::Onnxruntime::init_once().await?,
         crate::tokio::OpenJtalk::new(open_jtalk_dic_dir).await?,
         &InitializeOptions {
             acceleration_mode: AccelerationMode::Cpu,
diff --git a/crates/voicevox_core/src/blocking.rs b/crates/voicevox_core/src/blocking.rs
index aa600c598..8d0bc2129 100644
--- a/crates/voicevox_core/src/blocking.rs
+++ b/crates/voicevox_core/src/blocking.rs
@@ -1,6 +1,13 @@
 //! ブロッキング版API。
 
 pub use crate::{
-    engine::open_jtalk::blocking::OpenJtalk, synthesizer::blocking::Synthesizer,
-    user_dict::dict::blocking::UserDict, voice_model::blocking::VoiceModel,
+    engine::open_jtalk::blocking::OpenJtalk, infer::runtimes::onnxruntime::blocking::Onnxruntime,
+    synthesizer::blocking::Synthesizer, user_dict::dict::blocking::UserDict,
+    voice_model::blocking::VoiceModel,
 };
+
+pub mod onnxruntime {
+    #[cfg(feature = "load-onnxruntime")]
+    #[cfg_attr(docsrs, doc(cfg(feature = "load-onnxruntime")))]
+    pub use crate::infer::runtimes::onnxruntime::blocking::LoadOnce;
+}
diff --git a/crates/voicevox_core/src/devices.rs b/crates/voicevox_core/src/devices.rs
index 54b3de2f7..140105962 100644
--- a/crates/voicevox_core/src/devices.rs
+++ b/crates/voicevox_core/src/devices.rs
@@ -1,8 +1,6 @@
 use derive_getters::Getters;
 use serde::{Deserialize, Serialize};
 
-use crate::{infer::InferenceRuntime, synthesizer::InferenceRuntimeImpl, Result};
-
 /// このライブラリで利用可能なデバイスの情報。
 ///
 /// あくまで本ライブラリが対応しているデバイスの情報であることに注意。GPUが使える環境ではなかったと
@@ -30,37 +28,7 @@ pub struct SupportedDevices {
 }
 
 impl SupportedDevices {
-    /// `SupportedDevices`をコンストラクトする。
-    ///
-    /// # Example
-    ///
-    #[cfg_attr(windows, doc = "```no_run")] // https://github.com/VOICEVOX/voicevox_core/issues/537
-    #[cfg_attr(not(windows), doc = "```")]
-    /// use voicevox_core::SupportedDevices;
-    ///
-    /// let supported_devices = SupportedDevices::create()?;
-    /// #
-    /// # Result::<_, anyhow::Error>::Ok(())
-    /// ```
-    pub fn create() -> Result<Self> {
-        <InferenceRuntimeImpl as InferenceRuntime>::supported_devices()
-    }
-
     pub fn to_json(&self) -> serde_json::Value {
         serde_json::to_value(self).expect("should not fail")
     }
 }
-
-#[cfg(test)]
-mod tests {
-    use rstest::rstest;
-
-    use super::SupportedDevices;
-
-    #[rstest]
-    fn supported_devices_create_works() {
-        let result = SupportedDevices::create();
-        // 環境によって結果が変わるので、関数呼び出しが成功するかどうかの確認のみ行う
-        assert!(result.is_ok(), "{result:?}");
-    }
-}
diff --git a/crates/voicevox_core/src/error.rs b/crates/voicevox_core/src/error.rs
index 916964429..d0e7fced0 100644
--- a/crates/voicevox_core/src/error.rs
+++ b/crates/voicevox_core/src/error.rs
@@ -34,6 +34,7 @@ impl Error {
         match &self.0 {
             ErrorRepr::NotLoadedOpenjtalkDict => ErrorKind::NotLoadedOpenjtalkDict,
             ErrorRepr::GpuSupport => ErrorKind::GpuSupport,
+            ErrorRepr::InitInferenceRuntime { .. } => ErrorKind::InitInferenceRuntime,
             ErrorRepr::LoadModel(LoadModelError { context, .. }) => match context {
                 LoadModelErrorKind::OpenZipFile => ErrorKind::OpenZipFile,
                 LoadModelErrorKind::ReadZipEntry { .. } => ErrorKind::ReadZipEntry,
@@ -65,6 +66,13 @@ pub(crate) enum ErrorRepr {
     #[error("GPU機能をサポートすることができません")]
     GpuSupport,
 
+    #[error("{runtime_display_name}のロードまたは初期化ができませんでした")]
+    InitInferenceRuntime {
+        runtime_display_name: &'static str,
+        #[source]
+        source: anyhow::Error,
+    },
+
     #[error(transparent)]
     LoadModel(#[from] LoadModelError),
 
@@ -119,6 +127,8 @@ pub enum ErrorKind {
     NotLoadedOpenjtalkDict,
     /// GPUモードがサポートされていない。
     GpuSupport,
+    /// 推論ライブラリのロードまたは初期化ができなかった。
+    InitInferenceRuntime,
     /// ZIPファイルを開くことに失敗した。
     OpenZipFile,
     /// ZIP内のファイルが読めなかった。
diff --git a/crates/voicevox_core/src/infer.rs b/crates/voicevox_core/src/infer.rs
index c2cad1d7d..cffd0d524 100644
--- a/crates/voicevox_core/src/infer.rs
+++ b/crates/voicevox_core/src/infer.rs
@@ -18,10 +18,12 @@ pub(crate) trait InferenceRuntime: 'static {
     type Session: Sized + Send + 'static;
     type RunContext<'a>: From<&'a mut Self::Session> + PushInputTensor;
 
-    fn supported_devices() -> crate::Result<SupportedDevices>;
+    /// このライブラリで利用可能なデバイスの情報を取得する。
+    fn supported_devices(&self) -> crate::Result<SupportedDevices>;
 
     #[allow(clippy::type_complexity)]
     fn new_session(
+        &self,
         model: impl FnOnce() -> std::result::Result<Vec<u8>, DecryptModelError>,
         options: InferenceSessionOptions,
     ) -> anyhow::Result<(
diff --git a/crates/voicevox_core/src/infer/runtimes.rs b/crates/voicevox_core/src/infer/runtimes.rs
index 7934027b6..e9d3d31c4 100644
--- a/crates/voicevox_core/src/infer/runtimes.rs
+++ b/crates/voicevox_core/src/infer/runtimes.rs
@@ -1,3 +1 @@
-mod onnxruntime;
-
-pub(crate) use self::onnxruntime::Onnxruntime;
+pub(crate) mod onnxruntime;
diff --git a/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs b/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs
index f8f376837..74dc8a601 100644
--- a/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs
+++ b/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs
@@ -15,17 +15,14 @@ use super::super::{
     OutputScalarKind, OutputTensor, ParamInfo, PushInputTensor,
 };
 
-#[derive(Clone, Copy, PartialEq, Eq, PartialOrd, Ord, Hash, Debug)]
-pub(crate) enum Onnxruntime {}
-
-impl InferenceRuntime for Onnxruntime {
+// TODO: `trait AsyncRuntime`みたいなものを作って抽象化しながら同期版と非同期版に別個の役割を
+// 持たせる
+// （なぜそうしたいかの理由の一つとしては<https://github.com/VOICEVOX/voicevox_core/issues/687>）
+impl InferenceRuntime for self::blocking::Onnxruntime {
     type Session = ort::Session;
     type RunContext<'a> = OnnxruntimeRunContext<'a>;
 
-    fn supported_devices() -> crate::Result<SupportedDevices> {
-        // TODO: `InferenceRuntime::init`と`InitInferenceRuntimeError`を作る
-        build_ort_env_once().unwrap();
-
+    fn supported_devices(&self) -> crate::Result<SupportedDevices> {
         (|| {
             let cpu = CPUExecutionProvider::default().is_available()?;
             let cuda = CUDAExecutionProvider::default().is_available()?;
@@ -44,6 +41,7 @@ impl InferenceRuntime for Onnxruntime {
     }
 
     fn new_session(
+        &self,
         model: impl FnOnce() -> std::result::Result<Vec<u8>, DecryptModelError>,
         options: InferenceSessionOptions,
     ) -> anyhow::Result<(
@@ -51,9 +49,6 @@ impl InferenceRuntime for Onnxruntime {
         Vec<ParamInfo<InputScalarKind>>,
         Vec<ParamInfo<OutputScalarKind>>,
     )> {
-        // TODO: `InferenceRuntime::init`と`InitInferenceRuntimeError`を作る
-        build_ort_env_once().unwrap();
-
         let mut builder = ort::Session::builder()?
             .with_optimization_level(GraphOptimizationLevel::Level1)?
             .with_intra_threads(options.cpu_num_threads.into())?;
@@ -181,12 +176,6 @@ impl InferenceRuntime for Onnxruntime {
     }
 }
 
-fn build_ort_env_once() -> ort::Result<()> {
-    static ONCE: once_cell::sync::OnceCell<()> = once_cell::sync::OnceCell::new();
-    ONCE.get_or_try_init(|| ort::init().with_name(env!("CARGO_PKG_NAME")).commit())?;
-    Ok(())
-}
-
 pub(crate) struct OnnxruntimeRunContext<'sess> {
     sess: &'sess ort::Session,
     inputs: Vec<ort::SessionInputValue<'static>>,
@@ -225,3 +214,365 @@ impl PushInputTensor for OnnxruntimeRunContext<'_> {
         self.push_input(tensor)
     }
 }
+
+pub(crate) mod blocking {
+    use ort::EnvHandle;
+    use ref_cast::{ref_cast_custom, RefCastCustom};
+
+    use crate::{error::ErrorRepr, SupportedDevices};
+
+    use super::super::super::InferenceRuntime;
+
+    /// ONNX Runtime。
+    ///
+    /// シングルトンであり、インスタンスは高々一つ。
+    ///
+    /// # Rust APIにおけるインスタンスの共有
+    ///
+    /// インスタンスは[voicevox-ort]側に作られる。Rustのクレートとしてこのライブラリを利用する場合、
+    /// Tokio版APIやvoicevox-ortを利用する他クレートともインスタンスが共有される。
+    ///
+    #[cfg_attr(feature = "load-onnxruntime", doc = "```")]
+    #[cfg_attr(not(feature = "load-onnxruntime"), doc = "```compile_fail")]
+    /// # use voicevox_core as another_lib;
+    /// #
+    /// # fn main() -> anyhow::Result<()> {
+    /// # if cfg!(windows) {
+    /// #     // Windows\System32\onnxruntime.dllを回避
+    /// #     voicevox_core::blocking::Onnxruntime::load_once()
+    /// #         .filename(test_util::ONNXRUNTIME_DYLIB_PATH)
+    /// #         .exec()?;
+    /// # }
+    /// let ort1 = voicevox_core::blocking::Onnxruntime::load_once().exec()?;
+    /// let ort2 = another_lib::tokio::Onnxruntime::get().expect("`ort1`と同一のはず");
+    /// assert_eq!(ptr_addr(ort1), ptr_addr(ort2));
+    ///
+    /// fn ptr_addr(obj: &impl Sized) -> usize {
+    ///     obj as *const _ as _
+    /// }
+    /// # Ok(())
+    /// # }
+    /// ```
+    ///
+    /// [voicevox-ort]: https://github.com/VOICEVOX/ort
+    #[derive(Debug, RefCastCustom)]
+    #[repr(transparent)]
+    pub struct Onnxruntime {
+        _inner: EnvHandle,
+    }
+
+    impl Onnxruntime {
+        /// ONNX Runtimeのライブラリ名。
+        #[cfg(feature = "load-onnxruntime")]
+        #[cfg_attr(docsrs, doc(cfg(feature = "load-onnxruntime")))]
+        pub const LIB_NAME: &'static str = "onnxruntime";
+
+        /// 推奨されるONNX Runtimeのバージョン。
+        #[cfg(feature = "load-onnxruntime")]
+        #[cfg_attr(docsrs, doc(cfg(feature = "load-onnxruntime")))]
+        pub const LIB_VERSION: &'static str = ort::downloaded_version!();
+
+        /// [`LIB_NAME`]と[`LIB_VERSION`]からなる動的ライブラリのファイル名。
+        ///
+        /// WindowsとAndroidでは[`LIB_UNVERSIONED_FILENAME`]と同じ。
+        ///
+        /// [`LIB_NAME`]: Self::LIB_NAME
+        /// [`LIB_VERSION`]: Self::LIB_VERSION
+        /// [`LIB_UNVERSIONED_FILENAME`]: Self::LIB_UNVERSIONED_FILENAME
+        #[cfg(feature = "load-onnxruntime")]
+        #[cfg_attr(docsrs, doc(cfg(feature = "load-onnxruntime")))]
+        pub const LIB_VERSIONED_FILENAME: &'static str = if cfg!(target_os = "linux") {
+            const_format::concatcp!(
+                "lib",
+                Onnxruntime::LIB_NAME,
+                ".so.",
+                Onnxruntime::LIB_VERSION,
+            )
+        } else if cfg!(any(target_os = "macos", target_os = "ios")) {
+            const_format::concatcp!(
+                "lib",
+                Onnxruntime::LIB_NAME,
+                ".",
+                Onnxruntime::LIB_VERSION,
+                ".dylib",
+            )
+        } else {
+            Self::LIB_UNVERSIONED_FILENAME
+        };
+
+        /// [`LIB_NAME`]からなる動的ライブラリのファイル名。
+        ///
+        /// [`LIB_NAME`]: Self::LIB_NAME
+        #[cfg(feature = "load-onnxruntime")]
+        #[cfg_attr(docsrs, doc(cfg(feature = "load-onnxruntime")))]
+        pub const LIB_UNVERSIONED_FILENAME: &'static str = const_format::concatcp!(
+            std::env::consts::DLL_PREFIX,
+            Onnxruntime::LIB_NAME,
+            std::env::consts::DLL_SUFFIX,
+        );
+
+        #[ref_cast_custom]
+        const fn new(inner: &EnvHandle) -> &Self;
+
+        /// インスタンスが既に作られているならそれを得る。
+        ///
+        /// 作られていなければ`None`を返す。
+        pub fn get() -> Option<&'static Self> {
+            EnvHandle::get().map(Self::new)
+        }
+
+        fn once(
+            init: impl FnOnce() -> anyhow::Result<&'static EnvHandle>,
+        ) -> crate::Result<&'static Self> {
+            let inner = init().map_err(|source| ErrorRepr::InitInferenceRuntime {
+                runtime_display_name: "ONNX Runtime",
+                source,
+            })?;
+            Ok(Self::new(inner))
+        }
+
+        /// ONNX Runtimeをロードして初期化する。
+        ///
+        /// 一度成功したら、以後は引数を無視して同じ参照を返す。
+        #[cfg(feature = "load-onnxruntime")]
+        #[cfg_attr(docsrs, doc(cfg(feature = "load-onnxruntime")))]
+        pub fn load_once() -> LoadOnce {
+            LoadOnce::default()
+        }
+
+        /// ONNX Runtimeを初期化する。
+        ///
+        /// 一度成功したら以後は同じ参照を返す。
+        #[cfg(feature = "link-onnxruntime")]
+        #[cfg_attr(docsrs, doc(cfg(feature = "link-onnxruntime")))]
+        pub fn init_once() -> crate::Result<&'static Self> {
+            Self::once(|| ort::try_init(None))
+        }
+
+        #[cfg(test)]
+        pub(crate) fn from_test_util_data() -> anyhow::Result<&'static Self> {
+            #[cfg(feature = "load-onnxruntime")]
+            {
+                Self::load_once()
+                    .filename(test_util::ONNXRUNTIME_DYLIB_PATH)
+                    .exec()
+                    .map_err(Into::into)
+            }
+
+            #[cfg(feature = "link-onnxruntime")]
+            {
+                Self::init_once().map_err(Into::into)
+            }
+        }
+
+        /// このライブラリで利用可能なデバイスの情報を取得する。
+        pub fn supported_devices(&self) -> crate::Result<SupportedDevices> {
+            <Self as InferenceRuntime>::supported_devices(self)
+        }
+    }
+
+    /// [`Onnxruntime::load_once`]のビルダー。
+    #[cfg(feature = "load-onnxruntime")]
+    pub struct LoadOnce {
+        filename: std::ffi::OsString,
+    }
+
+    #[cfg(feature = "load-onnxruntime")]
+    impl Default for LoadOnce {
+        fn default() -> Self {
+            let filename = Onnxruntime::LIB_VERSIONED_FILENAME.into();
+            Self { filename }
+        }
+    }
+
+    #[cfg(feature = "load-onnxruntime")]
+    impl LoadOnce {
+        /// ONNX Runtimeのファイル名（モジュール名）もしくはファイルパスを指定する。
+        ///
+        /// `dlopen`/[`LoadLibraryExW`]の引数に使われる。デフォルト
+        /// は[`Onnxruntime::LIB_VERSIONED_FILENAME`]。
+        ///
+        /// [`LoadLibraryExW`]:
+        /// https://learn.microsoft.com/en-us/windows/win32/api/libloaderapi/nf-libloaderapi-loadlibraryexw
+        pub fn filename(mut self, filename: impl Into<std::ffi::OsString>) -> Self {
+            self.filename = filename.into();
+            self
+        }
+
+        /// 実行する。
+        pub fn exec(self) -> crate::Result<&'static Onnxruntime> {
+            Onnxruntime::once(|| ort::try_init_from(&self.filename, None))
+        }
+    }
+}
+
+pub(crate) mod tokio {
+    use ref_cast::{ref_cast_custom, RefCastCustom};
+
+    use crate::SupportedDevices;
+
+    /// ONNX Runtime。
+    ///
+    /// シングルトンであり、インスタンスは高々一つ。
+    ///
+    /// # Rust APIにおけるインスタンスの共有
+    ///
+    /// インスタンスは[voicevox-ort]側に作られる。Rustのクレートとしてこのライブラリを利用する場合、
+    /// ブロッキング版APIやvoicevox-ortを利用する他クレートともインスタンスが共有される。
+    ///
+    #[cfg_attr(feature = "load-onnxruntime", doc = "```")]
+    #[cfg_attr(not(feature = "load-onnxruntime"), doc = "```compile_fail")]
+    /// # use voicevox_core as another_lib;
+    /// #
+    /// # #[tokio::main]
+    /// # async fn main() -> anyhow::Result<()> {
+    /// # if cfg!(windows) {
+    /// #     // Windows\System32\onnxruntime.dllを回避
+    /// #     voicevox_core::blocking::Onnxruntime::load_once()
+    /// #         .filename(test_util::ONNXRUNTIME_DYLIB_PATH)
+    /// #         .exec()?;
+    /// # }
+    /// let ort1 = voicevox_core::tokio::Onnxruntime::load_once().exec().await?;
+    /// let ort2 = another_lib::blocking::Onnxruntime::get().expect("`ort1`と同一のはず");
+    /// assert_eq!(ptr_addr(ort1), ptr_addr(ort2));
+    ///
+    /// fn ptr_addr(obj: &impl Sized) -> usize {
+    ///     obj as *const _ as _
+    /// }
+    /// # Ok(())
+    /// # }
+    /// ```
+    ///
+    /// [voicevox-ort]: https://github.com/VOICEVOX/ort
+    #[derive(Debug, RefCastCustom)]
+    #[repr(transparent)]
+    pub struct Onnxruntime(pub(crate) super::blocking::Onnxruntime);
+
+    impl Onnxruntime {
+        /// ONNX Runtimeのライブラリ名。
+        #[cfg(feature = "load-onnxruntime")]
+        #[cfg_attr(docsrs, doc(cfg(feature = "load-onnxruntime")))]
+        // ブロッキング版と等しいことはテストで担保
+        pub const LIB_NAME: &'static str = "onnxruntime";
+
+        /// 推奨されるONNX Runtimeのバージョン。
+        #[cfg(feature = "load-onnxruntime")]
+        #[cfg_attr(docsrs, doc(cfg(feature = "load-onnxruntime")))]
+        // ブロッキング版と等しいことはテストで担保
+        pub const LIB_VERSION: &'static str = ort::downloaded_version!();
+
+        /// [`LIB_NAME`]と[`LIB_VERSION`]からなる動的ライブラリのファイル名。
+        ///
+        /// WindowsとAndroidでは[`LIB_UNVERSIONED_FILENAME`]と同じ。
+        ///
+        /// [`LIB_NAME`]: Self::LIB_NAME
+        /// [`LIB_VERSION`]: Self::LIB_VERSION
+        /// [`LIB_UNVERSIONED_FILENAME`]: Self::LIB_UNVERSIONED_FILENAME
+        #[cfg(feature = "load-onnxruntime")]
+        #[cfg_attr(docsrs, doc(cfg(feature = "load-onnxruntime")))]
+        pub const LIB_VERSIONED_FILENAME: &'static str =
+            super::blocking::Onnxruntime::LIB_VERSIONED_FILENAME;
+
+        /// [`LIB_NAME`]からなる動的ライブラリのファイル名。
+        ///
+        /// [`LIB_NAME`]: Self::LIB_NAME
+        #[cfg(feature = "load-onnxruntime")]
+        #[cfg_attr(docsrs, doc(cfg(feature = "load-onnxruntime")))]
+        pub const LIB_UNVERSIONED_FILENAME: &'static str =
+            super::blocking::Onnxruntime::LIB_UNVERSIONED_FILENAME;
+
+        #[ref_cast_custom]
+        pub(crate) const fn from_blocking(blocking: &super::blocking::Onnxruntime) -> &Self;
+
+        /// インスタンスが既に作られているならそれを得る。
+        ///
+        /// 作られていなければ`None`を返す。
+        pub fn get() -> Option<&'static Self> {
+            super::blocking::Onnxruntime::get().map(Self::from_blocking)
+        }
+
+        /// ONNX Runtimeをロードして初期化する。
+        ///
+        /// 一度成功したら、以後は引数を無視して同じ参照を返す。
+        #[cfg(feature = "load-onnxruntime")]
+        #[cfg_attr(docsrs, doc(cfg(feature = "load-onnxruntime")))]
+        pub fn load_once() -> LoadOnce {
+            LoadOnce::default()
+        }
+
+        /// ONNX Runtimeを初期化する。
+        ///
+        /// 一度成功したら以後は同じ参照を返す。
+        #[cfg(feature = "link-onnxruntime")]
+        #[cfg_attr(docsrs, doc(cfg(feature = "link-onnxruntime")))]
+        pub async fn init_once() -> crate::Result<&'static Self> {
+            let inner = crate::task::asyncify(super::blocking::Onnxruntime::init_once).await?;
+            Ok(Self::from_blocking(inner))
+        }
+
+        #[cfg(test)]
+        pub(crate) async fn from_test_util_data() -> anyhow::Result<&'static Self> {
+            crate::task::asyncify(super::blocking::Onnxruntime::from_test_util_data)
+                .await
+                .map(Self::from_blocking)
+        }
+
+        /// このライブラリで利用可能なデバイスの情報を取得する。
+        pub fn supported_devices(&self) -> crate::Result<SupportedDevices> {
+            self.0.supported_devices()
+        }
+    }
+
+    /// [`Onnxruntime::load_once`]のビルダー。
+    #[cfg(feature = "load-onnxruntime")]
+    #[derive(Default)]
+    pub struct LoadOnce(super::blocking::LoadOnce);
+
+    #[cfg(feature = "load-onnxruntime")]
+    impl LoadOnce {
+        /// ONNX Runtimeのファイル名（モジュール名）もしくはファイルパスを指定する。
+        ///
+        /// `dlopen`/[`LoadLibraryExW`]の引数に使われる。デフォルト
+        /// は[`Onnxruntime::LIB_VERSIONED_FILENAME`]。
+        ///
+        /// [`LoadLibraryExW`]:
+        /// https://learn.microsoft.com/en-us/windows/win32/api/libloaderapi/nf-libloaderapi-loadlibraryexw
+        pub fn filename(self, filename: impl Into<std::ffi::OsString>) -> Self {
+            Self(self.0.filename(filename))
+        }
+
+        /// 実行する。
+        pub async fn exec(self) -> crate::Result<&'static Onnxruntime> {
+            let inner = crate::task::asyncify(|| self.0.exec()).await?;
+            Ok(Onnxruntime::from_blocking(inner))
+        }
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use rstest::rstest;
+
+    #[cfg(feature = "load-onnxruntime")]
+    #[test]
+    fn assert_same_lib_names_and_versions() {
+        use pretty_assertions::assert_eq;
+
+        assert_eq!(
+            super::blocking::Onnxruntime::LIB_NAME,
+            super::tokio::Onnxruntime::LIB_NAME,
+        );
+        assert_eq!(
+            super::blocking::Onnxruntime::LIB_VERSION,
+            super::tokio::Onnxruntime::LIB_VERSION,
+        );
+    }
+
+    #[rstest]
+    fn supported_devices_works() {
+        let result = super::blocking::Onnxruntime::from_test_util_data()
+            .and_then(|o| o.supported_devices().map_err(Into::into));
+        // 環境によって結果が変わるので、関数呼び出しが成功するかどうかの確認のみ行う
+        assert!(result.is_ok(), "{result:?}");
+    }
+}
diff --git a/crates/voicevox_core/src/infer/session_set.rs b/crates/voicevox_core/src/infer/session_set.rs
index cdd179680..95f081bac 100644
--- a/crates/voicevox_core/src/infer/session_set.rs
+++ b/crates/voicevox_core/src/infer/session_set.rs
@@ -17,6 +17,7 @@ pub(crate) struct InferenceSessionSet<R: InferenceRuntime, D: InferenceDomain>(
 
 impl<R: InferenceRuntime, D: InferenceDomain> InferenceSessionSet<R, D> {
     pub(crate) fn new(
+        rt: &R,
         model_bytes: &EnumMap<D::Operation, Vec<u8>>,
         options: &EnumMap<D::Operation, InferenceSessionOptions>,
     ) -> anyhow::Result<Self> {
@@ -27,7 +28,7 @@ impl<R: InferenceRuntime, D: InferenceDomain> InferenceSessionSet<R, D> {
                     <D::Operation as InferenceOperation>::PARAM_INFOS[op];
 
                 let (sess, actual_input_param_infos, actual_output_param_infos) =
-                    R::new_session(|| model_file::decrypt(model_bytes), options[op])?;
+                    rt.new_session(|| model_file::decrypt(model_bytes), options[op])?;
 
                 check_param_infos(expected_input_param_infos, &actual_input_param_infos)?;
                 check_param_infos(expected_output_param_infos, &actual_output_param_infos)?;
diff --git a/crates/voicevox_core/src/lib.rs b/crates/voicevox_core/src/lib.rs
index 0f34c5962..910f9eeef 100644
--- a/crates/voicevox_core/src/lib.rs
+++ b/crates/voicevox_core/src/lib.rs
@@ -1,4 +1,66 @@
 //! 無料で使える中品質なテキスト読み上げソフトウェア、VOICEVOXのコア。
+//!
+//! # Feature flags
+//!
+//! ## ONNX Runtimeのリンク方法を決めるフィーチャ
+//!
+//! このクレートの利用にあたっては以下の二つの[Cargoフィーチャ]のうちどちらかを有効にしなければなり
+//! ません。両方の有効化はコンパイルエラーとなります。[`Onnxruntime`]の初期化方法はこれらの
+//! フィーチャによって決まります。
+//!
+//! - **`load-onnxruntime`**: ONNX Runtimeを`dlopen`/`LoadLibraryExW`で開きます。
+//! - **`link-onnxruntime`**: ONNX Runtimeをロード時動的リンクします。iOSのような`dlopen`の利用が
+//!     困難な環境でのみこちらを利用するべきです。_Note_:
+//!     [動的リンク対象のライブラリ名]は`onnxruntime`で固定です。変更
+//!     は`patchelf(1)`や`install_name_tool(1)`で行ってください。
+//!
+//! ## GPUを利用可能にするフィーチャ
+//!
+//! - **`cuda`**
+//! - **`directml`**
+// TODO: こんな感じ(↓)で書く
+////! - **`cuda`**: [CUDAを用いた機械学習推論]を可能にします。
+////!     - ❗ <code>[acceleration\_mode]={Gpu,Auto}</code>のときの挙動が変化します。`directml`と共に
+////!         有効化したときの挙動は未規定です。
+////! - **`directml`**: [DirectMLを用いた機械学習推論]を可能にします。
+////!     - ❗ 〃
+////!
+////! [CUDAを用いた機械学習推論]:
+////! https://onnxruntime.ai/docs/execution-providers/CUDA-ExecutionProvider.html
+////! [DirectMLを用いた機械学習推論]:
+////! https://onnxruntime.ai/docs/execution-providers/DirectML-ExecutionProvider.html
+////! [acceleration\_mode]: InitializeOptions::acceleration_mode
+//!
+//! [Cargoフィーチャ]: https://doc.rust-lang.org/stable/cargo/reference/features.html
+//! [動的リンク対象のライブラリ名]:
+//! https://doc.rust-lang.org/cargo/reference/build-scripts.html#rustc-link-lib
+//! [`Onnxruntime`]: blocking::Onnxruntime
+
+#![cfg_attr(docsrs, feature(doc_cfg))]
+
+#[cfg(not(any(feature = "load-onnxruntime", feature = "link-onnxruntime")))]
+compile_error!("either `load-onnxruntime` or `link-onnxruntime` must be enabled");
+
+#[cfg(not(doc))]
+const _: () = {
+    #[cfg(all(feature = "load-onnxruntime", feature = "link-onnxruntime"))]
+    compile_error!("`load-onnxruntime` and `link-onnxruntime` cannot be enabled at the same time");
+
+    // Rust APIでvoicevox-ortを他のクレートが利用する可能性を考え、voicevox-ort側とfeatureがズレ
+    // ないようにする
+
+    #[cfg(feature = "load-onnxruntime")]
+    ort::assert_feature!(
+        cfg(feature = "load-dynamic"),
+        "when `load-onnxruntime` is enabled,`voicevox-ort/load-dynamic` must be also enabled",
+    );
+
+    #[cfg(feature = "link-onnxruntime")]
+    ort::assert_feature!(
+        cfg(not(feature = "load-dynamic")),
+        "when `link-onnxruntime` is enabled,`voicevox-ort/load-dynamic` must be disabled",
+    );
+};
 
 mod devices;
 /// cbindgen:ignore
diff --git a/crates/voicevox_core/src/status.rs b/crates/voicevox_core/src/status.rs
index f590e18f4..475031f1c 100644
--- a/crates/voicevox_core/src/status.rs
+++ b/crates/voicevox_core/src/status.rs
@@ -21,13 +21,18 @@ use crate::{
 };
 
 pub(crate) struct Status<R: InferenceRuntime> {
+    pub(crate) rt: &'static R,
     loaded_models: std::sync::Mutex<LoadedModels<R>>,
     session_options: InferenceDomainMap<SessionOptionsByDomain>,
 }
 
 impl<R: InferenceRuntime> Status<R> {
-    pub(crate) fn new(session_options: InferenceDomainMap<SessionOptionsByDomain>) -> Self {
+    pub(crate) fn new(
+        rt: &'static R,
+        session_options: InferenceDomainMap<SessionOptionsByDomain>,
+    ) -> Self {
         Self {
+            rt,
             loaded_models: Default::default(),
             session_options,
         }
@@ -44,7 +49,7 @@ impl<R: InferenceRuntime> Status<R> {
             .ensure_acceptable(model_header)?;
 
         let session_sets_with_inner_ids = model_contents
-            .create_session_sets(&self.session_options)
+            .create_session_sets(self.rt, &self.session_options)
             .map_err(|source| LoadModelError {
                 path: model_header.path.clone(),
                 context: LoadModelErrorKind::InvalidModelData,
@@ -310,6 +315,7 @@ impl<R: InferenceRuntime> InferenceDomainMap<SessionSetsWithInnerVoiceIdsByDomai
 impl InferenceDomainMap<ModelBytesWithInnerVoiceIdsByDomain> {
     fn create_session_sets<R: InferenceRuntime>(
         &self,
+        rt: &R,
         session_options: &InferenceDomainMap<SessionOptionsByDomain>,
     ) -> anyhow::Result<InferenceDomainMap<SessionSetsWithInnerVoiceIdsByDomain<R>>> {
         duplicate! {
@@ -321,7 +327,7 @@ impl InferenceDomainMap<ModelBytesWithInnerVoiceIdsByDomain> {
                 .field
                 .as_ref()
                 .map(|(inner_voice_ids, model_bytes)| {
-                    let session_set = InferenceSessionSet::new(model_bytes, &session_options.field)?;
+                    let session_set = InferenceSessionSet::new(rt, model_bytes, &session_options.field)?;
                     Ok::<_, anyhow::Error>((inner_voice_ids.clone(), session_set))
                 })
                 .transpose()?;
@@ -348,7 +354,6 @@ mod tests {
             InferenceSessionOptions,
         },
         macros::tests::assert_debug_fmt_eq,
-        synthesizer::InferenceRuntimeImpl,
     };
 
     use super::Status;
@@ -371,7 +376,10 @@ mod tests {
                 TalkOperation::Decode => heavy_session_options,
             },
         };
-        let status = Status::<InferenceRuntimeImpl>::new(session_options);
+        let status = Status::new(
+            crate::blocking::Onnxruntime::from_test_util_data().unwrap(),
+            session_options,
+        );
 
         assert_eq!(
             light_session_options,
@@ -392,9 +400,12 @@ mod tests {
     #[rstest]
     #[tokio::test]
     async fn status_load_model_works() {
-        let status = Status::<InferenceRuntimeImpl>::new(InferenceDomainMap {
-            talk: enum_map!(_ => InferenceSessionOptions::new(0, false)),
-        });
+        let status = Status::new(
+            crate::blocking::Onnxruntime::from_test_util_data().unwrap(),
+            InferenceDomainMap {
+                talk: enum_map!(_ => InferenceSessionOptions::new(0, false)),
+            },
+        );
         let model = &crate::tokio::VoiceModel::sample().await.unwrap();
         let model_contents = &model.read_inference_models().await.unwrap();
         let result = status.insert_model(model.header(), model_contents);
@@ -405,9 +416,12 @@ mod tests {
     #[rstest]
     #[tokio::test]
     async fn status_is_model_loaded_works() {
-        let status = Status::<InferenceRuntimeImpl>::new(InferenceDomainMap {
-            talk: enum_map!(_ => InferenceSessionOptions::new(0, false)),
-        });
+        let status = Status::new(
+            crate::blocking::Onnxruntime::from_test_util_data().unwrap(),
+            InferenceDomainMap {
+                talk: enum_map!(_ => InferenceSessionOptions::new(0, false)),
+            },
+        );
         let vvm = &crate::tokio::VoiceModel::sample().await.unwrap();
         let model_header = vvm.header();
         let model_contents = &vvm.read_inference_models().await.unwrap();
diff --git a/crates/voicevox_core/src/synthesizer.rs b/crates/voicevox_core/src/synthesizer.rs
index 4b26eb56b..767d27b1c 100644
--- a/crates/voicevox_core/src/synthesizer.rs
+++ b/crates/voicevox_core/src/synthesizer.rs
@@ -1,5 +1,3 @@
-use crate::infer::runtimes::Onnxruntime;
-
 /// [`blocking::Synthesizer::synthesis`]および[`tokio::Synthesizer::synthesis`]のオプション。
 ///
 /// [`blocking::Synthesizer::synthesis`]: blocking::Synthesizer::synthesis
@@ -68,8 +66,6 @@ pub struct InitializeOptions {
     pub cpu_num_threads: u16,
 }
 
-pub(crate) type InferenceRuntimeImpl = Onnxruntime;
-
 pub(crate) mod blocking {
     // FIXME: ここのdocのコードブロックはasync版のものなので、`tokio`モジュールの方に移した上で、
     // (ブロッキング版をpublic APIにするならの話ではあるが)ブロッキング版はブロッキング版でコード例
@@ -93,16 +89,16 @@ pub(crate) mod blocking {
         status::Status,
         text_analyzer::{KanaAnalyzer, OpenJTalkAnalyzer, TextAnalyzer},
         AccentPhraseModel, AudioQueryModel, FullcontextExtractor, Result, StyleId,
-        SupportedDevices, SynthesisOptions, VoiceModelId, VoiceModelMeta,
+        SynthesisOptions, VoiceModelId, VoiceModelMeta,
     };
 
-    use super::{AccelerationMode, InferenceRuntimeImpl, InitializeOptions, TtsOptions};
+    use super::{AccelerationMode, InitializeOptions, TtsOptions};
 
     const DEFAULT_SAMPLING_RATE: u32 = 24000;
 
     /// 音声シンセサイザ。
     pub struct Synthesizer<O> {
-        pub(super) status: Status<InferenceRuntimeImpl>,
+        pub(super) status: Status<crate::blocking::Onnxruntime>,
         open_jtalk_analyzer: OpenJTalkAnalyzer<O>,
         kana_analyzer: KanaAnalyzer,
         use_gpu: bool,
@@ -113,22 +109,29 @@ pub(crate) mod blocking {
         ///
         /// # Example
         ///
-        #[cfg_attr(windows, doc = "```no_run")] // https://github.com/VOICEVOX/voicevox_core/issues/537
-        #[cfg_attr(not(windows), doc = "```")]
+        #[cfg_attr(feature = "load-onnxruntime", doc = "```")]
+        #[cfg_attr(not(feature = "load-onnxruntime"), doc = "```compile_fail")]
         /// # #[tokio::main]
         /// # async fn main() -> anyhow::Result<()> {
-        /// # use test_util::OPEN_JTALK_DIC_DIR;
+        /// # use test_util::{ONNXRUNTIME_DYLIB_PATH, OPEN_JTALK_DIC_DIR};
         /// #
         /// # const ACCELERATION_MODE: AccelerationMode = AccelerationMode::Cpu;
         /// #
         /// use std::sync::Arc;
         ///
         /// use voicevox_core::{
-        ///     tokio::{OpenJtalk, Synthesizer},
+        ///     tokio::{Onnxruntime, OpenJtalk, Synthesizer},
         ///     AccelerationMode, InitializeOptions,
         /// };
         ///
+        /// # if cfg!(windows) {
+        /// #     // Windows\System32\onnxruntime.dllを回避
+        /// #     voicevox_core::blocking::Onnxruntime::load_once()
+        /// #         .filename(test_util::ONNXRUNTIME_DYLIB_PATH)
+        /// #         .exec()?;
+        /// # }
         /// let mut syntesizer = Synthesizer::new(
+        ///     Onnxruntime::load_once().exec().await?,
         ///     Arc::new(OpenJtalk::new(OPEN_JTALK_DIC_DIR).await.unwrap()),
         ///     &InitializeOptions {
         ///         acceleration_mode: ACCELERATION_MODE,
@@ -139,13 +142,17 @@ pub(crate) mod blocking {
         /// # Ok(())
         /// # }
         /// ```
-        pub fn new(open_jtalk: O, options: &InitializeOptions) -> Result<Self> {
+        pub fn new(
+            onnxruntime: &'static crate::blocking::Onnxruntime,
+            open_jtalk: O,
+            options: &InitializeOptions,
+        ) -> Result<Self> {
             #[cfg(windows)]
             list_windows_video_cards();
 
             let use_gpu = match options.acceleration_mode {
                 AccelerationMode::Auto => {
-                    let supported_devices = SupportedDevices::create()?;
+                    let supported_devices = onnxruntime.supported_devices()?;
 
                     if cfg!(feature = "directml") {
                         *supported_devices.dml()
@@ -157,7 +164,7 @@ pub(crate) mod blocking {
                 AccelerationMode::Gpu => true,
             };
 
-            if use_gpu && !can_support_gpu_feature()? {
+            if use_gpu && !can_support_gpu_feature(onnxruntime)? {
                 return Err(ErrorRepr::GpuSupport.into());
             }
 
@@ -169,13 +176,16 @@ pub(crate) mod blocking {
             let heavy_session_options =
                 InferenceSessionOptions::new(options.cpu_num_threads, use_gpu);
 
-            let status = Status::new(InferenceDomainMap {
-                talk: enum_map! {
-                    TalkOperation::PredictDuration
-                    | TalkOperation::PredictIntonation => light_session_options,
-                    TalkOperation::Decode => heavy_session_options,
+            let status = Status::new(
+                onnxruntime,
+                InferenceDomainMap {
+                    talk: enum_map! {
+                        TalkOperation::PredictDuration
+                        | TalkOperation::PredictIntonation => light_session_options,
+                        TalkOperation::Decode => heavy_session_options,
+                    },
                 },
-            });
+            );
 
             return Ok(Self {
                 status,
@@ -184,8 +194,8 @@ pub(crate) mod blocking {
                 use_gpu,
             });
 
-            fn can_support_gpu_feature() -> Result<bool> {
-                let supported_devices = SupportedDevices::create()?;
+            fn can_support_gpu_feature(onnxruntime: &crate::blocking::Onnxruntime) -> Result<bool> {
+                let supported_devices = onnxruntime.supported_devices()?;
 
                 if cfg!(feature = "directml") {
                     Ok(*supported_devices.dml())
@@ -195,6 +205,10 @@ pub(crate) mod blocking {
             }
         }
 
+        pub fn onnxruntime(&self) -> &'static crate::blocking::Onnxruntime {
+            self.status.rt
+        }
+
         /// ハードウェアアクセラレーションがGPUモードか判定する。
         pub fn is_gpu_mode(&self) -> bool {
             self.use_gpu
@@ -437,13 +451,13 @@ pub(crate) mod blocking {
         ///
         /// # Example
         ///
-        #[cfg_attr(windows, doc = "```no_run")] // https://github.com/VOICEVOX/voicevox_core/issues/537
-        #[cfg_attr(not(windows), doc = "```")]
+        /// ```
         /// # #[tokio::main]
         /// # async fn main() -> anyhow::Result<()> {
         /// # let synthesizer =
         /// #     voicevox_core::__internal::doctest_fixtures::synthesizer_with_sample_voice_model(
         /// #         test_util::SAMPLE_VOICE_MODEL_FILE_PATH,
+        /// #         test_util::ONNXRUNTIME_DYLIB_PATH,
         /// #         test_util::OPEN_JTALK_DIC_DIR,
         /// #     )
         /// #     .await?;
@@ -677,13 +691,13 @@ pub(crate) mod blocking {
         ///
         /// # Example
         ///
-        #[cfg_attr(windows, doc = "```no_run")] // https://github.com/VOICEVOX/voicevox_core/issues/537
-        #[cfg_attr(not(windows), doc = "```")]
+        /// ```
         /// # #[tokio::main]
         /// # async fn main() -> anyhow::Result<()> {
         /// # let synthesizer =
         /// #     voicevox_core::__internal::doctest_fixtures::synthesizer_with_sample_voice_model(
         /// #         test_util::SAMPLE_VOICE_MODEL_FILE_PATH,
+        /// #         test_util::ONNXRUNTIME_DYLIB_PATH,
         /// #         test_util::OPEN_JTALK_DIC_DIR,
         /// #     )
         /// #     .await?;
@@ -726,13 +740,13 @@ pub(crate) mod blocking {
         ///
         /// # Example
         ///
-        #[cfg_attr(windows, doc = "```no_run")] // https://github.com/VOICEVOX/voicevox_core/issues/537
-        #[cfg_attr(not(windows), doc = "```")]
+        /// ```
         /// # #[tokio::main]
         /// # async fn main() -> anyhow::Result<()> {
         /// # let synthesizer =
         /// #     voicevox_core::__internal::doctest_fixtures::synthesizer_with_sample_voice_model(
         /// #         test_util::SAMPLE_VOICE_MODEL_FILE_PATH,
+        /// #         test_util::ONNXRUNTIME_DYLIB_PATH,
         /// #         test_util::OPEN_JTALK_DIC_DIR,
         /// #     )
         /// #     .await?;
@@ -759,13 +773,13 @@ pub(crate) mod blocking {
         ///
         /// # Examples
         ///
-        #[cfg_attr(windows, doc = "```no_run")] // https://github.com/VOICEVOX/voicevox_core/issues/537
-        #[cfg_attr(not(windows), doc = "```")]
+        /// ```
         /// # #[tokio::main]
         /// # async fn main() -> anyhow::Result<()> {
         /// # let synthesizer =
         /// #     voicevox_core::__internal::doctest_fixtures::synthesizer_with_sample_voice_model(
         /// #         test_util::SAMPLE_VOICE_MODEL_FILE_PATH,
+        /// #         test_util::ONNXRUNTIME_DYLIB_PATH,
         /// #         test_util::OPEN_JTALK_DIC_DIR,
         /// #     )
         /// #     .await?;
@@ -1135,12 +1149,20 @@ pub(crate) mod tokio {
 
     // FIXME: docを書く
     impl<O: Send + Sync + 'static> self::Synthesizer<O> {
-        pub fn new(open_jtalk: O, options: &InitializeOptions) -> Result<Self> {
-            super::blocking::Synthesizer::new(open_jtalk, options)
+        pub fn new(
+            onnxruntime: &'static crate::tokio::Onnxruntime,
+            open_jtalk: O,
+            options: &InitializeOptions,
+        ) -> Result<Self> {
+            super::blocking::Synthesizer::new(&onnxruntime.0, open_jtalk, options)
                 .map(Into::into)
                 .map(Self)
         }
 
+        pub fn onnxruntime(&self) -> &'static crate::tokio::Onnxruntime {
+            crate::tokio::Onnxruntime::from_blocking(self.0.onnxruntime())
+        }
+
         pub fn is_gpu_mode(&self) -> bool {
             self.0.is_gpu_mode()
         }
@@ -1305,6 +1327,9 @@ mod tests {
     #[tokio::test]
     async fn load_model_works(#[case] expected_result_at_initialized: Result<()>) {
         let syntesizer = super::tokio::Synthesizer::new(
+            crate::tokio::Onnxruntime::from_test_util_data()
+                .await
+                .unwrap(),
             (),
             &InitializeOptions {
                 acceleration_mode: AccelerationMode::Cpu,
@@ -1328,6 +1353,9 @@ mod tests {
     #[tokio::test]
     async fn is_use_gpu_works() {
         let syntesizer = super::tokio::Synthesizer::new(
+            crate::tokio::Onnxruntime::from_test_util_data()
+                .await
+                .unwrap(),
             (),
             &InitializeOptions {
                 acceleration_mode: AccelerationMode::Cpu,
@@ -1344,6 +1372,9 @@ mod tests {
     async fn is_loaded_model_by_style_id_works(#[case] style_id: u32, #[case] expected: bool) {
         let style_id = StyleId::new(style_id);
         let syntesizer = super::tokio::Synthesizer::new(
+            crate::tokio::Onnxruntime::from_test_util_data()
+                .await
+                .unwrap(),
             (),
             &InitializeOptions {
                 acceleration_mode: AccelerationMode::Cpu,
@@ -1372,6 +1403,9 @@ mod tests {
     #[tokio::test]
     async fn predict_duration_works() {
         let syntesizer = super::tokio::Synthesizer::new(
+            crate::tokio::Onnxruntime::from_test_util_data()
+                .await
+                .unwrap(),
             (),
             &InitializeOptions {
                 acceleration_mode: AccelerationMode::Cpu,
@@ -1403,6 +1437,9 @@ mod tests {
     #[tokio::test]
     async fn predict_intonation_works() {
         let syntesizer = super::tokio::Synthesizer::new(
+            crate::tokio::Onnxruntime::from_test_util_data()
+                .await
+                .unwrap(),
             (),
             &InitializeOptions {
                 acceleration_mode: AccelerationMode::Cpu,
@@ -1442,6 +1479,9 @@ mod tests {
     #[tokio::test]
     async fn decode_works() {
         let syntesizer = super::tokio::Synthesizer::new(
+            crate::tokio::Onnxruntime::from_test_util_data()
+                .await
+                .unwrap(),
             (),
             &InitializeOptions {
                 acceleration_mode: AccelerationMode::Cpu,
@@ -1534,6 +1574,9 @@ mod tests {
         #[case] expected_kana_text: &str,
     ) {
         let syntesizer = super::tokio::Synthesizer::new(
+            crate::tokio::Onnxruntime::from_test_util_data()
+                .await
+                .unwrap(),
             crate::tokio::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
                 .await
                 .unwrap(),
@@ -1604,6 +1647,9 @@ mod tests {
         #[case] expected_text_consonant_vowel_data: &TextConsonantVowelData,
     ) {
         let syntesizer = super::tokio::Synthesizer::new(
+            crate::tokio::Onnxruntime::from_test_util_data()
+                .await
+                .unwrap(),
             crate::tokio::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
                 .await
                 .unwrap(),
@@ -1671,6 +1717,9 @@ mod tests {
     #[tokio::test]
     async fn create_accent_phrases_works_for_japanese_commas_and_periods() {
         let syntesizer = super::tokio::Synthesizer::new(
+            crate::tokio::Onnxruntime::from_test_util_data()
+                .await
+                .unwrap(),
             crate::tokio::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
                 .await
                 .unwrap(),
@@ -1732,6 +1781,9 @@ mod tests {
     #[tokio::test]
     async fn mora_length_works() {
         let syntesizer = super::tokio::Synthesizer::new(
+            crate::tokio::Onnxruntime::from_test_util_data()
+                .await
+                .unwrap(),
             crate::tokio::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
                 .await
                 .unwrap(),
@@ -1770,6 +1822,9 @@ mod tests {
     #[tokio::test]
     async fn mora_pitch_works() {
         let syntesizer = super::tokio::Synthesizer::new(
+            crate::tokio::Onnxruntime::from_test_util_data()
+                .await
+                .unwrap(),
             crate::tokio::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
                 .await
                 .unwrap(),
@@ -1804,6 +1859,9 @@ mod tests {
     #[tokio::test]
     async fn mora_data_works() {
         let syntesizer = super::tokio::Synthesizer::new(
+            crate::tokio::Onnxruntime::from_test_util_data()
+                .await
+                .unwrap(),
             crate::tokio::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
                 .await
                 .unwrap(),
diff --git a/crates/voicevox_core/src/tokio.rs b/crates/voicevox_core/src/tokio.rs
index 49451a310..1e2fabada 100644
--- a/crates/voicevox_core/src/tokio.rs
+++ b/crates/voicevox_core/src/tokio.rs
@@ -1,6 +1,13 @@
 //! Tokio版API。
 
 pub use crate::{
-    engine::open_jtalk::tokio::OpenJtalk, synthesizer::tokio::Synthesizer,
-    user_dict::dict::tokio::UserDict, voice_model::tokio::VoiceModel,
+    engine::open_jtalk::tokio::OpenJtalk, infer::runtimes::onnxruntime::tokio::Onnxruntime,
+    synthesizer::tokio::Synthesizer, user_dict::dict::tokio::UserDict,
+    voice_model::tokio::VoiceModel,
 };
+
+pub mod onnxruntime {
+    #[cfg(feature = "load-onnxruntime")]
+    #[cfg_attr(docsrs, doc(cfg(feature = "load-onnxruntime")))]
+    pub use crate::infer::runtimes::onnxruntime::tokio::LoadOnce;
+}
diff --git a/crates/voicevox_core_c_api/Cargo.toml b/crates/voicevox_core_c_api/Cargo.toml
index f10e2a6f4..29b66e55a 100644
--- a/crates/voicevox_core_c_api/Cargo.toml
+++ b/crates/voicevox_core_c_api/Cargo.toml
@@ -13,6 +13,8 @@ harness = false
 name = "e2e"
 
 [features]
+load-onnxruntime = ["voicevox_core/load-onnxruntime"]
+link-onnxruntime = ["voicevox_core/link-onnxruntime"]
 cuda = ["voicevox_core/cuda"]
 directml = ["voicevox_core/directml"]
 
@@ -22,6 +24,7 @@ anstyle-query.workspace = true
 camino.workspace = true
 chrono = { workspace = true, default-features = false, features = ["clock"] }
 colorchoice.workspace = true
+const_format.workspace = true
 cstr.workspace = true
 derive-getters.workspace = true
 easy-ext.workspace = true
@@ -30,6 +33,7 @@ itertools.workspace = true
 libc.workspace = true
 once_cell.workspace = true
 process_path.workspace = true
+ref-cast.workspace = true
 serde_json = { workspace = true, features = ["preserve_order"] }
 thiserror.workspace = true
 tracing.workspace = true
@@ -55,6 +59,7 @@ tempfile.workspace = true
 test_util.workspace = true
 toml.workspace = true
 typetag.workspace = true
+voicevox-ort.workspace = true
 
 [lints.rust]
 unsafe_code = "allow" # C APIのための操作
diff --git a/crates/voicevox_core_c_api/build.rs b/crates/voicevox_core_c_api/build.rs
index 535e73676..6b0934882 100644
--- a/crates/voicevox_core_c_api/build.rs
+++ b/crates/voicevox_core_c_api/build.rs
@@ -1,3 +1,4 @@
+// TODO: voicevox_onnxruntimeになったらやめる
 fn main() {
     #[cfg(target_os = "linux")]
     println!("cargo:rustc-link-arg=-Wl,-rpath,$ORIGIN");
diff --git a/crates/voicevox_core_c_api/cbindgen.toml b/crates/voicevox_core_c_api/cbindgen.toml
index 7615280f6..c377daa20 100644
--- a/crates/voicevox_core_c_api/cbindgen.toml
+++ b/crates/voicevox_core_c_api/cbindgen.toml
@@ -9,6 +9,19 @@ header = """
  * 無料で使える中品質なテキスト読み上げソフトウェア、VOICEVOXのコア。
  *
  * <dl>
+ *   <dt id="voicevox-core-availability">
+ *     <a href="#voicevox-core-availability">Availability</a>
+ *   </dt>
+ *
+ *   <dd>
+ *     ヘッダによって次の二つのマクロのうちどちらかが存在する。[リリース](https://github.com/voicevox/voicevox_core/releases)されているライブラリではiOSでのみ`VOICEVOX_LINK_ONNXRUNTIME`が、他のプラットフォームでは`VOICEVOX_LOAD_ONNXRUNTIME`が存在する。
+ *
+ *     - `VOICEVOX_LOAD_ONNXRUNTIME`: ::voicevox_onnxruntime_load_once と、それに付属するアイテムが利用可能になる。
+ *     - `VOICEVOX_LINK_ONNXRUNTIME`: ::voicevox_onnxruntime_init_once が利用可能になる。またこのマクロが存在するなら、このライブラリはONNX Runtimeをロード時動的リンクする。
+ *   </dd>
+ * </dl>
+ *
+ * <dl>
  *   <dt id="voicevox-core-safety">
  *     <a href="#voicevox-core-safety">⚠️ Safety</a>
  *   </dt>
@@ -55,7 +68,18 @@ after_includes = """
 #else // __cplusplus
 #include <stdbool.h>
 #include <stdint.h>
-#endif // __cplusplus"""
+#endif // __cplusplus
+
+//#define VOICEVOX_LINK_ONNXRUNTIME
+//#define VOICEVOX_LOAD_ONNXRUNTIME
+
+#if !(defined(VOICEVOX_LINK_ONNXRUNTIME) || defined(VOICEVOX_LOAD_ONNXRUNTIME))
+#error "either `VOICEVOX_LINK_ONNXRUNTIME` or `VOICEVOX_LOAD_ONNXRUNTIME` must be enabled"
+#endif
+
+#if defined(VOICEVOX_LINK_ONNXRUNTIME) && defined(VOICEVOX_LOAD_ONNXRUNTIME)
+#error "`VOICEVOX_LINK_ONNXRUNTIME` and `VOICEVOX_LOAD_ONNXRUNTIME` cannot be enabled at the same time"
+#endif"""
 
 # Code Style Options
 
@@ -78,3 +102,7 @@ rename_variants = "ScreamingSnakeCase"
 [parse]
 parse_deps = true
 include = ["voicevox_core"]
+
+[defines]
+"feature = load-onnxruntime" = "VOICEVOX_LOAD_ONNXRUNTIME"
+"feature = link-onnxruntime" = "VOICEVOX_LINK_ONNXRUNTIME"
diff --git a/crates/voicevox_core_c_api/include/voicevox_core.h b/crates/voicevox_core_c_api/include/voicevox_core.h
index da921c869..fe19a4c2e 100644
--- a/crates/voicevox_core_c_api/include/voicevox_core.h
+++ b/crates/voicevox_core_c_api/include/voicevox_core.h
@@ -4,6 +4,19 @@
  * 無料で使える中品質なテキスト読み上げソフトウェア、VOICEVOXのコア。
  *
  * <dl>
+ *   <dt id="voicevox-core-availability">
+ *     <a href="#voicevox-core-availability">Availability</a>
+ *   </dt>
+ *
+ *   <dd>
+ *     ヘッダによって次の二つのマクロのうちどちらかが存在する。[リリース](https://github.com/voicevox/voicevox_core/releases)されているライブラリではiOSでのみ`VOICEVOX_LINK_ONNXRUNTIME`が、他のプラットフォームでは`VOICEVOX_LOAD_ONNXRUNTIME`が存在する。
+ *
+ *     - `VOICEVOX_LOAD_ONNXRUNTIME`: ::voicevox_onnxruntime_load_once と、それに付属するアイテムが利用可能になる。
+ *     - `VOICEVOX_LINK_ONNXRUNTIME`: ::voicevox_onnxruntime_init_once が利用可能になる。またこのマクロが存在するなら、このライブラリはONNX Runtimeをロード時動的リンクする。
+ *   </dd>
+ * </dl>
+ *
+ * <dl>
  *   <dt id="voicevox-core-safety">
  *     <a href="#voicevox-core-safety">⚠️ Safety</a>
  *   </dt>
@@ -53,6 +66,17 @@
 #include <stdint.h>
 #endif // __cplusplus
 
+//#define VOICEVOX_LINK_ONNXRUNTIME
+//#define VOICEVOX_LOAD_ONNXRUNTIME
+
+#if !(defined(VOICEVOX_LINK_ONNXRUNTIME) || defined(VOICEVOX_LOAD_ONNXRUNTIME))
+#error "either `VOICEVOX_LINK_ONNXRUNTIME` or `VOICEVOX_LOAD_ONNXRUNTIME` must be enabled"
+#endif
+
+#if defined(VOICEVOX_LINK_ONNXRUNTIME) && defined(VOICEVOX_LOAD_ONNXRUNTIME)
+#error "`VOICEVOX_LINK_ONNXRUNTIME` and `VOICEVOX_LOAD_ONNXRUNTIME` cannot be enabled at the same time"
+#endif
+
 /**
  * ハードウェアアクセラレーションモードを設定する設定値。
  */
@@ -102,6 +126,10 @@ enum VoicevoxResultCode
    * GPUモードがサポートされていない
    */
   VOICEVOX_RESULT_GPU_SUPPORT_ERROR = 4,
+  /**
+   * 推論ライブラリのロードまたは初期化ができなかった
+   */
+  VOICEVOX_RESULT_INIT_INFERENCE_RUNTIME_ERROR = 29,
   /**
    * スタイルIDに対するスタイルが見つからなかった
    */
@@ -239,6 +267,21 @@ typedef int32_t VoicevoxUserDictWordType;
  */
 typedef struct OpenJtalkRc OpenJtalkRc;
 
+/**
+ * ONNX Runtime。
+ *
+ * シングルトンであり、インスタンスは高々一つ。
+ *
+ * ```c
+ * const VoicevoxOnnxruntime *ort1;
+ * voicevox_onnxruntime_load_once(voicevox_make_default_load_onnxruntime_options(),
+ *                                &ort1);
+ * const VoicevoxOnnxruntime *ort2 = voicevox_onnxruntime_get();
+ * assert(ort1 == ort2);
+ * ```
+ */
+typedef struct VoicevoxOnnxruntime VoicevoxOnnxruntime;
+
 /**
  * 音声シンセサイザ。
  *
@@ -259,6 +302,24 @@ typedef struct VoicevoxUserDict VoicevoxUserDict;
  */
 typedef struct VoicevoxVoiceModel VoicevoxVoiceModel;
 
+#if defined(VOICEVOX_LOAD_ONNXRUNTIME)
+/**
+ * ::voicevox_onnxruntime_load_once のオプション。
+ *
+ * \availability{
+ *   [リリース](https://github.com/voicevox/voicevox_core/releases)されているライブラリではiOSを除くプラットフォームで利用可能。詳細は<a href="#voicevox-core-availability">ファイルレベルの"Availability"の節</a>を参照。
+ * }
+ */
+typedef struct VoicevoxLoadOnnxruntimeOptions {
+  /**
+   * ONNX Runtimeのファイル名（モジュール名）もしくはファイルパスを指定する。
+   *
+   * `dlopen`/[`LoadLibraryExW`](https://learn.microsoft.com/en-us/windows/win32/api/libloaderapi/nf-libloaderapi-loadlibraryexw)の引数に使われる。デフォルトは ::voicevox_get_onnxruntime_lib_versioned_filename と同じ。
+   */
+  const char *filename;
+} VoicevoxLoadOnnxruntimeOptions;
+#endif
+
 /**
  * ::voicevox_synthesizer_new のオプション。
  */
@@ -336,6 +397,115 @@ typedef struct VoicevoxUserDictWord {
 extern "C" {
 #endif // __cplusplus
 
+#if defined(VOICEVOX_LOAD_ONNXRUNTIME)
+/**
+ * ONNX Runtimeの動的ライブラリの、バージョン付きのファイル名。
+ *
+ * WindowsとAndroidでは ::voicevox_get_onnxruntime_lib_unversioned_filename と同じ。
+ *
+ * \availability{
+ *   [リリース](https://github.com/voicevox/voicevox_core/releases)されているライブラリではiOSを除くプラットフォームで利用可能。詳細は<a href="#voicevox-core-availability">ファイルレベルの"Availability"の節</a>を参照。
+ * }
+ */
+#ifdef _WIN32
+__declspec(dllimport)
+#endif
+const char *voicevox_get_onnxruntime_lib_versioned_filename(void);
+#endif
+
+#if defined(VOICEVOX_LOAD_ONNXRUNTIME)
+/**
+ * ONNX Runtimeの動的ライブラリの、バージョン無しのファイル名。
+ *
+ * \availability{
+ *   [リリース](https://github.com/voicevox/voicevox_core/releases)されているライブラリではiOSを除くプラットフォームで利用可能。詳細は<a href="#voicevox-core-availability">ファイルレベルの"Availability"の節</a>を参照。
+ * }
+ */
+#ifdef _WIN32
+__declspec(dllimport)
+#endif
+const char *voicevox_get_onnxruntime_lib_unversioned_filename(void);
+#endif
+
+#if defined(VOICEVOX_LOAD_ONNXRUNTIME)
+/**
+ * デフォルトの ::voicevox_onnxruntime_load_once のオプションを生成する。
+ *
+ * @return デフォルトの ::voicevox_onnxruntime_load_once のオプション
+ *
+ * \availability{
+ *   [リリース](https://github.com/voicevox/voicevox_core/releases)されているライブラリではiOSを除くプラットフォームで利用可能。詳細は<a href="#voicevox-core-availability">ファイルレベルの"Availability"の節</a>を参照。
+ * }
+ */
+#ifdef _WIN32
+__declspec(dllimport)
+#endif
+struct VoicevoxLoadOnnxruntimeOptions voicevox_make_default_load_onnxruntime_options(void);
+#endif
+
+/**
+ * ::VoicevoxOnnxruntime のインスタンスが既に作られているならそれを得る。
+ *
+ * 作られていなければ`NULL`を返す。
+ *
+ * @returns ::VoicevoxOnnxruntime のインスタンス
+ */
+#ifdef _WIN32
+__declspec(dllimport)
+#endif
+const struct VoicevoxOnnxruntime *voicevox_onnxruntime_get(void);
+
+#if defined(VOICEVOX_LOAD_ONNXRUNTIME)
+/**
+ * ONNX Runtimeをロードして初期化する。
+ *
+ * 一度成功したら、以後は引数を無視して同じ参照を返す。
+ *
+ * @param [in] options オプション
+ * @param [out] out_onnxruntime ::VoicevoxOnnxruntime のインスタンス
+ *
+ * @returns 結果コード
+ *
+ * \availability{
+ *   [リリース](https://github.com/voicevox/voicevox_core/releases)されているライブラリではiOSを除くプラットフォームで利用可能。詳細は<a href="#voicevox-core-availability">ファイルレベルの"Availability"の節</a>を参照。
+ * }
+ *
+ * \safety{
+ * - `options.filename`はヌル終端文字列を指し、かつ<a href="#voicevox-core-safety">読み込みについて有効</a>でなければならない。
+ * - `out_onnxruntime`は<a href="#voicevox-core-safety">書き込みについて有効</a>でなければならない。
+ * }
+ */
+#ifdef _WIN32
+__declspec(dllimport)
+#endif
+VoicevoxResultCode voicevox_onnxruntime_load_once(struct VoicevoxLoadOnnxruntimeOptions options,
+                                                  const struct VoicevoxOnnxruntime **out_onnxruntime);
+#endif
+
+#if defined(VOICEVOX_LINK_ONNXRUNTIME)
+/**
+ * ONNX Runtimeを初期化する。
+ *
+ * 一度成功したら以後は同じ参照を返す。
+ *
+ * @param [out] out_onnxruntime ::VoicevoxOnnxruntime のインスタンス
+ *
+ * @returns 結果コード
+ *
+ * \availability{
+ *   [リリース](https://github.com/voicevox/voicevox_core/releases)されているライブラリではiOSでのみ利用可能。詳細は<a href="#voicevox-core-availability">ファイルレベルの"Availability"の節</a>を参照。
+ * }
+ *
+ * \safety{
+ * - `out_onnxruntime`は<a href="#voicevox-core-safety">書き込みについて有効</a>でなければならない。
+ * }
+ */
+#ifdef _WIN32
+__declspec(dllimport)
+#endif
+VoicevoxResultCode voicevox_onnxruntime_init_once(const struct VoicevoxOnnxruntime **out_onnxruntime);
+#endif
+
 /**
  * ::OpenJtalkRc を<b>構築</b>(_construct_)する。
  *
@@ -492,6 +662,7 @@ void voicevox_voice_model_delete(struct VoicevoxVoiceModel *model);
 /**
  * ::VoicevoxSynthesizer を<b>構築</b>(_construct_)する。
  *
+ * @param [in] onnxruntime
  * @param [in] open_jtalk Open JTalkのオブジェクト
  * @param [in] options オプション
  * @param [out] out_synthesizer 構築先
@@ -499,6 +670,7 @@ void voicevox_voice_model_delete(struct VoicevoxVoiceModel *model);
  * @returns 結果コード
  *
  * \safety{
+ * - `onnxruntime`は ::voicevox_onnxruntime_load_once または ::voicevox_onnxruntime_init_once で得たものでなければならない。
  * - `open_jtalk`は ::voicevox_voice_model_new_from_path で得たものでなければならず、また ::voicevox_open_jtalk_rc_new で解放されていてはいけない。
  * - `out_synthesizer`は<a href="#voicevox-core-safety">書き込みについて有効</a>でなければならない。
  * }
@@ -506,7 +678,8 @@ void voicevox_voice_model_delete(struct VoicevoxVoiceModel *model);
 #ifdef _WIN32
 __declspec(dllimport)
 #endif
-VoicevoxResultCode voicevox_synthesizer_new(const struct OpenJtalkRc *open_jtalk,
+VoicevoxResultCode voicevox_synthesizer_new(const struct VoicevoxOnnxruntime *onnxruntime,
+                                            const struct OpenJtalkRc *open_jtalk,
                                             struct VoicevoxInitializeOptions options,
                                             struct VoicevoxSynthesizer **out_synthesizer);
 
@@ -563,6 +736,22 @@ __declspec(dllimport)
 VoicevoxResultCode voicevox_synthesizer_unload_voice_model(const struct VoicevoxSynthesizer *synthesizer,
                                                            VoicevoxVoiceModelId model_id);
 
+/**
+ * ::VoicevoxOnnxruntime のインスタンスを得る。
+ *
+ * @param [in] synthesizer 音声シンセサイザ
+ *
+ * @returns ::VoicevoxOnnxruntime のインスタンス
+ *
+ * \safety{
+ * - `synthesizer`は ::voicevox_synthesizer_new で得たものでなければならず、また ::voicevox_synthesizer_delete で解放されていてはいけない。
+ * }
+ */
+#ifdef _WIN32
+__declspec(dllimport)
+#endif
+const struct VoicevoxOnnxruntime *voicevox_synthesizer_get_onnxruntime(const struct VoicevoxSynthesizer *synthesizer);
+
 /**
  * ハードウェアアクセラレーションがGPUモードか判定する。
  *
@@ -623,6 +812,7 @@ char *voicevox_synthesizer_create_metas_json(const struct VoicevoxSynthesizer *s
  *
  * あくまで本ライブラリが対応しているデバイスの情報であることに注意。GPUが使える環境ではなかったとしても`cuda`や`dml`は`true`を示しうる。
  *
+ * @param [in] onnxruntime
  * @param [out] output_supported_devices_json サポートデバイス情報のJSON文字列
  *
  * @returns 結果コード
@@ -630,18 +820,20 @@ char *voicevox_synthesizer_create_metas_json(const struct VoicevoxSynthesizer *s
  * \example{
  * ```c
  * char *supported_devices;
- * VoicevoxResultCode result = voicevox_create_supported_devices_json(&supported_devices);
+ * VoicevoxResultCode result = voicevox_onnxruntime_create_supported_devices_json(onnxruntime, &supported_devices);
  * ```
  * }
  *
  * \safety{
+ * - `onnxruntime`は ::voicevox_onnxruntime_load_once または ::voicevox_onnxruntime_init_once で得たものでなければならない。
  * - `output_supported_devices_json`は<a href="#voicevox-core-safety">書き込みについて有効</a>でなければならない。
  * }
  */
 #ifdef _WIN32
 __declspec(dllimport)
 #endif
-VoicevoxResultCode voicevox_create_supported_devices_json(char **output_supported_devices_json);
+VoicevoxResultCode voicevox_onnxruntime_create_supported_devices_json(const struct VoicevoxOnnxruntime *onnxruntime,
+                                                                      char **output_supported_devices_json);
 
 /**
  * AquesTalk風記法から、AudioQueryをJSONとして生成する。
@@ -980,7 +1172,7 @@ VoicevoxResultCode voicevox_synthesizer_tts(const struct VoicevoxSynthesizer *sy
  *
  * \safety{
  * - `json`は以下のAPIで得られたポインタでなくてはいけない。
- *     - ::voicevox_create_supported_devices_json
+ *     - ::voicevox_onnxruntime_create_supported_devices_json
  *     - ::voicevox_synthesizer_create_metas_json
  *     - ::voicevox_synthesizer_create_audio_query
  *     - ::voicevox_synthesizer_create_accent_phrases
diff --git a/crates/voicevox_core_c_api/src/c_impls.rs b/crates/voicevox_core_c_api/src/c_impls.rs
index fe4afcf65..1adc402cd 100644
--- a/crates/voicevox_core_c_api/src/c_impls.rs
+++ b/crates/voicevox_core_c_api/src/c_impls.rs
@@ -1,13 +1,64 @@
 use std::{ffi::CString, path::Path};
 
 use camino::Utf8Path;
+use ref_cast::ref_cast_custom;
 use voicevox_core::{InitializeOptions, Result, VoiceModelId};
 
-use crate::{helpers::CApiResult, OpenJtalkRc, VoicevoxSynthesizer, VoicevoxVoiceModel};
+use crate::{
+    helpers::CApiResult, OpenJtalkRc, VoicevoxOnnxruntime, VoicevoxSynthesizer, VoicevoxVoiceModel,
+};
 
 // FIXME: 中身(Rust API)を直接操作するかラッパーメソッド越しにするのかが混在していて、一貫性を
 // 欠いている
 
+impl VoicevoxOnnxruntime {
+    #[cfg(feature = "load-onnxruntime")]
+    pub(crate) fn lib_versioned_filename() -> &'static std::ffi::CStr {
+        to_cstr!(voicevox_core::blocking::Onnxruntime::LIB_VERSIONED_FILENAME)
+    }
+
+    #[cfg(feature = "load-onnxruntime")]
+    pub(crate) fn lib_unversioned_filename() -> &'static std::ffi::CStr {
+        to_cstr!(voicevox_core::blocking::Onnxruntime::LIB_UNVERSIONED_FILENAME)
+    }
+
+    #[ref_cast_custom]
+    fn new(rust: &voicevox_core::blocking::Onnxruntime) -> &Self;
+
+    pub(crate) fn get() -> Option<&'static Self> {
+        voicevox_core::blocking::Onnxruntime::get().map(Self::new)
+    }
+
+    #[cfg(feature = "load-onnxruntime")]
+    pub(crate) fn load_once(filename: &std::ffi::CStr) -> CApiResult<&'static Self> {
+        use crate::helpers::ensure_utf8;
+
+        let inner = voicevox_core::blocking::Onnxruntime::load_once()
+            .filename(ensure_utf8(filename)?)
+            .exec()?;
+        Ok(Self::new(inner))
+    }
+
+    #[cfg(feature = "link-onnxruntime")]
+    pub(crate) fn init_once() -> CApiResult<&'static Self> {
+        let inner = voicevox_core::blocking::Onnxruntime::init_once()?;
+        Ok(Self::new(inner))
+    }
+}
+
+#[cfg(feature = "load-onnxruntime")]
+macro_rules! to_cstr {
+    ($s:expr) => {{
+        const __RUST_STR: &str = $s;
+        static __C_STR: &[u8] = const_format::concatcp!(__RUST_STR, '\0').as_bytes();
+
+        std::ffi::CStr::from_bytes_with_nul(__C_STR)
+            .unwrap_or_else(|e| panic!("{__RUST_STR:?} should not contain `\\0`: {e}"))
+    }};
+}
+#[cfg(feature = "load-onnxruntime")]
+use to_cstr;
+
 impl OpenJtalkRc {
     pub(crate) fn new(open_jtalk_dic_dir: impl AsRef<Utf8Path>) -> Result<Self> {
         Ok(Self {
@@ -17,12 +68,23 @@ impl OpenJtalkRc {
 }
 
 impl VoicevoxSynthesizer {
-    pub(crate) fn new(open_jtalk: &OpenJtalkRc, options: &InitializeOptions) -> Result<Self> {
-        let synthesizer =
-            voicevox_core::blocking::Synthesizer::new(open_jtalk.open_jtalk.clone(), options)?;
+    pub(crate) fn new(
+        onnxruntime: &'static VoicevoxOnnxruntime,
+        open_jtalk: &OpenJtalkRc,
+        options: &InitializeOptions,
+    ) -> Result<Self> {
+        let synthesizer = voicevox_core::blocking::Synthesizer::new(
+            &onnxruntime.0,
+            open_jtalk.open_jtalk.clone(),
+            options,
+        )?;
         Ok(Self { synthesizer })
     }
 
+    pub(crate) fn onnxruntime(&self) -> &'static VoicevoxOnnxruntime {
+        VoicevoxOnnxruntime::new(self.synthesizer.onnxruntime())
+    }
+
     pub(crate) fn load_voice_model(
         &self,
         model: &voicevox_core::blocking::VoiceModel,
diff --git a/crates/voicevox_core_c_api/src/compatible_engine.rs b/crates/voicevox_core_c_api/src/compatible_engine.rs
index ae4d21a93..bd66210e2 100644
--- a/crates/voicevox_core_c_api/src/compatible_engine.rs
+++ b/crates/voicevox_core_c_api/src/compatible_engine.rs
@@ -8,11 +8,9 @@ use std::{
 use libc::c_int;
 
 use once_cell::sync::Lazy;
-use voicevox_core::{
-    StyleId, SupportedDevices, VoiceModelId, __internal::interop::PerformInference as _,
-};
+use voicevox_core::{StyleId, VoiceModelId, __internal::interop::PerformInference as _};
 
-use crate::init_logger_once;
+use crate::{helpers::display_error, init_logger_once};
 
 macro_rules! ensure_initialized {
     ($synthesizer:expr $(,)?) => {
@@ -28,6 +26,15 @@ macro_rules! ensure_initialized {
 
 static ERROR_MESSAGE: Lazy<Mutex<String>> = Lazy::new(|| Mutex::new(String::new()));
 
+static ONNXRUNTIME: Lazy<&'static voicevox_core::blocking::Onnxruntime> = Lazy::new(|| {
+    voicevox_core::blocking::Onnxruntime::load_once()
+        .exec()
+        .unwrap_or_else(|err| {
+            display_error(&err);
+            panic!("ONNX Runtimeをロードもしくは初期化ができなかったため、クラッシュします");
+        })
+});
+
 struct VoiceModelSet {
     all_vvms: Vec<voicevox_core::blocking::VoiceModel>,
     all_metas_json: CString,
@@ -111,6 +118,7 @@ pub extern "C" fn initialize(use_gpu: bool, cpu_num_threads: c_int, load_all_mod
     init_logger_once();
     let result = (|| {
         let synthesizer = voicevox_core::blocking::Synthesizer::new(
+            *ONNXRUNTIME,
             (),
             &voicevox_core::InitializeOptions {
                 acceleration_mode: if use_gpu {
@@ -196,7 +204,14 @@ pub extern "C" fn supported_devices() -> *const c_char {
     return SUPPORTED_DEVICES.as_ptr();
 
     static SUPPORTED_DEVICES: Lazy<CString> = Lazy::new(|| {
-        CString::new(SupportedDevices::create().unwrap().to_json().to_string()).unwrap()
+        CString::new(
+            ONNXRUNTIME
+                .supported_devices()
+                .unwrap()
+                .to_json()
+                .to_string(),
+        )
+        .unwrap()
     });
 }
 
diff --git a/crates/voicevox_core_c_api/src/helpers.rs b/crates/voicevox_core_c_api/src/helpers.rs
index ac0cab286..5066b643a 100644
--- a/crates/voicevox_core_c_api/src/helpers.rs
+++ b/crates/voicevox_core_c_api/src/helpers.rs
@@ -1,5 +1,5 @@
 use easy_ext::ext;
-use std::{error::Error as _, ffi::CStr, fmt::Debug, iter};
+use std::{ffi::CStr, fmt::Debug, iter};
 use uuid::Uuid;
 use voicevox_core::{AudioQueryModel, UserDictWord, VoiceModelId};
 
@@ -19,14 +19,6 @@ pub(crate) fn into_result_code_with_error(result: CApiResult<()>) -> VoicevoxRes
     }
     return into_result_code(result);
 
-    fn display_error(err: &CApiError) {
-        itertools::chain(
-            [err.to_string()],
-            iter::successors(err.source(), |&e| e.source()).map(|e| format!("Caused by: {e}")),
-        )
-        .for_each(|msg| error!("{msg}"));
-    }
-
     fn into_result_code(result: CApiResult<()>) -> VoicevoxResultCode {
         use voicevox_core::ErrorKind::*;
         use CApiError::*;
@@ -37,6 +29,7 @@ pub(crate) fn into_result_code_with_error(result: CApiResult<()>) -> VoicevoxRes
             Err(RustApi(err)) => match err.kind() {
                 NotLoadedOpenjtalkDict => VOICEVOX_RESULT_NOT_LOADED_OPENJTALK_DICT_ERROR,
                 GpuSupport => VOICEVOX_RESULT_GPU_SUPPORT_ERROR,
+                InitInferenceRuntime => VOICEVOX_RESULT_INIT_INFERENCE_RUNTIME_ERROR,
                 OpenZipFile => VOICEVOX_RESULT_OPEN_ZIP_FILE_ERROR,
                 ReadZipEntry => VOICEVOX_RESULT_READ_ZIP_ENTRY_ERROR,
                 InvalidModelFormat => VOICEVOX_RESULT_INVALID_MODEL_HEADER_ERROR,
@@ -63,6 +56,14 @@ pub(crate) fn into_result_code_with_error(result: CApiResult<()>) -> VoicevoxRes
     }
 }
 
+pub(crate) fn display_error(err: &impl std::error::Error) {
+    // Log the error itself first, then every underlying cause in its `source()` chain.
+    error!("{err}");
+    for cause in iter::successors(err.source(), |&e| e.source()) {
+        error!("Caused by: {cause}");
+    }
+}
+
 pub(crate) type CApiResult<T> = std::result::Result<T, CApiError>;
 
 #[derive(Error, Debug)]
diff --git a/crates/voicevox_core_c_api/src/lib.rs b/crates/voicevox_core_c_api/src/lib.rs
index eb2e4698e..964e635ab 100644
--- a/crates/voicevox_core_c_api/src/lib.rs
+++ b/crates/voicevox_core_c_api/src/lib.rs
@@ -4,6 +4,7 @@
 
 mod c_impls;
 /// cbindgen:ignore
+#[cfg(feature = "load-onnxruntime")]
 mod compatible_engine;
 mod drop_check;
 mod helpers;
@@ -20,6 +21,7 @@ use anstream::{AutoStream, RawStream};
 use chrono::SecondsFormat;
 use colorchoice::ColorChoice;
 use derive_getters::Getters;
+use ref_cast::RefCastCustom;
 use std::env;
 use std::ffi::{CStr, CString};
 use std::fmt;
@@ -32,7 +34,7 @@ use tracing_subscriber::EnvFilter;
 use uuid::Uuid;
 use voicevox_core::__internal::interop::IdRef as _;
 use voicevox_core::{AccentPhraseModel, AudioQueryModel, TtsOptions, UserDictWord};
-use voicevox_core::{StyleId, SupportedDevices, SynthesisOptions};
+use voicevox_core::{StyleId, SynthesisOptions};
 
 fn init_logger_once() {
     static ONCE: Once = Once::new();
@@ -60,13 +62,7 @@ fn init_logger_once() {
             .with_env_filter(if env::var_os(EnvFilter::DEFAULT_ENV).is_some() {
                 EnvFilter::from_default_env()
             } else {
-                pub const ORT_LOGGING_LEVEL: &str = if cfg!(debug_assertions) {
-                    "info"
-                } else {
-                    "warn"
-                };
-                format!("error,voicevox_core=info,voicevox_core_c_api=info,ort={ORT_LOGGING_LEVEL}")
-                    .into()
+                "error,voicevox_core=info,voicevox_core_c_api=info,ort=info".into()
             })
             .with_timer(local_time as fn(&mut Writer<'_>) -> _)
             .with_ansi(ansi)
@@ -92,6 +88,171 @@ fn init_logger_once() {
  * voicevox_core/publish.rsにある対応する関数とはこのファイルに定義してある公開関数からvoicevoxプレフィックスを取り除いた名前の関数である
  */
 
+// TODO: https://github.com/mozilla/cbindgen/issues/927
+//#[cfg(feature = "load-onnxruntime")]
+//pub const VOICEVOX_ONNXRUNTIME_LIB_NAME: &CStr = ..;
+//#[cfg(feature = "load-onnxruntime")]
+//pub const VOICEVOX_ONNXRUNTIME_LIB_VERSION: &CStr = ..;
+
+/// ONNX Runtimeの動的ライブラリの、バージョン付きのファイル名。
+///
+/// WindowsとAndroidでは ::voicevox_get_onnxruntime_lib_unversioned_filename と同じ。
+///
+/// \availability{
+///   [リリース](https://github.com/voicevox/voicevox_core/releases)されているライブラリではiOSを除くプラットフォームで利用可能。詳細は<a href="#voicevox-core-availability">ファイルレベルの"Availability"の節</a>を参照。
+/// }
+#[cfg(feature = "load-onnxruntime")]
+#[no_mangle]
+pub extern "C" fn voicevox_get_onnxruntime_lib_versioned_filename() -> *const c_char {
+    init_logger_once();
+    let filename = VoicevoxOnnxruntime::lib_versioned_filename();
+    C_STRING_DROP_CHECKER.blacklist(filename).as_ptr()
+}
+
+/// ONNX Runtimeの動的ライブラリの、バージョン無しのファイル名。
+///
+/// \availability{
+///   [リリース](https://github.com/voicevox/voicevox_core/releases)されているライブラリではiOSを除くプラットフォームで利用可能。詳細は<a href="#voicevox-core-availability">ファイルレベルの"Availability"の節</a>を参照。
+/// }
+#[cfg(feature = "load-onnxruntime")]
+#[no_mangle]
+pub extern "C" fn voicevox_get_onnxruntime_lib_unversioned_filename() -> *const c_char {
+    init_logger_once();
+    let filename = VoicevoxOnnxruntime::lib_unversioned_filename();
+    C_STRING_DROP_CHECKER.blacklist(filename).as_ptr()
+}
+
+/// ::voicevox_onnxruntime_load_once のオプション。
+///
+/// \availability{
+///   [リリース](https://github.com/voicevox/voicevox_core/releases)されているライブラリではiOSを除くプラットフォームで利用可能。詳細は<a href="#voicevox-core-availability">ファイルレベルの"Availability"の節</a>を参照。
+/// }
+#[cfg(feature = "load-onnxruntime")]
+#[repr(C)]
+pub struct VoicevoxLoadOnnxruntimeOptions {
+    /// ONNX Runtimeのファイル名（モジュール名）もしくはファイルパスを指定する。
+    ///
+    /// `dlopen`/[`LoadLibraryExW`](https://learn.microsoft.com/en-us/windows/win32/api/libloaderapi/nf-libloaderapi-loadlibraryexw)の引数に使われる。デフォルトは ::voicevox_get_onnxruntime_lib_versioned_filename と同じ。
+    filename: *const c_char,
+}
+
+/// デフォルトの ::voicevox_onnxruntime_load_once のオプションを生成する。
+///
+/// @return デフォルトの ::voicevox_onnxruntime_load_once のオプション
+///
+/// \availability{
+///   [リリース](https://github.com/voicevox/voicevox_core/releases)されているライブラリではiOSを除くプラットフォームで利用可能。詳細は<a href="#voicevox-core-availability">ファイルレベルの"Availability"の節</a>を参照。
+/// }
+#[cfg(feature = "load-onnxruntime")]
+#[no_mangle]
+pub extern "C" fn voicevox_make_default_load_onnxruntime_options() -> VoicevoxLoadOnnxruntimeOptions
+{
+    init_logger_once();
+    let filename = VoicevoxOnnxruntime::lib_versioned_filename();
+    let filename = C_STRING_DROP_CHECKER.blacklist(filename).as_ptr();
+    VoicevoxLoadOnnxruntimeOptions { filename }
+}
+
+// https://github.com/mozilla/cbindgen/issues/967
+// FIXME: このコードブロックのコードが動くかどうか未確認
+/// ONNX Runtime。
+///
+/// シングルトンであり、インスタンスは高々一つ。
+///
+/// ```c
+/// const VoicevoxOnnxruntime *ort1;
+/// voicevox_onnxruntime_load_once(voicevox_make_default_load_onnxruntime_options(),
+///                                &ort1);
+/// const VoicevoxOnnxruntime *ort2 = voicevox_onnxruntime_get();
+/// assert(ort1 == ort2);
+/// ```
+#[cfg(any())]
+pub struct VoicevoxOnnxruntime(!);
+
+/// cbindgen:ignore
+#[derive(RefCastCustom)]
+#[repr(transparent)]
+pub struct VoicevoxOnnxruntime(voicevox_core::blocking::Onnxruntime);
+
+/// ::VoicevoxOnnxruntime のインスタンスが既に作られているならそれを得る。
+///
+/// 作られていなければ`NULL`を返す。
+///
+/// @returns ::VoicevoxOnnxruntime のインスタンス
+#[no_mangle]
+pub extern "C" fn voicevox_onnxruntime_get() -> Option<&'static VoicevoxOnnxruntime> {
+    VoicevoxOnnxruntime::get()
+}
+
+/// ONNX Runtimeをロードして初期化する。
+///
+/// 一度成功したら、以後は引数を無視して同じ参照を返す。
+///
+/// @param [in] options オプション
+/// @param [out] out_onnxruntime ::VoicevoxOnnxruntime のインスタンス
+///
+/// @returns 結果コード
+///
+/// \availability{
+///   [リリース](https://github.com/voicevox/voicevox_core/releases)されているライブラリではiOSを除くプラットフォームで利用可能。詳細は<a href="#voicevox-core-availability">ファイルレベルの"Availability"の節</a>を参照。
+/// }
+///
+/// \safety{
+/// - `options.filename`はヌル終端文字列を指し、かつ<a href="#voicevox-core-safety">読み込みについて有効</a>でなければならない。
+/// - `out_onnxruntime`は<a href="#voicevox-core-safety">書き込みについて有効</a>でなければならない。
+/// }
+#[cfg(feature = "load-onnxruntime")]
+#[no_mangle]
+pub unsafe extern "C" fn voicevox_onnxruntime_load_once(
+    options: VoicevoxLoadOnnxruntimeOptions,
+    out_onnxruntime: NonNull<&'static VoicevoxOnnxruntime>,
+) -> VoicevoxResultCode {
+    init_logger_once();
+
+    // SAFETY: the caller is required to pass a readable, NUL-terminated `options.filename`.
+    let requested = unsafe { CStr::from_ptr(options.filename) };
+
+    // Obtain the instance first; `out_onnxruntime` is written only when that succeeds.
+    let outcome = VoicevoxOnnxruntime::load_once(requested).map(|loaded| {
+        // SAFETY: the caller is required to pass an `out_onnxruntime` that is valid for
+        // writes.
+        unsafe { out_onnxruntime.as_ptr().write_unaligned(loaded) }
+    });
+
+    into_result_code_with_error(outcome)
+}
+
+/// ONNX Runtimeを初期化する。
+///
+/// 一度成功したら以後は同じ参照を返す。
+///
+/// @param [out] out_onnxruntime ::VoicevoxOnnxruntime のインスタンス
+///
+/// @returns 結果コード
+///
+/// \availability{
+///   [リリース](https://github.com/voicevox/voicevox_core/releases)されているライブラリではiOSでのみ利用可能。詳細は<a href="#voicevox-core-availability">ファイルレベルの"Availability"の節</a>を参照。
+/// }
+///
+/// \safety{
+/// - `out_onnxruntime`は<a href="#voicevox-core-safety">書き込みについて有効</a>でなければならない。
+/// }
+#[cfg(feature = "link-onnxruntime")]
+#[no_mangle]
+pub unsafe extern "C" fn voicevox_onnxruntime_init_once(
+    out_onnxruntime: NonNull<&'static VoicevoxOnnxruntime>,
+) -> VoicevoxResultCode {
+    init_logger_once();
+
+    // Obtain the instance first; `out_onnxruntime` is written only when that succeeds.
+    let outcome = VoicevoxOnnxruntime::init_once().map(|initialized| {
+        // SAFETY: the caller is required to pass an `out_onnxruntime` that is valid for writes.
+        unsafe { out_onnxruntime.as_ptr().write_unaligned(initialized) }
+    });
+
+    into_result_code_with_error(outcome)
+}
+
 /// テキスト解析器としてのOpen JTalk。
 ///
 /// <b>構築</b>(_construction_)は ::voicevox_open_jtalk_rc_new で行い、<b>破棄</b>(_destruction_)は ::voicevox_open_jtalk_rc_delete で行う。
@@ -226,6 +387,7 @@ pub extern "C" fn voicevox_get_version() -> *const c_char {
     init_logger_once();
     return C_STRING_DROP_CHECKER.blacklist(VERSION).as_ptr();
 
+    // FIXME: 実行時チェックにすることでこの`unsafe`は削れるはず
     const VERSION: &CStr = unsafe {
         // SAFETY: The package version is a SemVer, so it should not contain '\0'
         CStr::from_bytes_with_nul_unchecked(concat!(env!("CARGO_PKG_VERSION"), '\0').as_bytes())
@@ -330,6 +492,7 @@ pub struct VoicevoxSynthesizer {
 
 /// ::VoicevoxSynthesizer を<b>構築</b>(_construct_)する。
 ///
+/// @param [in] onnxruntime
 /// @param [in] open_jtalk Open JTalkのオブジェクト
 /// @param [in] options オプション
 /// @param [out] out_synthesizer 構築先
@@ -337,11 +500,13 @@ pub struct VoicevoxSynthesizer {
 /// @returns 結果コード
 ///
 /// \safety{
+/// - `onnxruntime`は ::voicevox_onnxruntime_load_once または ::voicevox_onnxruntime_init_once で得たものでなければならない。
 /// - `open_jtalk`は ::voicevox_voice_model_new_from_path で得たものでなければならず、また ::voicevox_open_jtalk_rc_new で解放されていてはいけない。
 /// - `out_synthesizer`は<a href="#voicevox-core-safety">書き込みについて有効</a>でなければならない。
 /// }
 #[no_mangle]
 pub unsafe extern "C" fn voicevox_synthesizer_new(
+    onnxruntime: &'static VoicevoxOnnxruntime,
     open_jtalk: &OpenJtalkRc,
     options: VoicevoxInitializeOptions,
     out_synthesizer: NonNull<Box<VoicevoxSynthesizer>>,
@@ -350,7 +515,7 @@ pub unsafe extern "C" fn voicevox_synthesizer_new(
     into_result_code_with_error((|| {
         let options = options.into();
 
-        let synthesizer = VoicevoxSynthesizer::new(open_jtalk, &options)?.into();
+        let synthesizer = VoicevoxSynthesizer::new(onnxruntime, open_jtalk, &options)?.into();
         out_synthesizer.as_ptr().write_unaligned(synthesizer);
         Ok(())
     })())
@@ -411,6 +576,22 @@ pub extern "C" fn voicevox_synthesizer_unload_voice_model(
     into_result_code_with_error(synthesizer.unload_voice_model(model_id).map_err(Into::into))
 }
 
+/// ::VoicevoxOnnxruntime のインスタンスを得る。
+///
+/// @param [in] synthesizer 音声シンセサイザ
+///
+/// @returns ::VoicevoxOnnxruntime のインスタンス
+///
+/// \safety{
+/// - `synthesizer`は ::voicevox_synthesizer_new で得たものでなければならず、また ::voicevox_synthesizer_delete で解放されていてはいけない。
+/// }
+#[no_mangle]
+pub extern "C" fn voicevox_synthesizer_get_onnxruntime(
+    synthesizer: &VoicevoxSynthesizer,
+) -> &'static VoicevoxOnnxruntime {
+    synthesizer.onnxruntime()
+}
+
 /// ハードウェアアクセラレーションがGPUモードか判定する。
 ///
 /// @param [in] synthesizer 音声シンセサイザ
@@ -473,6 +654,7 @@ pub extern "C" fn voicevox_synthesizer_create_metas_json(
 ///
 /// あくまで本ライブラリが対応しているデバイスの情報であることに注意。GPUが使える環境ではなかったとしても`cuda`や`dml`は`true`を示しうる。
 ///
+/// @param [in] onnxruntime
 /// @param [out] output_supported_devices_json サポートデバイス情報のJSON文字列
 ///
 /// @returns 結果コード
@@ -480,21 +662,23 @@ pub extern "C" fn voicevox_synthesizer_create_metas_json(
 /// \example{
 /// ```c
 /// char *supported_devices;
-/// VoicevoxResultCode result = voicevox_create_supported_devices_json(&supported_devices);
+/// VoicevoxResultCode result = voicevox_onnxruntime_create_supported_devices_json(onnxruntime, &supported_devices);
 /// ```
 /// }
 ///
 /// \safety{
+/// - `onnxruntime`は ::voicevox_onnxruntime_load_once または ::voicevox_onnxruntime_init_once で得たものでなければならない。
 /// - `output_supported_devices_json`は<a href="#voicevox-core-safety">書き込みについて有効</a>でなければならない。
 /// }
 #[no_mangle]
-pub unsafe extern "C" fn voicevox_create_supported_devices_json(
+pub unsafe extern "C" fn voicevox_onnxruntime_create_supported_devices_json(
+    onnxruntime: &'static VoicevoxOnnxruntime,
     output_supported_devices_json: NonNull<*mut c_char>,
 ) -> VoicevoxResultCode {
     init_logger_once();
     into_result_code_with_error((|| {
         let supported_devices =
-            CString::new(SupportedDevices::create()?.to_json().to_string()).unwrap();
+            CString::new(onnxruntime.0.supported_devices()?.to_json().to_string()).unwrap();
         output_supported_devices_json.as_ptr().write_unaligned(
             C_STRING_DROP_CHECKER
                 .whitelist(supported_devices)
@@ -980,7 +1164,7 @@ pub unsafe extern "C" fn voicevox_synthesizer_tts(
 ///
 /// \safety{
 /// - `json`は以下のAPIで得られたポインタでなくてはいけない。
-///     - ::voicevox_create_supported_devices_json
+///     - ::voicevox_onnxruntime_create_supported_devices_json
 ///     - ::voicevox_synthesizer_create_metas_json
 ///     - ::voicevox_synthesizer_create_audio_query
 ///     - ::voicevox_synthesizer_create_accent_phrases
diff --git a/crates/voicevox_core_c_api/src/result_code.rs b/crates/voicevox_core_c_api/src/result_code.rs
index 0897dfa87..085f2b8c6 100644
--- a/crates/voicevox_core_c_api/src/result_code.rs
+++ b/crates/voicevox_core_c_api/src/result_code.rs
@@ -17,6 +17,8 @@ pub enum VoicevoxResultCode {
     VOICEVOX_RESULT_GET_SUPPORTED_DEVICES_ERROR = 3,
     /// GPUモードがサポートされていない
     VOICEVOX_RESULT_GPU_SUPPORT_ERROR = 4,
+    /// 推論ライブラリのロードまたは初期化ができなかった
+    VOICEVOX_RESULT_INIT_INFERENCE_RUNTIME_ERROR = 29,
     /// スタイルIDに対するスタイルが見つからなかった
     VOICEVOX_RESULT_STYLE_NOT_FOUND_ERROR = 6,
     /// 音声モデルIDに対する音声モデルが見つからなかった
@@ -69,6 +71,9 @@ pub(crate) const fn error_result_to_message(result_code: VoicevoxResultCode) ->
         VOICEVOX_RESULT_GET_SUPPORTED_DEVICES_ERROR => {
             cstr!("サポートされているデバイス情報取得中にエラーが発生しました")
         }
+        VOICEVOX_RESULT_INIT_INFERENCE_RUNTIME_ERROR => {
+            cstr!("推論ライブラリのロードまたは初期化ができませんでした")
+        }
         VOICEVOX_RESULT_OK => cstr!("エラーが発生しませんでした"),
         VOICEVOX_RESULT_STYLE_NOT_FOUND_ERROR => cstr!(
             "指定されたIDに対するスタイルが見つかりませんでした。音声モデルが読み込まれていないか\
diff --git a/crates/voicevox_core_c_api/tests/e2e/assert_cdylib.rs b/crates/voicevox_core_c_api/tests/e2e/assert_cdylib.rs
index cfbec5c31..e779fdc23 100644
--- a/crates/voicevox_core_c_api/tests/e2e/assert_cdylib.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/assert_cdylib.rs
@@ -8,6 +8,7 @@ use assert_cmd::assert::{Assert, AssertResult, OutputAssertExt as _};
 use clap::Parser as _;
 use duct::cmd;
 use easy_ext::ext;
+use itertools::Itertools as _;
 use libloading::Library;
 use libtest_mimic::{Failed, Trial};
 
@@ -46,7 +47,15 @@ pub(crate) fn exec<C: TestContext>() -> anyhow::Result<()> {
     // テスト対象が無いときに`cargo build`をスキップしたいが、判定部分がプライベート。
     // そのためスキップするのはCLIオプションに`--ignored`か`--include-ignored`が無いときのみ
     if args.ignored || args.include_ignored {
-        cmd!(env!("CARGO"), "build", "--release", "--lib").run()?;
+        cmd!(
+            env!("CARGO"),
+            "build",
+            "--release",
+            "--lib",
+            "--features",
+            &format!(",{}", C::FEATURES.iter().format(",")),
+        )
+        .run()?;
 
         ensure!(
             C::cdylib_path().exists(),
@@ -96,6 +105,7 @@ pub(crate) fn exec<C: TestContext>() -> anyhow::Result<()> {
 }
 
 pub(crate) trait TestContext {
+    const FEATURES: &'static [&'static str];
     const TARGET_DIR: &'static str;
     const CDYLIB_NAME: &'static str;
     const RUNTIME_ENVS: &'static [(&'static str, &'static str)];
diff --git a/crates/voicevox_core_c_api/tests/e2e/log_mask.rs b/crates/voicevox_core_c_api/tests/e2e/log_mask.rs
index b28442bdb..9b08c9af7 100644
--- a/crates/voicevox_core_c_api/tests/e2e/log_mask.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/log_mask.rs
@@ -20,6 +20,13 @@ impl Utf8Output {
         )
     }
 
+    pub(crate) fn mask_onnxruntime_version(self) -> Self {
+        self.mask_stderr(
+            static_regex!(regex::escape(ort::downloaded_version!())),
+            "{onnxruntime_version}",
+        )
+    }
+
     pub(crate) fn mask_windows_video_cards(self) -> Self {
         self.mask_stderr(
             static_regex!(
diff --git a/crates/voicevox_core_c_api/tests/e2e/main.rs b/crates/voicevox_core_c_api/tests/e2e/main.rs
index 43dc3a95e..0a7520c76 100644
--- a/crates/voicevox_core_c_api/tests/e2e/main.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/main.rs
@@ -22,6 +22,7 @@ fn main() -> anyhow::Result<()> {
     enum TestContext {}
 
     impl assert_cdylib::TestContext for TestContext {
+        const FEATURES: &'static [&'static str] = &["load-onnxruntime"];
         const TARGET_DIR: &'static str = "../../target";
         const CDYLIB_NAME: &'static str = "voicevox_core";
         const RUNTIME_ENVS: &'static [(&'static str, &'static str)] =
diff --git a/crates/voicevox_core_c_api/tests/e2e/snapshots.toml b/crates/voicevox_core_c_api/tests/e2e/snapshots.toml
index 151074cb3..b623119dd 100644
--- a/crates/voicevox_core_c_api/tests/e2e/snapshots.toml
+++ b/crates/voicevox_core_c_api/tests/e2e/snapshots.toml
@@ -51,9 +51,12 @@ metas = '''
   }
 ]'''
 stderr.windows = '''
+{timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
 {windows-video-cards}
 '''
-stderr.unix = ""
+stderr.unix = '''
+{timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
+'''
 
 [compatible_engine_load_model_before_initialize]
 last_error_message = "Statusが初期化されていません"
@@ -83,14 +86,21 @@ result_messages.22 = "ユーザー辞書に単語が見つかりませんでし
 result_messages.23 = "OpenJTalkのユーザー辞書の設定に失敗しました"
 result_messages.24 = "ユーザー辞書の単語のバリデーションに失敗しました"
 result_messages.25 = "UUIDの変換に失敗しました"
-stderr = ""
+# FIXME: 26, 27, 28が抜けている
+result_messages.29 = "推論ライブラリのロードまたは初期化ができませんでした"
+stderr = '''
+{timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
+'''
 
 [simple_tts]
 output."こんにちは、音声合成の世界へようこそ".wav_length = 176172
 stderr.windows = '''
+{timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
 {windows-video-cards}
 '''
-stderr.unix = ""
+stderr.unix = '''
+{timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
+'''
 
 [synthesizer_new_output_json]
 metas = '''
@@ -145,22 +155,32 @@ metas = '''
   }
 ]'''
 stderr.windows = '''
+{timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
 {windows-video-cards}
 '''
-stderr.unix = ""
+stderr.unix = '''
+{timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
+'''
 
 [tts_via_audio_query]
 output."こんにちは、音声合成の世界へようこそ".wav_length = 176172
 stderr.windows = '''
+{timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
 {windows-video-cards}
 '''
-stderr.unix = ""
+stderr.unix = '''
+{timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
+'''
 
+# FIXME: "user_dict_load"のはず
 [user_dict]
 stderr.windows = '''
+{timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
 {windows-video-cards}
 '''
-stderr.unix = ""
+stderr.unix = '''
+{timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
+'''
 
 [user_dict_manipulate]
 stderr = ""
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/compatible_engine.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/compatible_engine.rs
index c2fc211c2..79b1d5dc8 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/compatible_engine.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/compatible_engine.rs
@@ -31,12 +31,10 @@ impl assert_cdylib::TestCase for TestCase {
             serde_json::to_string_pretty(&metas_json.parse::<serde_json::Value>()?).unwrap()
         };
 
-        let supported_devices = {
+        {
             let supported_devices = lib.supported_devices();
-            CStr::from_ptr(supported_devices)
-                .to_str()?
-                .parse::<serde_json::Value>()?
-        };
+            serde_json::from_str::<SupportedDevices>(CStr::from_ptr(supported_devices).to_str()?)?;
+        }
 
         assert!(lib.initialize(false, 0, false));
 
@@ -86,10 +84,6 @@ impl assert_cdylib::TestCase for TestCase {
         };
 
         std::assert_eq!(SNAPSHOTS.metas, metas_json);
-        std::assert_eq!(
-            SupportedDevices::create().unwrap().to_json(),
-            supported_devices,
-        );
 
         float_assert::close_l1(&phoneme_length, &EXAMPLE_DATA.duration.result, 0.01);
         float_assert::close_l1(&intonation_list, &EXAMPLE_DATA.intonation.result, 0.01);
@@ -103,6 +97,7 @@ impl assert_cdylib::TestCase for TestCase {
     fn assert_output(&self, output: Utf8Output) -> AssertResult {
         output
             .mask_timestamps()
+            .mask_onnxruntime_version()
             .mask_windows_video_cards()
             .assert()
             .try_success()?
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/compatible_engine_load_model_before_initialize.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/compatible_engine_load_model_before_initialize.rs
index 173e32f8c..18482f0de 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/compatible_engine_load_model_before_initialize.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/compatible_engine_load_model_before_initialize.rs
@@ -34,6 +34,7 @@ impl assert_cdylib::TestCase for TestCase {
     fn assert_output(&self, output: Utf8Output) -> AssertResult {
         output
             .mask_timestamps()
+            .mask_onnxruntime_version()
             .mask_windows_video_cards()
             .assert()
             .try_success()?
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/global_info.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/global_info.rs
index c6ea390ed..d2a8fc7e7 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/global_info.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/global_info.rs
@@ -28,16 +28,23 @@ impl assert_cdylib::TestCase for TestCase {
             CStr::from_ptr(lib.voicevox_get_version()).to_str()?,
         );
 
+        let onnxruntime = {
+            let mut onnxruntime = MaybeUninit::uninit();
+            assert_ok(lib.voicevox_onnxruntime_load_once(
+                lib.voicevox_make_default_load_onnxruntime_options(),
+                onnxruntime.as_mut_ptr(),
+            ));
+            onnxruntime.assume_init()
+        };
+
         {
             let mut supported_devices = MaybeUninit::uninit();
-            assert_ok(lib.voicevox_create_supported_devices_json(supported_devices.as_mut_ptr()));
+            assert_ok(lib.voicevox_onnxruntime_create_supported_devices_json(
+                onnxruntime,
+                supported_devices.as_mut_ptr(),
+            ));
             let supported_devices = supported_devices.assume_init();
-            std::assert_eq!(
-                SupportedDevices::create()?.to_json(),
-                CStr::from_ptr(supported_devices)
-                    .to_str()?
-                    .parse::<serde_json::Value>()?,
-            );
+            serde_json::from_str::<SupportedDevices>(CStr::from_ptr(supported_devices).to_str()?)?;
             lib.voicevox_json_free(supported_devices);
         }
 
@@ -83,6 +90,7 @@ impl assert_cdylib::TestCase for TestCase {
     fn assert_output(&self, output: Utf8Output) -> AssertResult {
         output
             .mask_timestamps()
+            .mask_onnxruntime_version()
             .mask_windows_video_cards()
             .assert()
             .try_success()?
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/simple_tts.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/simple_tts.rs
index 4ac4030e1..4635b0271 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/simple_tts.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/simple_tts.rs
@@ -37,6 +37,15 @@ impl assert_cdylib::TestCase for TestCase {
             model.assume_init()
         };
 
+        let onnxruntime = {
+            let mut onnxruntime = MaybeUninit::uninit();
+            assert_ok(lib.voicevox_onnxruntime_load_once(
+                lib.voicevox_make_default_load_onnxruntime_options(),
+                onnxruntime.as_mut_ptr(),
+            ));
+            onnxruntime.assume_init()
+        };
+
         let openjtalk = {
             let mut openjtalk = MaybeUninit::uninit();
             let open_jtalk_dic_dir = CString::new(OPEN_JTALK_DIC_DIR).unwrap();
@@ -49,6 +58,7 @@ impl assert_cdylib::TestCase for TestCase {
         let synthesizer = {
             let mut synthesizer = MaybeUninit::uninit();
             assert_ok(lib.voicevox_synthesizer_new(
+                onnxruntime,
                 openjtalk,
                 VoicevoxInitializeOptions {
                     acceleration_mode:
@@ -96,6 +106,7 @@ impl assert_cdylib::TestCase for TestCase {
     fn assert_output(&self, output: Utf8Output) -> AssertResult {
         output
             .mask_timestamps()
+            .mask_onnxruntime_version()
             .mask_windows_video_cards()
             .assert()
             .try_success()?
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/synthesizer_new_output_json.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/synthesizer_new_output_json.rs
index c27bd4703..8a2fd1951 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/synthesizer_new_output_json.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/synthesizer_new_output_json.rs
@@ -28,6 +28,15 @@ impl assert_cdylib::TestCase for TestCase {
     unsafe fn exec(&self, lib: Library) -> anyhow::Result<()> {
         let lib = CApi::from_library(lib)?;
 
+        let onnxruntime = {
+            let mut onnxruntime = MaybeUninit::uninit();
+            assert_ok(lib.voicevox_onnxruntime_load_once(
+                lib.voicevox_make_default_load_onnxruntime_options(),
+                onnxruntime.as_mut_ptr(),
+            ));
+            onnxruntime.assume_init()
+        };
+
         let openjtalk = {
             let mut openjtalk = MaybeUninit::uninit();
             let open_jtalk_dic_dir = CString::new(OPEN_JTALK_DIC_DIR).unwrap();
@@ -40,6 +49,7 @@ impl assert_cdylib::TestCase for TestCase {
         let synthesizer = {
             let mut synthesizer = MaybeUninit::uninit();
             assert_ok(lib.voicevox_synthesizer_new(
+                onnxruntime,
                 openjtalk,
                 VoicevoxInitializeOptions {
                     acceleration_mode:
@@ -85,6 +95,7 @@ impl assert_cdylib::TestCase for TestCase {
     fn assert_output(&self, output: Utf8Output) -> AssertResult {
         output
             .mask_timestamps()
+            .mask_onnxruntime_version()
             .mask_windows_video_cards()
             .assert()
             .try_success()?
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/tts_via_audio_query.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/tts_via_audio_query.rs
index d380b71b2..728f21339 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/tts_via_audio_query.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/tts_via_audio_query.rs
@@ -37,6 +37,15 @@ impl assert_cdylib::TestCase for TestCase {
             model.assume_init()
         };
 
+        let onnxruntime = {
+            let mut onnxruntime = MaybeUninit::uninit();
+            assert_ok(lib.voicevox_onnxruntime_load_once(
+                lib.voicevox_make_default_load_onnxruntime_options(),
+                onnxruntime.as_mut_ptr(),
+            ));
+            onnxruntime.assume_init()
+        };
+
         let openjtalk = {
             let mut openjtalk = MaybeUninit::uninit();
             let open_jtalk_dic_dir = CString::new(OPEN_JTALK_DIC_DIR).unwrap();
@@ -49,6 +58,7 @@ impl assert_cdylib::TestCase for TestCase {
         let synthesizer = {
             let mut synthesizer = MaybeUninit::uninit();
             assert_ok(lib.voicevox_synthesizer_new(
+                onnxruntime,
                 openjtalk,
                 VoicevoxInitializeOptions {
                     acceleration_mode:
@@ -108,6 +118,7 @@ impl assert_cdylib::TestCase for TestCase {
     fn assert_output(&self, output: Utf8Output) -> AssertResult {
         output
             .mask_timestamps()
+            .mask_onnxruntime_version()
             .mask_windows_video_cards()
             .assert()
             .try_success()?
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_load.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_load.rs
index 2e6875e97..646c5647b 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_load.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_load.rs
@@ -54,6 +54,15 @@ impl assert_cdylib::TestCase for TestCase {
             model.assume_init()
         };
 
+        let onnxruntime = {
+            let mut onnxruntime = MaybeUninit::uninit();
+            assert_ok(lib.voicevox_onnxruntime_load_once(
+                lib.voicevox_make_default_load_onnxruntime_options(),
+                onnxruntime.as_mut_ptr(),
+            ));
+            onnxruntime.assume_init()
+        };
+
         let openjtalk = {
             let mut openjtalk = MaybeUninit::uninit();
             let open_jtalk_dic_dir = CString::new(OPEN_JTALK_DIC_DIR).unwrap();
@@ -66,6 +75,7 @@ impl assert_cdylib::TestCase for TestCase {
         let synthesizer = {
             let mut synthesizer = MaybeUninit::uninit();
             assert_ok(lib.voicevox_synthesizer_new(
+                onnxruntime,
                 openjtalk,
                 VoicevoxInitializeOptions {
                     acceleration_mode:
@@ -125,6 +135,7 @@ impl assert_cdylib::TestCase for TestCase {
     fn assert_output(&self, output: Utf8Output) -> AssertResult {
         output
             .mask_timestamps()
+            .mask_onnxruntime_version()
             .mask_windows_video_cards()
             .assert()
             .try_success()?
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_manipulate.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_manipulate.rs
index fd3d575e3..bec0d61b5 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_manipulate.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_manipulate.rs
@@ -140,6 +140,7 @@ impl assert_cdylib::TestCase for TestCase {
     fn assert_output(&self, output: Utf8Output) -> AssertResult {
         output
             .mask_timestamps()
+            .mask_onnxruntime_version()
             .mask_windows_video_cards()
             .assert()
             .try_success()?
diff --git a/crates/voicevox_core_java_api/Cargo.toml b/crates/voicevox_core_java_api/Cargo.toml
index b39a98b2a..e9cced8b2 100644
--- a/crates/voicevox_core_java_api/Cargo.toml
+++ b/crates/voicevox_core_java_api/Cargo.toml
@@ -15,6 +15,7 @@ directml = ["voicevox_core/directml"]
 android_logger.workspace = true
 chrono = { workspace = true, default-features = false, features = ["clock"] }
 derive_more.workspace = true
+duplicate.workspace = true
 easy-ext.workspace = true
 jni.workspace = true
 once_cell.workspace = true
@@ -24,7 +25,7 @@ serde_json = { workspace = true, features = ["preserve_order"] }
 tracing = { workspace = true, features = ["log"] }
 tracing-subscriber = { workspace = true, features = ["env-filter"] }
 uuid.workspace = true
-voicevox_core.workspace = true
+voicevox_core = { workspace = true, features = ["load-onnxruntime"] }
 
 [lints.rust]
 unsafe_code = "allow" # jni-rsが要求
diff --git a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/GlobalInfo.java b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/GlobalInfo.java
index 26f9ccddd..010e69073 100644
--- a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/GlobalInfo.java
+++ b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/GlobalInfo.java
@@ -1,6 +1,5 @@
 package jp.hiroshiba.voicevoxcore;
 
-import com.google.gson.Gson;
 import com.google.gson.annotations.Expose;
 import com.google.gson.annotations.SerializedName;
 import jakarta.annotation.Nonnull;
@@ -17,28 +16,13 @@ public static String getVersion() {
     return rsGetVersion();
   }
 
-  /**
-   * このライブラリで利用可能なデバイスの情報を取得する。
-   *
-   * @return {@link SupportedDevices}。
-   */
-  @Nonnull
-  public static SupportedDevices getSupportedDevices() {
-    Gson gson = new Gson();
-    String supportedDevicesJson = rsGetSupportedDevicesJson();
-    SupportedDevices supportedDevices = gson.fromJson(supportedDevicesJson, SupportedDevices.class);
-    if (supportedDevices == null) {
-      throw new NullPointerException("supported_devices");
-    }
-    return supportedDevices;
-  }
-
   @Nonnull
   private static native String rsGetVersion();
 
   @Nonnull
   private static native String rsGetSupportedDevicesJson();
 
+  // FIXME: `Onnxruntime`に移すか、独立させる
   /**
    * このライブラリで利用可能なデバイスの情報。
    *
diff --git a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/Onnxruntime.java b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/Onnxruntime.java
new file mode 100644
index 000000000..9a9cbe133
--- /dev/null
+++ b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/Onnxruntime.java
@@ -0,0 +1,132 @@
+package jp.hiroshiba.voicevoxcore;
+
+import static jp.hiroshiba.voicevoxcore.GlobalInfo.SupportedDevices;
+
+import com.google.gson.Gson;
+import jakarta.annotation.Nonnull;
+import jakarta.annotation.Nullable;
+import java.util.Optional;
+
+/**
+ * ONNX Runtime.
+ *
+ * <p>This is a singleton: at most one instance exists.
+ *
+ * <pre>
+ * Onnxruntime ort1 = Onnxruntime.loadOnce().exec();
+ * Onnxruntime ort2 = Onnxruntime.get().get();
+ * assert ort1 == ort2;
+ * </pre>
+ */
+public class Onnxruntime extends Dll {
+  /** Library name of ONNX Runtime. */
+  public static final String LIB_NAME = "onnxruntime";
+
+  /** Recommended version of ONNX Runtime. */
+  public static final String LIB_VERSION = "1.17.3";
+
+  /**
+   * File name of the dynamic library, built from {@link #LIB_NAME} and {@link #LIB_VERSION}.
+   *
+   * <p>On Windows and Android this is the same as {@link #LIB_UNVERSIONED_FILENAME}.
+   */
+  public static final String LIB_VERSIONED_FILENAME = rsLibVersionedFilename();
+
+  /** File name of the dynamic library, built from {@link #LIB_NAME} alone. */
+  public static final String LIB_UNVERSIONED_FILENAME = rsLibUnversionedFilename();
+
+  @Nullable private static Onnxruntime instance = null;
+
+  /**
+   * Returns the instance if it has already been created.
+   *
+   * @return {@code Optional.of(…)} if an instance exists, otherwise {@code Optional.empty()}.
+   */
+  public static Optional<Onnxruntime> get() {
+    synchronized (Onnxruntime.class) {
+      return Optional.ofNullable(instance);
+    }
+  }
+
+  /**
+   * Loads and initializes ONNX Runtime.
+   *
+   * <p>After the first success, later calls ignore their arguments and return that instance.
+   *
+   * @return {@link LoadOnce}.
+   */
+  public static LoadOnce loadOnce() {
+    return new LoadOnce();
+  }
+
+  private static native String rsLibName();
+
+  private static native String rsLibVersion();
+
+  private static native String rsLibVersionedFilename();
+
+  private static native String rsLibUnversionedFilename();
+
+  static {
+    assert LIB_NAME.equals(rsLibName()) && LIB_VERSION.equals(rsLibVersion());
+  }
+
+  /** Builder for {@link #loadOnce}. */
+  public static class LoadOnce {
+    /**
+     * Sets the file name (module name) or file path of ONNX Runtime.
+     *
+     * @param filename passed to {@code dlopen}/<a
+     *     href="https://learn.microsoft.com/en-us/windows/win32/api/libloaderapi/nf-libloaderapi-loadlibraryexw">{@code
+     *     LoadLibraryExW}</a>. Defaults to {@link Onnxruntime#LIB_VERSIONED_FILENAME}.
+     * @return this object.
+     */
+    public LoadOnce filename(@Nonnull String filename) {
+      this.filename = filename;
+      return this;
+    }
+
+    /**
+     * Loads ONNX Runtime unless an instance already exists, then returns the singleton.
+     *
+     * @return {@link Onnxruntime}.
+     */
+    public Onnxruntime exec() {
+      synchronized (Onnxruntime.class) {
+        if (instance == null) {
+          instance = new Onnxruntime(filename);
+        }
+        return instance;
+      }
+    }
+
+    private LoadOnce() {}
+
+    @Nonnull private String filename = LIB_VERSIONED_FILENAME;
+  }
+
+  private long handle;
+
+  private Onnxruntime(@Nonnull String filename) {
+    rsNew(filename);
+  }
+
+  /**
+   * Returns information about the devices available to this library.
+   *
+   * @return {@link SupportedDevices}.
+   */
+  public SupportedDevices supportedDevices() {
+    Gson gson = new Gson();
+    String supportedDevicesJson = rsSupportedDevices();
+    SupportedDevices supportedDevices = gson.fromJson(supportedDevicesJson, SupportedDevices.class);
+    if (supportedDevices == null) {
+      throw new NullPointerException("supported_devices");
+    }
+    return supportedDevices;
+  }
+
+  private native void rsNew(@Nonnull String filename);
+
+  private native String rsSupportedDevices();
+}
diff --git a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/Synthesizer.java b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/Synthesizer.java
index 6ec6d9108..8d5694267 100644
--- a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/Synthesizer.java
+++ b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/Synthesizer.java
@@ -5,6 +5,7 @@
 import java.util.ArrayList;
 import java.util.Arrays;
 import java.util.List;
+import java.util.Optional;
 import java.util.UUID;
 import jp.hiroshiba.voicevoxcore.exceptions.InferenceFailedException;
 import jp.hiroshiba.voicevoxcore.exceptions.InvalidModelDataException;
@@ -17,8 +18,8 @@
 public class Synthesizer extends Dll {
   private long handle;
 
-  private Synthesizer(OpenJtalk openJtalk, Builder builder) {
-    rsNew(openJtalk, builder);
+  private Synthesizer(Onnxruntime onnxruntime, OpenJtalk openJtalk, Builder builder) {
+    rsNew(onnxruntime, openJtalk, builder);
   }
 
   protected void finalize() throws Throwable {
@@ -26,6 +27,18 @@ protected void finalize() throws Throwable {
     super.finalize();
   }
 
+  /**
+   * Returns the ONNX Runtime singleton obtained from {@link Onnxruntime#get}.
+   *
+   * @return the {@link Onnxruntime} instance.
+   */
+  @Nonnull
+  public Onnxruntime getOnnxruntime() {
+    Optional<Onnxruntime> onnxruntime = Onnxruntime.get();
+    assert onnxruntime.isPresent() : "`Synthesizer`のコンストラクタで要求しているはず";
+    return onnxruntime.get();
+  }
+
   /**
    * ハードウェアアクセラレーションがGPUモードかどうかを返す。
    *
@@ -266,7 +279,7 @@ public TtsConfigurator tts(String text, int styleId) {
     return new TtsConfigurator(this, text, styleId);
   }
 
-  private native void rsNew(OpenJtalk openJtalk, Builder builder);
+  private native void rsNew(Onnxruntime onnxruntime, OpenJtalk openJtalk, Builder builder);
 
   private native boolean rsIsGpuMode();
 
@@ -320,8 +333,8 @@ private native byte[] rsTts(String text, int styleId, boolean enableInterrogativ
 
   private native void rsDrop();
 
-  public static Builder builder(OpenJtalk openJtalk) {
-    return new Builder(openJtalk);
+  public static Builder builder(Onnxruntime onnxruntime, OpenJtalk openJtalk) {
+    return new Builder(onnxruntime, openJtalk);
   }
 
   /**
@@ -330,6 +343,7 @@ public static Builder builder(OpenJtalk openJtalk) {
    * @see Synthesizer#builder
    */
   public static class Builder {
+    private Onnxruntime onnxruntime;
     private OpenJtalk openJtalk;
 
     @SuppressWarnings("unused")
@@ -338,7 +352,8 @@ public static class Builder {
     @SuppressWarnings("unused")
     private int cpuNumThreads;
 
-    public Builder(OpenJtalk openJtalk) {
+    public Builder(Onnxruntime onnxruntime, OpenJtalk openJtalk) {
+      this.onnxruntime = onnxruntime;
       this.openJtalk = openJtalk;
     }
 
@@ -373,7 +388,7 @@ public Builder cpuNumThreads(int cpuNumThreads) {
      * @return {@link Synthesizer}。
      */
     public Synthesizer build() {
-      Synthesizer synthesizer = new Synthesizer(openJtalk, this);
+      Synthesizer synthesizer = new Synthesizer(onnxruntime, openJtalk, this);
       return synthesizer;
     }
   }
diff --git a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/exceptions/InitInferenceRuntimeException.java b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/exceptions/InitInferenceRuntimeException.java
new file mode 100644
index 000000000..c981ea034
--- /dev/null
+++ b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/exceptions/InitInferenceRuntimeException.java
@@ -0,0 +1,14 @@
+package jp.hiroshiba.voicevoxcore.exceptions;
+
+import java.io.IOException;
+
+/** Thrown when the inference library could not be loaded or initialized. */
+public class InitInferenceRuntimeException extends IOException {
+  public InitInferenceRuntimeException(String message) {
+    super(message);
+  }
+
+  public InitInferenceRuntimeException(String message, Throwable cause) {
+    super(message, cause);
+  }
+}
diff --git a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/InfoTest.java b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/InfoTest.java
index 52915abad..c9e71ed1c 100644
--- a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/InfoTest.java
+++ b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/InfoTest.java
@@ -8,15 +8,16 @@
 
 import org.junit.jupiter.api.Test;
 
-class InfoTest {
+class InfoTest extends TestUtils {
   @Test
   void checkVersion() {
     assertNotNull(GlobalInfo.getVersion());
   }
 
+  // TODO: 別の場所に移す
   @Test
   void checkSupportedDevices() {
-    GlobalInfo.SupportedDevices supportedDevices = GlobalInfo.getSupportedDevices();
+    GlobalInfo.SupportedDevices supportedDevices = loadOnnxruntime().supportedDevices();
 
     assertNotNull(supportedDevices);
     assertTrue(supportedDevices.cpu);
diff --git a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/SynthesizerTest.java b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/SynthesizerTest.java
index 1eb8fe057..4de2f617b 100644
--- a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/SynthesizerTest.java
+++ b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/SynthesizerTest.java
@@ -20,9 +20,12 @@ interface MoraCheckCallback {
 
   @Test
   void checkIsGpuMode() {
+    Onnxruntime onnxruntime = loadOnnxruntime();
     OpenJtalk openJtalk = loadOpenJtalk();
     Synthesizer synthesizer =
-        Synthesizer.builder(openJtalk).accelerationMode(Synthesizer.AccelerationMode.CPU).build();
+        Synthesizer.builder(onnxruntime, openJtalk)
+            .accelerationMode(Synthesizer.AccelerationMode.CPU)
+            .build();
     assertFalse(synthesizer.isGpuMode());
   }
 
@@ -45,9 +48,10 @@ boolean checkAllMoras(
 
   @Test
   void checkModel() throws InvalidModelDataException {
+    Onnxruntime onnxruntime = loadOnnxruntime();
     VoiceModel model = loadModel();
     OpenJtalk openJtalk = loadOpenJtalk();
-    Synthesizer synthesizer = Synthesizer.builder(openJtalk).build();
+    Synthesizer synthesizer = Synthesizer.builder(onnxruntime, openJtalk).build();
 
     assertTrue(synthesizer.metas().length == 0);
 
@@ -65,8 +69,9 @@ void checkModel() throws InvalidModelDataException {
   @Test
   void checkAudioQuery() throws InferenceFailedException, InvalidModelDataException {
     VoiceModel model = loadModel();
+    Onnxruntime onnxruntime = loadOnnxruntime();
     OpenJtalk openJtalk = loadOpenJtalk();
-    Synthesizer synthesizer = Synthesizer.builder(openJtalk).build();
+    Synthesizer synthesizer = Synthesizer.builder(onnxruntime, openJtalk).build();
     synthesizer.loadVoiceModel(model);
     AudioQuery query = synthesizer.createAudioQuery("こんにちは", model.metas[0].styles[0].id);
 
@@ -77,7 +82,8 @@ void checkAudioQuery() throws InferenceFailedException, InvalidModelDataExceptio
   void checkAccentPhrases() throws InferenceFailedException, InvalidModelDataException {
     VoiceModel model = loadModel();
     OpenJtalk openJtalk = loadOpenJtalk();
-    Synthesizer synthesizer = Synthesizer.builder(openJtalk).build();
+    Onnxruntime onnxruntime = loadOnnxruntime();
+    Synthesizer synthesizer = Synthesizer.builder(onnxruntime, openJtalk).build();
     synthesizer.loadVoiceModel(model);
     List<AccentPhrase> accentPhrases =
         synthesizer.createAccentPhrases("こんにちは", model.metas[0].styles[0].id);
@@ -106,8 +112,9 @@ void checkAccentPhrases() throws InferenceFailedException, InvalidModelDataExcep
   @Test
   void checkTts() throws InferenceFailedException, InvalidModelDataException {
     VoiceModel model = loadModel();
+    Onnxruntime onnxruntime = loadOnnxruntime();
     OpenJtalk openJtalk = loadOpenJtalk();
-    Synthesizer synthesizer = Synthesizer.builder(openJtalk).build();
+    Synthesizer synthesizer = Synthesizer.builder(onnxruntime, openJtalk).build();
     synthesizer.loadVoiceModel(model);
     synthesizer.tts("こんにちは", model.metas[0].styles[0].id);
   }
diff --git a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/TestUtils.java b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/TestUtils.java
index 032c38a3d..9ab731cd9 100644
--- a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/TestUtils.java
+++ b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/TestUtils.java
@@ -15,6 +15,16 @@ VoiceModel loadModel() {
     }
   }
 
+  Onnxruntime loadOnnxruntime() {
+    // Point at the versioned ONNX Runtime library inside the shared test data directory.
+    String libraryPath = "../../test_util/data/lib/" + Onnxruntime.LIB_VERSIONED_FILENAME;
+    try {
+      return Onnxruntime.loadOnce().filename(libraryPath).exec();
+    } catch (Exception cause) {
+      throw new RuntimeException(cause);
+    }
+  }
+
   OpenJtalk loadOpenJtalk() {
     String cwd = System.getProperty("user.dir");
     File path = new File(cwd + "/../../test_util/data/open_jtalk_dic_utf_8-1.11");
diff --git a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/UserDictTest.java b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/UserDictTest.java
index ce9b7631a..5300b81f3 100644
--- a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/UserDictTest.java
+++ b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/UserDictTest.java
@@ -17,8 +17,9 @@ class UserDictTest extends TestUtils {
   void checkLoad()
       throws InferenceFailedException, InvalidModelDataException, LoadUserDictException {
     VoiceModel model = loadModel();
+    Onnxruntime onnxruntime = loadOnnxruntime();
     OpenJtalk openJtalk = loadOpenJtalk();
-    Synthesizer synthesizer = Synthesizer.builder(openJtalk).build();
+    Synthesizer synthesizer = Synthesizer.builder(onnxruntime, openJtalk).build();
     UserDict userDict = new UserDict();
     synthesizer.loadVoiceModel(model);
     AudioQuery query1 =
diff --git a/crates/voicevox_core_java_api/src/common.rs b/crates/voicevox_core_java_api/src/common.rs
index 6e13cee89..c55ce8106 100644
--- a/crates/voicevox_core_java_api/src/common.rs
+++ b/crates/voicevox_core_java_api/src/common.rs
@@ -72,6 +72,7 @@ where
                         let class = class!(
                             NotLoadedOpenjtalkDict,
                             GpuSupport,
+                            InitInferenceRuntime,
                             OpenZipFile,
                             ReadZipEntry,
                             InvalidModelFormat,
diff --git a/crates/voicevox_core_java_api/src/info.rs b/crates/voicevox_core_java_api/src/info.rs
index 71b8db228..7328d4de8 100644
--- a/crates/voicevox_core_java_api/src/info.rs
+++ b/crates/voicevox_core_java_api/src/info.rs
@@ -9,14 +9,3 @@ extern "system" fn Java_jp_hiroshiba_voicevoxcore_GlobalInfo_rsGetVersion(
         Ok(version.into_raw())
     })
 }
-#[no_mangle]
-extern "system" fn Java_jp_hiroshiba_voicevoxcore_GlobalInfo_rsGetSupportedDevicesJson(
-    env: JNIEnv<'_>,
-) -> jobject {
-    throw_if_err(env, std::ptr::null_mut(), |env| {
-        let supported_devices = voicevox_core::SupportedDevices::create()?;
-        let json = serde_json::to_string(&supported_devices).expect("Should not fail");
-        let json = env.new_string(json)?;
-        Ok(json.into_raw())
-    })
-}
diff --git a/crates/voicevox_core_java_api/src/lib.rs b/crates/voicevox_core_java_api/src/lib.rs
index 9615f0a94..4d61414e8 100644
--- a/crates/voicevox_core_java_api/src/lib.rs
+++ b/crates/voicevox_core_java_api/src/lib.rs
@@ -1,6 +1,7 @@
 mod common;
 mod info;
 mod logger;
+mod onnxruntime;
 mod open_jtalk;
 mod synthesizer;
 mod user_dict;
diff --git a/crates/voicevox_core_java_api/src/onnxruntime.rs b/crates/voicevox_core_java_api/src/onnxruntime.rs
new file mode 100644
index 000000000..004ff4d97
--- /dev/null
+++ b/crates/voicevox_core_java_api/src/onnxruntime.rs
@@ -0,0 +1,56 @@
+use std::ptr;
+
+use duplicate::duplicate_item;
+use jni::{
+    objects::{JObject, JString},
+    sys::jobject,
+    JNIEnv,
+};
+
+use crate::common::throw_if_err;
+// JNI getters returning each listed `Onnxruntime` constant as a new Java string.
+#[duplicate_item(
+    f CONST;
+    [ Java_jp_hiroshiba_voicevoxcore_Onnxruntime_rsLibName ] [ LIB_NAME ];
+    [ Java_jp_hiroshiba_voicevoxcore_Onnxruntime_rsLibVersion ] [ LIB_VERSION ];
+    [ Java_jp_hiroshiba_voicevoxcore_Onnxruntime_rsLibVersionedFilename ] [ LIB_VERSIONED_FILENAME ];
+    [ Java_jp_hiroshiba_voicevoxcore_Onnxruntime_rsLibUnversionedFilename ] [ LIB_UNVERSIONED_FILENAME ];
+)]
+#[no_mangle]
+extern "system" fn f(env: JNIEnv<'_>) -> jobject {
+    throw_if_err(env, ptr::null_mut(), |env| {
+        let s = env.new_string(voicevox_core::blocking::Onnxruntime::CONST)?;
+        Ok(s.into_raw())
+    })
+}
+// JNI `Onnxruntime.rsNew`: runs `load_once` with `filename` and stores the result in `handle`.
+#[no_mangle]
+unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_Onnxruntime_rsNew<'local>(
+    env: JNIEnv<'local>,
+    this: JObject<'local>,
+    filename: JString<'local>,
+) {
+    throw_if_err(env, (), |env| {
+        let filename = String::from(env.get_string(&filename)?);
+        let internal = voicevox_core::blocking::Onnxruntime::load_once()
+            .filename(filename)
+            .exec()?;
+        env.set_rust_field(&this, "handle", internal)?;
+        Ok(())
+    })
+}
+// JNI `Onnxruntime.rsSupportedDevices`: returns the handle's supported devices as a JSON string.
+#[no_mangle]
+unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_Onnxruntime_rsSupportedDevices<'local>(
+    env: JNIEnv<'local>,
+    this: JObject<'local>,
+) -> jobject {
+    throw_if_err(env, ptr::null_mut(), |env| {
+        let this = *env.get_rust_field::<_, _, &'static voicevox_core::blocking::Onnxruntime>(
+            &this, "handle",
+        )?;
+        let json = this.supported_devices()?.to_json().to_string();
+        let json = env.new_string(json)?;
+        Ok(json.into_raw())
+    })
+}
diff --git a/crates/voicevox_core_java_api/src/synthesizer.rs b/crates/voicevox_core_java_api/src/synthesizer.rs
index dc5dc971d..b2605e8ae 100644
--- a/crates/voicevox_core_java_api/src/synthesizer.rs
+++ b/crates/voicevox_core_java_api/src/synthesizer.rs
@@ -14,6 +14,7 @@ use std::sync::Arc;
 unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_Synthesizer_rsNew<'local>(
     env: JNIEnv<'local>,
     this: JObject<'local>,
+    onnxruntime: JObject<'local>,
     open_jtalk: JObject<'local>,
     builder: JObject<'local>,
 ) {
@@ -45,11 +46,18 @@ unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_Synthesizer_rsNew<'loca
         let cpu_num_threads = env.get_field(&builder, "cpuNumThreads", "I")?;
         options.cpu_num_threads = cpu_num_threads.i().expect("cpuNumThreads is not integer") as u16;
 
+        let onnxruntime = *env
+            .get_rust_field::<_, _, &'static voicevox_core::blocking::Onnxruntime>(
+                &onnxruntime,
+                "handle",
+            )?;
         let open_jtalk = env
             .get_rust_field::<_, _, voicevox_core::blocking::OpenJtalk>(&open_jtalk, "handle")?
             .clone();
         let internal = Arc::new(voicevox_core::blocking::Synthesizer::new(
-            open_jtalk, &options,
+            onnxruntime,
+            open_jtalk,
+            &options,
         )?);
         env.set_rust_field(&this, "handle", internal)?;
         Ok(())
diff --git a/crates/voicevox_core_python_api/Cargo.toml b/crates/voicevox_core_python_api/Cargo.toml
index 5ccd1dc41..48c92dfb4 100644
--- a/crates/voicevox_core_python_api/Cargo.toml
+++ b/crates/voicevox_core_python_api/Cargo.toml
@@ -15,6 +15,7 @@ directml = ["voicevox_core/directml"]
 camino.workspace = true
 easy-ext.workspace = true
 log.workspace = true
+once_cell.workspace = true
 pyo3 = { workspace = true, features = ["abi3-py38", "extension-module"] }
 pyo3-asyncio = { workspace = true, features = ["tokio-runtime"] }
 pyo3-log.workspace = true
@@ -22,7 +23,7 @@ serde = { workspace = true, features = ["derive"] }
 serde_json.workspace = true
 tracing = { workspace = true, features = ["log"] }
 uuid.workspace = true
-voicevox_core.workspace = true
+voicevox_core = { workspace = true, features = ["load-onnxruntime"] }
 
 [lints.rust]
 unsafe_code = "forbid"
diff --git a/crates/voicevox_core_python_api/python/test/conftest.py b/crates/voicevox_core_python_api/python/test/conftest.py
index eec642cb9..430e415c1 100644
--- a/crates/voicevox_core_python_api/python/test/conftest.py
+++ b/crates/voicevox_core_python_api/python/test/conftest.py
@@ -4,9 +4,17 @@
 from typing import List, TypedDict
 
 import pytest
+import voicevox_core
 
 root_dir = Path(os.path.dirname(os.path.abspath(__file__)))
 
+onnxruntime_filename = str(
+    root_dir.parent.parent.parent
+    / "test_util"
+    / "data"
+    / "lib"
+    / voicevox_core.blocking.Onnxruntime.LIB_VERSIONED_FILENAME
+)
 open_jtalk_dic_dir = (
     root_dir.parent.parent.parent / "test_util" / "data" / "open_jtalk_dic_utf_8-1.11"
 )
diff --git a/crates/voicevox_core_python_api/python/test/test_asyncio_metas.py b/crates/voicevox_core_python_api/python/test/test_asyncio_metas.py
index ec69032b1..aea4af999 100644
--- a/crates/voicevox_core_python_api/python/test/test_asyncio_metas.py
+++ b/crates/voicevox_core_python_api/python/test/test_asyncio_metas.py
@@ -7,7 +7,7 @@
 import conftest
 import pytest
 import pytest_asyncio
-from voicevox_core.asyncio import OpenJtalk, Synthesizer, VoiceModel
+from voicevox_core.asyncio import Onnxruntime, OpenJtalk, Synthesizer, VoiceModel
 
 
 def test_voice_model_metas_works(voice_model: VoiceModel) -> None:
@@ -16,7 +16,10 @@ def test_voice_model_metas_works(voice_model: VoiceModel) -> None:
 
 @pytest.mark.asyncio
 async def test_synthesizer_metas_works(voice_model: VoiceModel) -> None:
-    synthesizer = Synthesizer(await OpenJtalk.new(conftest.open_jtalk_dic_dir))
+    synthesizer = Synthesizer(
+        await Onnxruntime.load_once(filename=conftest.onnxruntime_filename),
+        await OpenJtalk.new(conftest.open_jtalk_dic_dir),
+    )
     await synthesizer.load_voice_model(voice_model)
     _ = synthesizer.metas
 
diff --git a/crates/voicevox_core_python_api/python/test/test_asyncio_user_dict_load.py b/crates/voicevox_core_python_api/python/test/test_asyncio_user_dict_load.py
index c509b8c2d..d6906a6ac 100644
--- a/crates/voicevox_core_python_api/python/test/test_asyncio_user_dict_load.py
+++ b/crates/voicevox_core_python_api/python/test/test_asyncio_user_dict_load.py
@@ -15,9 +15,12 @@
 
 @pytest.mark.asyncio
 async def test_user_dict_load() -> None:
+    onnxruntime = await voicevox_core.asyncio.Onnxruntime.load_once(
+        filename=conftest.onnxruntime_filename
+    )
     open_jtalk = await voicevox_core.asyncio.OpenJtalk.new(conftest.open_jtalk_dic_dir)
     model = await voicevox_core.asyncio.VoiceModel.from_path(conftest.model_dir)
-    synthesizer = voicevox_core.asyncio.Synthesizer(open_jtalk)
+    synthesizer = voicevox_core.asyncio.Synthesizer(onnxruntime, open_jtalk)
 
     await synthesizer.load_voice_model(model)
 
diff --git a/crates/voicevox_core_python_api/python/test/test_blocking_metas.py b/crates/voicevox_core_python_api/python/test/test_blocking_metas.py
index c305e2cdb..00eade04b 100644
--- a/crates/voicevox_core_python_api/python/test/test_blocking_metas.py
+++ b/crates/voicevox_core_python_api/python/test/test_blocking_metas.py
@@ -6,7 +6,7 @@
 
 import conftest
 import pytest
-from voicevox_core.blocking import OpenJtalk, Synthesizer, VoiceModel
+from voicevox_core.blocking import Onnxruntime, OpenJtalk, Synthesizer, VoiceModel
 
 
 def test_voice_model_metas_works(voice_model: VoiceModel) -> None:
@@ -14,7 +14,10 @@ def test_voice_model_metas_works(voice_model: VoiceModel) -> None:
 
 
 def test_synthesizer_metas_works(voice_model: VoiceModel) -> None:
-    synthesizer = Synthesizer(OpenJtalk(conftest.open_jtalk_dic_dir))
+    synthesizer = Synthesizer(
+        Onnxruntime.load_once(filename=conftest.onnxruntime_filename),
+        OpenJtalk(conftest.open_jtalk_dic_dir),
+    )
     synthesizer.load_voice_model(voice_model)
     _ = synthesizer.metas
 
diff --git a/crates/voicevox_core_python_api/python/test/test_blocking_user_dict_load.py b/crates/voicevox_core_python_api/python/test/test_blocking_user_dict_load.py
index ef94d9742..198becbe2 100644
--- a/crates/voicevox_core_python_api/python/test/test_blocking_user_dict_load.py
+++ b/crates/voicevox_core_python_api/python/test/test_blocking_user_dict_load.py
@@ -13,9 +13,12 @@
 
 
 def test_user_dict_load() -> None:
+    onnxruntime = voicevox_core.blocking.Onnxruntime.load_once(
+        filename=conftest.onnxruntime_filename
+    )
     open_jtalk = voicevox_core.blocking.OpenJtalk(conftest.open_jtalk_dic_dir)
     model = voicevox_core.blocking.VoiceModel.from_path(conftest.model_dir)
-    synthesizer = voicevox_core.blocking.Synthesizer(open_jtalk)
+    synthesizer = voicevox_core.blocking.Synthesizer(onnxruntime, open_jtalk)
 
     synthesizer.load_voice_model(model)
 
diff --git a/crates/voicevox_core_python_api/python/test/test_pseudo_raii_for_asyncio_synthesizer.py b/crates/voicevox_core_python_api/python/test/test_pseudo_raii_for_asyncio_synthesizer.py
index 93d92ad28..26d389477 100644
--- a/crates/voicevox_core_python_api/python/test/test_pseudo_raii_for_asyncio_synthesizer.py
+++ b/crates/voicevox_core_python_api/python/test/test_pseudo_raii_for_asyncio_synthesizer.py
@@ -7,7 +7,7 @@
 import conftest
 import pytest
 import pytest_asyncio
-from voicevox_core.asyncio import OpenJtalk, Synthesizer
+from voicevox_core.asyncio import Onnxruntime, OpenJtalk, Synthesizer
 
 
 def test_enter_returns_workable_self(synthesizer: Synthesizer) -> None:
@@ -38,8 +38,13 @@ def test_access_after_exit_denied(synthesizer: Synthesizer) -> None:
 
 
 @pytest_asyncio.fixture
-async def synthesizer(open_jtalk: OpenJtalk) -> Synthesizer:
-    return Synthesizer(open_jtalk)
+async def synthesizer(onnxruntime: Onnxruntime, open_jtalk: OpenJtalk) -> Synthesizer:
+    return Synthesizer(onnxruntime, open_jtalk)
+
+
+@pytest_asyncio.fixture(scope="function")
+async def onnxruntime() -> Onnxruntime:
+    return await Onnxruntime.load_once(filename=conftest.onnxruntime_filename)
 
 
 @pytest_asyncio.fixture(scope="function")
diff --git a/crates/voicevox_core_python_api/python/test/test_pseudo_raii_for_blocking_synthesizer.py b/crates/voicevox_core_python_api/python/test/test_pseudo_raii_for_blocking_synthesizer.py
index 3e3f5f823..dc55eafc4 100644
--- a/crates/voicevox_core_python_api/python/test/test_pseudo_raii_for_blocking_synthesizer.py
+++ b/crates/voicevox_core_python_api/python/test/test_pseudo_raii_for_blocking_synthesizer.py
@@ -6,7 +6,7 @@
 
 import conftest
 import pytest
-from voicevox_core.blocking import OpenJtalk, Synthesizer
+from voicevox_core.blocking import Onnxruntime, OpenJtalk, Synthesizer
 
 
 def test_enter_returns_workable_self(synthesizer: Synthesizer) -> None:
@@ -37,8 +37,13 @@ def test_access_after_exit_denied(synthesizer: Synthesizer) -> None:
 
 
 @pytest.fixture
-def synthesizer(open_jtalk: OpenJtalk) -> Synthesizer:
-    return Synthesizer(open_jtalk)
+def synthesizer(onnxruntime: Onnxruntime, open_jtalk: OpenJtalk) -> Synthesizer:
+    return Synthesizer(onnxruntime, open_jtalk)
+
+
+@pytest.fixture(scope="session")
+def onnxruntime() -> Onnxruntime:
+    return Onnxruntime.load_once(filename=conftest.onnxruntime_filename)
 
 
 @pytest.fixture(scope="session")
diff --git a/crates/voicevox_core_python_api/python/test/test_type_stub_consts.py b/crates/voicevox_core_python_api/python/test/test_type_stub_consts.py
new file mode 100644
index 000000000..6a44d2771
--- /dev/null
+++ b/crates/voicevox_core_python_api/python/test/test_type_stub_consts.py
@@ -0,0 +1,58 @@
+"""Tests that the constants written in the .pyi stubs match the real values."""
+
+import ast
+from ast import AnnAssign, ClassDef, Constant, Name
+from pathlib import Path
+from typing import Tuple
+
+import voicevox_core
+
+# Locate the stubs relative to this file (as conftest.py does for its data) so
+# that the test does not depend on the directory pytest is invoked from.
+STUB_DIR = Path(__file__).resolve().parent.parent / "voicevox_core" / "_rust"
+
+
+def test() -> None:
+    """The stubs and both runtime classes must agree on the library constants."""
+    REAL_BLOCKING = (
+        voicevox_core.blocking.Onnxruntime.LIB_NAME,
+        voicevox_core.blocking.Onnxruntime.LIB_VERSION,
+    )
+    REAL_ASYNCIO = (
+        voicevox_core.asyncio.Onnxruntime.LIB_NAME,
+        voicevox_core.asyncio.Onnxruntime.LIB_VERSION,
+    )
+    stub_blocking = extract(STUB_DIR / "blocking.pyi")
+    stub_asyncio = extract(STUB_DIR / "asyncio.pyi")
+    # All four (name, version) pairs collapse into one set element iff equal.
+    assert len({REAL_BLOCKING, REAL_ASYNCIO, stub_blocking, stub_asyncio}) == 1
+
+
+def extract(pyi: Path) -> Tuple[str, str]:
+    """
+    Read ``LIB_NAME`` and ``LIB_VERSION`` from the ``Onnxruntime`` class of a stub.
+
+    The stub is parsed with ``ast`` rather than imported, so only annotated
+    assignments of string literals (``NAME: str = "..."``) are recognized.
+    """
+    module = ast.parse(pyi.read_text(encoding="utf-8"))
+    class_def = next(
+        stmt
+        for stmt in module.body
+        if isinstance(stmt, ClassDef) and stmt.name == "Onnxruntime"
+    )
+    return (_str_const(class_def, "LIB_NAME"), _str_const(class_def, "LIB_VERSION"))
+
+
+def _str_const(class_def: ClassDef, name: str) -> str:
+    """Return the string literal assigned to the annotated attribute ``name``."""
+    for stmt in class_def.body:
+        if (
+            isinstance(stmt, AnnAssign)
+            and isinstance(stmt.target, Name)
+            and stmt.target.id == name
+            and isinstance(stmt.value, Constant)
+            and isinstance(stmt.value.value, str)
+        ):
+            return stmt.value.value
+    raise AssertionError(f"`{name}: str = ...` not found in class `Onnxruntime`")
diff --git a/crates/voicevox_core_python_api/python/voicevox_core/__init__.py b/crates/voicevox_core_python_api/python/voicevox_core/__init__.py
index 4ccbad3fe..e9a0a03c0 100644
--- a/crates/voicevox_core_python_api/python/voicevox_core/__init__.py
+++ b/crates/voicevox_core_python_api/python/voicevox_core/__init__.py
@@ -19,6 +19,7 @@
     GetSupportedDevicesError,
     GpuSupportError,
     InferenceFailedError,
+    InitInferenceRuntimeError,
     InvalidModelDataError,
     InvalidWordError,
     LoadUserDictError,
@@ -34,7 +35,6 @@
     UseUserDictError,
     WordNotFoundError,
     __version__,
-    supported_devices,
 )
 
 from . import asyncio, blocking  # noqa: F401 isort: skip
@@ -50,6 +50,7 @@
     "GetSupportedDevicesError",
     "GpuSupportError",
     "InferenceFailedError",
+    "InitInferenceRuntimeError",
     "InvalidModelDataError",
     "InvalidWordError",
     "LoadUserDictError",
@@ -67,7 +68,6 @@
     "StyleNotFoundError",
     "StyleVersion",
     "SupportedDevices",
-    "supported_devices",
     "UseUserDictError",
     "UserDictWord",
     "UserDictWordType",
diff --git a/crates/voicevox_core_python_api/python/voicevox_core/_load_dlls.py b/crates/voicevox_core_python_api/python/voicevox_core/_load_dlls.py
index db8b4cdc5..0f9e3d034 100644
--- a/crates/voicevox_core_python_api/python/voicevox_core/_load_dlls.py
+++ b/crates/voicevox_core_python_api/python/voicevox_core/_load_dlls.py
@@ -1,3 +1,4 @@
+# TODO: voicevox_onnxruntimeになったらやめる
 import glob
 import platform
 from ctypes import CDLL
diff --git a/crates/voicevox_core_python_api/python/voicevox_core/_rust/__init__.pyi b/crates/voicevox_core_python_api/python/voicevox_core/_rust/__init__.pyi
index 89a50d230..81168843f 100644
--- a/crates/voicevox_core_python_api/python/voicevox_core/_rust/__init__.pyi
+++ b/crates/voicevox_core_python_api/python/voicevox_core/_rust/__init__.pyi
@@ -1,22 +1,5 @@
-from typing import TYPE_CHECKING
-
-if TYPE_CHECKING:
-    from voicevox_core import SupportedDevices
-
 __version__: str
 
-def supported_devices() -> SupportedDevices:
-    """
-    このライブラリで利用可能なデバイスの情報を取得する。
-
-    .. code-block::
-
-       import voicevox_core
-
-       supported_devices = voicevox_core.supported_devices()
-    """
-    ...
-
 class NotLoadedOpenjtalkDictError(Exception):
     """open_jtalk辞書ファイルが読み込まれていない。"""
 
@@ -27,6 +10,11 @@ class GpuSupportError(Exception):
 
     ...
 
+class InitInferenceRuntimeError(Exception):
+    """推論ライブラリのロードまたは初期化ができなかった。"""
+
+    ...
+
 class OpenZipFileError(Exception):
     """ZIPファイルを開くことに失敗した。"""
 
diff --git a/crates/voicevox_core_python_api/python/voicevox_core/_rust/asyncio.pyi b/crates/voicevox_core_python_api/python/voicevox_core/_rust/asyncio.pyi
index 468d885ee..7652a7d2c 100644
--- a/crates/voicevox_core_python_api/python/voicevox_core/_rust/asyncio.pyi
+++ b/crates/voicevox_core_python_api/python/voicevox_core/_rust/asyncio.pyi
@@ -9,6 +9,7 @@ if TYPE_CHECKING:
         AudioQuery,
         SpeakerMeta,
         StyleId,
+        SupportedDevices,
         UserDictWord,
         VoiceModelId,
     )
@@ -37,6 +38,73 @@ class VoiceModel:
         """メタ情報。"""
         ...
 
+class Onnxruntime:
+    """
+    ONNX Runtime。
+
+    シングルトンであり、インスタンスは高々一つ。
+
+    .. code-block::
+
+        ort1 = await Onnxruntime.load_once()
+        ort2 = Onnxruntime.get()
+        assert ort2
+        assert ort2 is ort1
+
+    .. code-block::
+
+        ort = await voicevox_core.asyncio.Onnxruntime.load_once()
+        assert voicevox_core.blocking.Onnxruntime.get()
+    """
+
+    # ここの定数値が本物と合致するかどうかは、test_type_stub_consts.pyで担保する。
+
+    LIB_NAME: str = "onnxruntime"
+    """ONNX Runtimeのライブラリ名。"""
+
+    LIB_VERSION: str = "1.17.3"
+    """推奨されるONNX Runtimeのバージョン。"""
+
+    LIB_VERSIONED_FILENAME: str
+    """
+    :attr:`LIB_NAME` と :attr:`LIB_VERSION` からなる動的ライブラリのファイル名。
+
+    WindowsとAndroidでは :attr:`LIB_UNVERSIONED_FILENAME` と同じ。
+    """
+
+    LIB_UNVERSIONED_FILENAME: str
+    """:attr:`LIB_NAME` からなる動的ライブラリのファイル名。"""
+
+    @staticmethod
+    def get() -> Union["Onnxruntime", None]:
+        """
+        インスタンスが既に作られているならそれを得る。
+
+        作られていなければ ``None`` を返す。
+        """
+        ...
+    @staticmethod
+    async def load_once(*, filename: str = LIB_VERSIONED_FILENAME) -> "Onnxruntime":
+        """
+        ONNX Runtimeをロードして初期化する。
+
+        一度成功したら、以後は引数を無視して同じインスタンスを返す。
+
+        Parameters
+        ----------
+        filename
+            ONNX Runtimeのファイル名（モジュール名）もしくはファイルパス。
+            ``dlopen``/`LoadLibraryExW
+            <https://learn.microsoft.com/en-us/windows/win32/api/libloaderapi/nf-libloaderapi-loadlibraryexw>`_
+            の引数に使われる。
+        """
+        ...
+    def supported_devices(self) -> SupportedDevices:
+        """
+        このライブラリで利用可能なデバイスの情報を取得する。
+        """
+        ...
+
 class OpenJtalk:
     """
     テキスト解析器としてのOpen JTalk。
@@ -72,6 +140,8 @@ class Synthesizer:
 
     Parameters
     ----------
+    onnxruntime
+        ONNX Runtime。
     open_jtalk
         Open JTalk。
     acceleration_mode
@@ -82,6 +152,7 @@ class Synthesizer:
 
     def __init__(
         self,
+        onnxruntime: Onnxruntime,
         open_jtalk: OpenJtalk,
         acceleration_mode: Union[
             AccelerationMode, Literal["AUTO", "CPU", "GPU"]
@@ -92,6 +163,10 @@ class Synthesizer:
     def __enter__(self) -> "Synthesizer": ...
     def __exit__(self, exc_type, exc_value, traceback) -> None: ...
     @property
+    def onnxruntime(self) -> Onnxruntime:
+        """ONNX Runtime。"""
+        ...
+    @property
     def is_gpu_mode(self) -> bool:
         """ハードウェアアクセラレーションがGPUモードかどうか。"""
         ...
diff --git a/crates/voicevox_core_python_api/python/voicevox_core/_rust/blocking.pyi b/crates/voicevox_core_python_api/python/voicevox_core/_rust/blocking.pyi
index fd09eb8cd..602ff31bc 100644
--- a/crates/voicevox_core_python_api/python/voicevox_core/_rust/blocking.pyi
+++ b/crates/voicevox_core_python_api/python/voicevox_core/_rust/blocking.pyi
@@ -9,6 +9,7 @@ if TYPE_CHECKING:
         AudioQuery,
         SpeakerMeta,
         StyleId,
+        SupportedDevices,
         UserDictWord,
         VoiceModelId,
     )
@@ -37,6 +38,73 @@ class VoiceModel:
         """メタ情報。"""
         ...
 
+class Onnxruntime:
+    """
+    ONNX Runtime。
+
+    シングルトンであり、インスタンスは高々一つ。
+
+    .. code-block::
+
+        ort1 = Onnxruntime.load_once()
+        ort2 = Onnxruntime.get()
+        assert ort2
+        assert ort2 is ort1
+
+    .. code-block::
+
+        ort = voicevox_core.blocking.Onnxruntime.load_once()
+        assert voicevox_core.asyncio.Onnxruntime.get()
+    """
+
+    # ここの定数値が本物と合致するかどうかは、test_type_stub_consts.pyで担保する。
+
+    LIB_NAME: str = "onnxruntime"
+    """ONNX Runtimeのライブラリ名。"""
+
+    LIB_VERSION: str = "1.17.3"
+    """推奨されるONNX Runtimeのバージョン。"""
+
+    LIB_VERSIONED_FILENAME: str
+    """
+    :attr:`LIB_NAME` と :attr:`LIB_VERSION` からなる動的ライブラリのファイル名。
+
+    WindowsとAndroidでは :attr:`LIB_UNVERSIONED_FILENAME` と同じ。
+    """
+
+    LIB_UNVERSIONED_FILENAME: str
+    """:attr:`LIB_NAME` からなる動的ライブラリのファイル名。"""
+
+    @staticmethod
+    def get() -> Union["Onnxruntime", None]:
+        """
+        インスタンスが既に作られているならそれを得る。
+
+        作られていなければ ``None`` を返す。
+        """
+        ...
+    @staticmethod
+    def load_once(*, filename: str = LIB_VERSIONED_FILENAME) -> "Onnxruntime":
+        """
+        ONNX Runtimeをロードして初期化する。
+
+        一度成功したら、以後は引数を無視して同じインスタンスを返す。
+
+        Parameters
+        ----------
+        filename
+            ONNX Runtimeのファイル名（モジュール名）もしくはファイルパス。
+            ``dlopen``/`LoadLibraryExW
+            <https://learn.microsoft.com/en-us/windows/win32/api/libloaderapi/nf-libloaderapi-loadlibraryexw>`_
+            の引数に使われる。
+        """
+        ...
+    def supported_devices(self) -> SupportedDevices:
+        """
+        このライブラリで利用可能なデバイスの情報を取得する。
+        """
+        ...
+
 class OpenJtalk:
     """
     テキスト解析器としてのOpen JTalk。
@@ -67,6 +135,8 @@ class Synthesizer:
 
     Parameters
     ----------
+    onnxruntime
+        ONNX Runtime。
     open_jtalk
         Open JTalk。
     acceleration_mode
@@ -77,6 +147,7 @@ class Synthesizer:
 
     def __init__(
         self,
+        onnxruntime: Onnxruntime,
         open_jtalk: OpenJtalk,
         acceleration_mode: Union[
             AccelerationMode, Literal["AUTO", "CPU", "GPU"]
@@ -87,6 +158,10 @@ class Synthesizer:
     def __enter__(self) -> "Synthesizer": ...
     def __exit__(self, exc_type, exc_value, traceback) -> None: ...
     @property
+    def onnxruntime(self) -> Onnxruntime:
+        """ONNX Runtime。"""
+        ...
+    @property
     def is_gpu_mode(self) -> bool:
         """ハードウェアアクセラレーションがGPUモードかどうか。"""
         ...
diff --git a/crates/voicevox_core_python_api/python/voicevox_core/asyncio.py b/crates/voicevox_core_python_api/python/voicevox_core/asyncio.py
index 75b160814..2cff19cdf 100644
--- a/crates/voicevox_core_python_api/python/voicevox_core/asyncio.py
+++ b/crates/voicevox_core_python_api/python/voicevox_core/asyncio.py
@@ -1,4 +1,4 @@
 # pyright: reportMissingModuleSource=false
-from ._rust.asyncio import OpenJtalk, Synthesizer, UserDict, VoiceModel
+from ._rust.asyncio import Onnxruntime, OpenJtalk, Synthesizer, UserDict, VoiceModel
 
-__all__ = ["OpenJtalk", "Synthesizer", "UserDict", "VoiceModel"]
+__all__ = ["Onnxruntime", "OpenJtalk", "Synthesizer", "UserDict", "VoiceModel"]
diff --git a/crates/voicevox_core_python_api/python/voicevox_core/blocking.py b/crates/voicevox_core_python_api/python/voicevox_core/blocking.py
index 80f61fdcb..7fed5fac7 100644
--- a/crates/voicevox_core_python_api/python/voicevox_core/blocking.py
+++ b/crates/voicevox_core_python_api/python/voicevox_core/blocking.py
@@ -1,4 +1,4 @@
 # pyright: reportMissingModuleSource=false
-from ._rust.blocking import OpenJtalk, Synthesizer, UserDict, VoiceModel
+from ._rust.blocking import Onnxruntime, OpenJtalk, Synthesizer, UserDict, VoiceModel
 
-__all__ = ["OpenJtalk", "Synthesizer", "UserDict", "VoiceModel"]
+__all__ = ["Onnxruntime", "OpenJtalk", "Synthesizer", "UserDict", "VoiceModel"]
diff --git a/crates/voicevox_core_python_api/src/convert.rs b/crates/voicevox_core_python_api/src/convert.rs
index f40b2d449..0eee14a5b 100644
--- a/crates/voicevox_core_python_api/src/convert.rs
+++ b/crates/voicevox_core_python_api/src/convert.rs
@@ -16,10 +16,10 @@ use voicevox_core::{
 
 use crate::{
     ExtractFullContextLabelError, GetSupportedDevicesError, GpuSupportError, InferenceFailedError,
-    InvalidModelDataError, InvalidModelFormatError, InvalidWordError, LoadUserDictError,
-    ModelAlreadyLoadedError, ModelNotFoundError, NotLoadedOpenjtalkDictError, OpenZipFileError,
-    ParseKanaError, ReadZipEntryError, SaveUserDictError, StyleAlreadyLoadedError,
-    StyleNotFoundError, UseUserDictError, WordNotFoundError,
+    InitInferenceRuntimeError, InvalidModelDataError, InvalidModelFormatError, InvalidWordError,
+    LoadUserDictError, ModelAlreadyLoadedError, ModelNotFoundError, NotLoadedOpenjtalkDictError,
+    OpenZipFileError, ParseKanaError, ReadZipEntryError, SaveUserDictError,
+    StyleAlreadyLoadedError, StyleNotFoundError, UseUserDictError, WordNotFoundError,
 };
 
 pub(crate) fn from_acceleration_mode(ob: &PyAny) -> PyResult<AccelerationMode> {
@@ -191,6 +191,7 @@ pub(crate) impl<T> voicevox_core::Result<T> {
             let top = match err.kind() {
                 ErrorKind::NotLoadedOpenjtalkDict => NotLoadedOpenjtalkDictError::new_err(msg),
                 ErrorKind::GpuSupport => GpuSupportError::new_err(msg),
+                ErrorKind::InitInferenceRuntime => InitInferenceRuntimeError::new_err(msg),
                 ErrorKind::OpenZipFile => OpenZipFileError::new_err(msg),
                 ErrorKind::ReadZipEntry => ReadZipEntryError::new_err(msg),
                 ErrorKind::ModelAlreadyLoaded => ModelAlreadyLoadedError::new_err(msg),
diff --git a/crates/voicevox_core_python_api/src/lib.rs b/crates/voicevox_core_python_api/src/lib.rs
index e43fa4476..0da82f9ca 100644
--- a/crates/voicevox_core_python_api/src/lib.rs
+++ b/crates/voicevox_core_python_api/src/lib.rs
@@ -1,7 +1,7 @@
 use std::marker::PhantomData;
 
 mod convert;
-use self::convert::{from_utf8_path, to_pydantic_dataclass, VoicevoxCoreResultExt as _};
+use self::convert::{from_utf8_path, VoicevoxCoreResultExt as _};
 use easy_ext::ext;
 use log::debug;
 use pyo3::{
@@ -9,7 +9,7 @@ use pyo3::{
     exceptions::{PyException, PyKeyError, PyValueError},
     pyfunction, pymodule,
     types::PyModule,
-    wrap_pyfunction, PyAny, PyResult, PyTypeInfo, Python,
+    wrap_pyfunction, PyResult, PyTypeInfo, Python,
 };
 
 #[pymodule]
@@ -18,7 +18,6 @@ fn rust(py: Python<'_>, module: &PyModule) -> PyResult<()> {
     pyo3_log::init();
 
     module.add("__version__", env!("CARGO_PKG_VERSION"))?;
-    module.add_wrapped(wrap_pyfunction!(supported_devices))?;
     module.add_wrapped(wrap_pyfunction!(_validate_pronunciation))?;
     module.add_wrapped(wrap_pyfunction!(_to_zenkaku))?;
 
@@ -26,6 +25,7 @@ fn rust(py: Python<'_>, module: &PyModule) -> PyResult<()> {
 
     let blocking_module = PyModule::new(py, "voicevox_core._rust.blocking")?;
     blocking_module.add_class::<self::blocking::Synthesizer>()?;
+    blocking_module.add_class::<self::blocking::Onnxruntime>()?;
     blocking_module.add_class::<self::blocking::OpenJtalk>()?;
     blocking_module.add_class::<self::blocking::VoiceModel>()?;
     blocking_module.add_class::<self::blocking::UserDict>()?;
@@ -33,6 +33,7 @@ fn rust(py: Python<'_>, module: &PyModule) -> PyResult<()> {
 
     let asyncio_module = PyModule::new(py, "voicevox_core._rust.asyncio")?;
     asyncio_module.add_class::<self::asyncio::Synthesizer>()?;
+    asyncio_module.add_class::<self::asyncio::Onnxruntime>()?;
     asyncio_module.add_class::<self::asyncio::OpenJtalk>()?;
     asyncio_module.add_class::<self::asyncio::VoiceModel>()?;
     asyncio_module.add_class::<self::asyncio::UserDict>()?;
@@ -67,6 +68,7 @@ macro_rules! exceptions {
 exceptions! {
     NotLoadedOpenjtalkDictError: PyException;
     GpuSupportError: PyException;
+    InitInferenceRuntimeError: PyException;
     OpenZipFileError: PyException;
     ReadZipEntryError: PyException;
     ModelAlreadyLoadedError: PyException;
@@ -86,16 +88,6 @@ exceptions! {
     InvalidWordError: PyValueError;
 }
 
-#[pyfunction]
-fn supported_devices(py: Python<'_>) -> PyResult<&PyAny> {
-    let class = py
-        .import("voicevox_core")?
-        .getattr("SupportedDevices")?
-        .downcast()?;
-    let s = voicevox_core::SupportedDevices::create().into_py_result(py)?;
-    to_pydantic_dataclass(s, class)
-}
-
 struct Closable<T, C: PyTypeInfo> {
     content: MaybeClosed<T>,
     marker: PhantomData<C>,
@@ -149,13 +141,13 @@ fn _to_zenkaku(text: &str) -> PyResult<String> {
 }
 
 mod blocking {
-    use std::{path::PathBuf, sync::Arc};
+    use std::{ffi::OsString, path::PathBuf, sync::Arc};
 
     use camino::Utf8PathBuf;
     use pyo3::{
         pyclass, pymethods,
         types::{IntoPyDict as _, PyBytes, PyDict, PyList},
-        PyAny, PyObject, PyRef, PyResult, Python,
+        Py, PyAny, PyObject, PyRef, PyResult, Python,
     };
     use uuid::Uuid;
     use voicevox_core::{
@@ -191,6 +183,70 @@ mod blocking {
         }
     }
 
+    static ONNXRUNTIME: once_cell::sync::OnceCell<Py<Onnxruntime>> =
+        once_cell::sync::OnceCell::new();
+
+    #[pyclass]
+    #[derive(Clone)]
+    pub(crate) struct Onnxruntime(&'static voicevox_core::blocking::Onnxruntime);
+
+    #[pymethods]
+    impl Onnxruntime {
+        #[classattr]
+        const LIB_NAME: &'static str = voicevox_core::blocking::Onnxruntime::LIB_NAME;
+
+        #[classattr]
+        const LIB_VERSION: &'static str = voicevox_core::blocking::Onnxruntime::LIB_VERSION;
+
+        #[classattr]
+        const LIB_VERSIONED_FILENAME: &'static str =
+            voicevox_core::blocking::Onnxruntime::LIB_VERSIONED_FILENAME;
+
+        #[classattr]
+        const LIB_UNVERSIONED_FILENAME: &'static str =
+            voicevox_core::blocking::Onnxruntime::LIB_UNVERSIONED_FILENAME;
+
+        #[staticmethod]
+        fn get(py: Python<'_>) -> PyResult<Option<Py<Self>>> {
+            let result = ONNXRUNTIME.get_or_try_init(|| {
+                match voicevox_core::blocking::Onnxruntime::get().map(|o| Py::new(py, Self(o))) {
+                    Some(Ok(this)) => Ok(this),
+                    Some(Err(err)) => Err(Some(err)),
+                    None => Err(None),
+                }
+            });
+
+            match result {
+                Ok(this) => Ok(Some(this.clone())),
+                Err(Some(err)) => Err(err),
+                Err(None) => Ok(None),
+            }
+        }
+
+        #[staticmethod]
+        #[pyo3(signature = (*, filename = Self::LIB_VERSIONED_FILENAME.into()))]
+        fn load_once(filename: OsString, py: Python<'_>) -> PyResult<Py<Self>> {
+            ONNXRUNTIME
+                .get_or_try_init(|| {
+                    let inner = voicevox_core::blocking::Onnxruntime::load_once()
+                        .filename(filename)
+                        .exec()
+                        .into_py_result(py)?;
+                    Py::new(py, Self(inner))
+                })
+                .cloned()
+        }
+
+        fn supported_devices<'py>(&self, py: Python<'py>) -> PyResult<&'py PyAny> {
+            let class = py
+                .import("voicevox_core")?
+                .getattr("SupportedDevices")?
+                .downcast()?;
+            let s = self.0.supported_devices().into_py_result(py)?;
+            crate::convert::to_pydantic_dataclass(s, class)
+        }
+    }
+
     #[pyclass]
     #[derive(Clone)]
     pub(crate) struct OpenJtalk {
@@ -228,11 +284,13 @@ mod blocking {
     impl Synthesizer {
         #[new]
         #[pyo3(signature =(
+            onnxruntime,
             open_jtalk,
             acceleration_mode = InitializeOptions::default().acceleration_mode,
             cpu_num_threads = InitializeOptions::default().cpu_num_threads,
         ))]
         fn new(
+            onnxruntime: Onnxruntime,
             open_jtalk: OpenJtalk,
             #[pyo3(from_py_with = "crate::convert::from_acceleration_mode")]
             acceleration_mode: AccelerationMode,
@@ -240,6 +298,7 @@ mod blocking {
             py: Python<'_>,
         ) -> PyResult<Self> {
             let inner = voicevox_core::blocking::Synthesizer::new(
+                onnxruntime.0,
                 open_jtalk.open_jtalk.clone(),
                 &InitializeOptions {
                     acceleration_mode,
@@ -270,6 +329,11 @@ mod blocking {
             self.close();
         }
 
+        #[getter]
+        fn onnxruntime(&self) -> Py<Onnxruntime> {
+            ONNXRUNTIME.get().expect("should be initialized").clone()
+        }
+
         #[getter]
         fn is_gpu_mode(&self) -> PyResult<bool> {
             let synthesizer = self.synthesizer.get()?;
@@ -577,13 +641,13 @@ mod blocking {
 }
 
 mod asyncio {
-    use std::{path::PathBuf, sync::Arc};
+    use std::{ffi::OsString, path::PathBuf, sync::Arc};
 
     use camino::Utf8PathBuf;
     use pyo3::{
         pyclass, pymethods,
         types::{IntoPyDict as _, PyBytes, PyDict, PyList},
-        PyAny, PyObject, PyRef, PyResult, Python, ToPyObject as _,
+        Py, PyAny, PyObject, PyRef, PyResult, Python, ToPyObject as _,
     };
     use uuid::Uuid;
     use voicevox_core::{
@@ -622,6 +686,71 @@ mod asyncio {
         }
     }
 
+    static ONNXRUNTIME: once_cell::sync::OnceCell<Py<Onnxruntime>> =
+        once_cell::sync::OnceCell::new();
+
+    #[pyclass]
+    #[derive(Clone)]
+    pub(crate) struct Onnxruntime(&'static voicevox_core::tokio::Onnxruntime);
+
+    #[pymethods]
+    impl Onnxruntime {
+        #[classattr]
+        const LIB_NAME: &'static str = voicevox_core::tokio::Onnxruntime::LIB_NAME;
+
+        #[classattr]
+        const LIB_VERSION: &'static str = voicevox_core::tokio::Onnxruntime::LIB_VERSION;
+
+        #[classattr]
+        const LIB_VERSIONED_FILENAME: &'static str =
+            voicevox_core::tokio::Onnxruntime::LIB_VERSIONED_FILENAME;
+
+        #[classattr]
+        const LIB_UNVERSIONED_FILENAME: &'static str =
+            voicevox_core::tokio::Onnxruntime::LIB_UNVERSIONED_FILENAME;
+
+        #[staticmethod]
+        fn get(py: Python<'_>) -> PyResult<Option<Py<Self>>> {
+            let result = ONNXRUNTIME.get_or_try_init(|| {
+                match voicevox_core::tokio::Onnxruntime::get().map(|o| Py::new(py, Self(o))) {
+                    Some(Ok(this)) => Ok(this),
+                    Some(Err(err)) => Err(Some(err)),
+                    None => Err(None),
+                }
+            });
+
+            match result {
+                Ok(this) => Ok(Some(this.clone())),
+                Err(Some(err)) => Err(err),
+                Err(None) => Ok(None),
+            }
+        }
+
+        #[staticmethod]
+        #[pyo3(signature = (*, filename = Self::LIB_VERSIONED_FILENAME.into()))]
+        fn load_once(filename: OsString, py: Python<'_>) -> PyResult<&PyAny> {
+            pyo3_asyncio::tokio::future_into_py(py, async move {
+                let inner = voicevox_core::tokio::Onnxruntime::load_once()
+                    .filename(filename)
+                    .exec()
+                    .await;
+                // Take the GIL *before* the cell's lock so `get` cannot deadlock against us.
+                Python::with_gil(|py| {
+                    ONNXRUNTIME.get_or_try_init(|| Py::new(py, Self(inner.into_py_result(py)?)))
+                })
+            })
+        }
+
+        fn supported_devices<'py>(&self, py: Python<'py>) -> PyResult<&'py PyAny> {
+            let class = py
+                .import("voicevox_core")?
+                .getattr("SupportedDevices")?
+                .downcast()?;
+            let s = self.0.supported_devices().into_py_result(py)?;
+            crate::convert::to_pydantic_dataclass(s, class)
+        }
+    }
+
     #[pyclass]
     #[derive(Clone)]
     pub(crate) struct OpenJtalk {
@@ -664,17 +793,20 @@ mod asyncio {
     impl Synthesizer {
         #[new]
         #[pyo3(signature =(
+            onnxruntime,
             open_jtalk,
             acceleration_mode = InitializeOptions::default().acceleration_mode,
             cpu_num_threads = InitializeOptions::default().cpu_num_threads,
         ))]
         fn new(
+            onnxruntime: Onnxruntime,
             open_jtalk: OpenJtalk,
             #[pyo3(from_py_with = "crate::convert::from_acceleration_mode")]
             acceleration_mode: AccelerationMode,
             cpu_num_threads: u16,
         ) -> PyResult<Self> {
             let synthesizer = voicevox_core::tokio::Synthesizer::new(
+                onnxruntime.0,
                 open_jtalk.open_jtalk.clone(),
                 &InitializeOptions {
                     acceleration_mode,
@@ -704,6 +836,11 @@ mod asyncio {
             self.close();
         }
 
+        #[getter]
+        fn onnxruntime(&self) -> Py<Onnxruntime> {
+            ONNXRUNTIME.get().expect("should be initialized").clone()
+        }
+
         #[getter]
         fn is_gpu_mode(&self) -> PyResult<bool> {
             let synthesizer = self.synthesizer.get()?;
diff --git a/docs/apis/c_api/doxygen/Doxyfile b/docs/apis/c_api/doxygen/Doxyfile
index c42bd60e0..c845adbd4 100644
--- a/docs/apis/c_api/doxygen/Doxyfile
+++ b/docs/apis/c_api/doxygen/Doxyfile
@@ -2257,7 +2257,7 @@ INCLUDE_FILE_PATTERNS  =
 # recursively expanded use the := operator instead of the = operator.
 # This tag requires that the tag ENABLE_PREPROCESSING is set to YES.
 
-PREDEFINED             =
+PREDEFINED             = VOICEVOX_LOAD_ONNXRUNTIME= VOICEVOX_LINK_ONNXRUNTIME=
 
 # If the MACRO_EXPANSION and EXPAND_ONLY_PREDEF tags are set to YES then this
 # tag can be used to specify a list of macro names that should be expanded. The
@@ -2660,6 +2660,7 @@ GENERATE_LEGEND        = YES
 
 DOT_CLEANUP            = YES
 
+ALIASES += availability{1}="<dl><dt>Availability</dt><dd>\1</dd></dl>"
 ALIASES += example{1}="<dl><dt>Example</dt><dd>\1</dd></dl>"
 ALIASES += examples{1}="<dl><dt>Examples</dt><dd>\1</dd></dl>"
 
diff --git a/docs/feature-options.md b/docs/feature-options.md
new file mode 100644
index 000000000..16487d3bf
--- /dev/null
+++ b/docs/feature-options.md
@@ -0,0 +1,26 @@
+## ONNX Runtimeのリンク方法のオプション
+
+Rust API（`voicevox_core`）およびC API（`voicevox_core_c_api`）においては、ビルド時に
+次のCargoフィーチャのうちどちらかを選択しなければなりません。
+詳しくは[voicevox_core/Cargo.toml](../crates/voicevox_core/Cargo.toml)のコメントを参照して
+下さい。Python APIやJava APIでは`load-onnxruntime`のみに限定しています。
+
+- `load-onnxruntime`
+- `link-onnxruntime`
+
+```console
+❯ cargo build --release -p voicevox_core_c_api --features load-onnxruntime
+❯ sed 's:^//\(#define VOICEVOX_LOAD_ONNXRUNTIME\)$:\1:' \
+  crates/voicevox_core_c_api/include/voicevox_core.h \
+  > ./voicevox_core.h
+```
+
+```console
+❯ cargo build --release -p voicevox_core_c_api --features link-onnxruntime
+❯ sed 's:^//\(#define VOICEVOX_LINK_ONNXRUNTIME\)$:\1:' \
+  crates/voicevox_core_c_api/include/voicevox_core.h \
+  > ./voicevox_core.h
+```
+
+C APIのリリースでは`dlopen`の利用が厳しいiOSでのみ`link-onnxruntime`で、その他は`load-onnxruntime`で
+ビルドしています。
diff --git a/docs/usage.md b/docs/usage.md
index 91da1c62f..e828ae220 100644
--- a/docs/usage.md
+++ b/docs/usage.md
@@ -62,11 +62,11 @@ VOICEVOX コアでは`Synthesizer`に音声モデルを読み込むことでテ
 
 ```python
 from pprint import pprint
-from voicevox_core.blocking import OpenJtalk, Synthesizer, VoiceModel
+from voicevox_core.blocking import Onnxruntime, OpenJtalk, Synthesizer, VoiceModel
 
 # 1. Synthesizerの初期化
 open_jtalk_dict_dir = "open_jtalk_dic_utf_8-1.11"
-synthesizer = Synthesizer(OpenJtalk(open_jtalk_dict_dir))
+synthesizer = Synthesizer(Onnxruntime.load_once(), OpenJtalk(open_jtalk_dict_dir))
 
 # 2. 音声モデルの読み込み
 model = VoiceModel.from_path("model/0.vvm")
@@ -82,7 +82,7 @@ with open("output.wav", "wb") as f:
 
 ### 1. Synthesizer の初期化
 
-辞書などを取り扱う`OpenJtalk`のインスタンスを引数に渡して`Synthesizer`を初期化します。`Synthesizer`は音声合成だけでなく、音声モデルを複数読み込んだり、イントネーションのみを生成することもできます。
+AIエンジンの`Onnxruntime`のインスタンスと、辞書などを取り扱う`OpenJtalk`のインスタンスを引数に渡して`Synthesizer`を初期化します。`Synthesizer`は音声合成だけでなく、音声モデルを複数読み込んだり、イントネーションのみを生成することもできます。
 
 ### 2. 音声モデルの読み込み
 
diff --git a/example/cpp/unix/simple_tts.cpp b/example/cpp/unix/simple_tts.cpp
index c7683d49a..5db24b12e 100644
--- a/example/cpp/unix/simple_tts.cpp
+++ b/example/cpp/unix/simple_tts.cpp
@@ -20,14 +20,21 @@ int main(int argc, char *argv[]) {
   std::cout << "coreの初期化中..." << std::endl;
 
   auto initialize_options = voicevox_make_default_initialize_options();
+  const VoicevoxOnnxruntime* onnxruntime;
+  auto load_ort_options = voicevox_make_default_load_onnxruntime_options();
+  auto result = voicevox_onnxruntime_load_once(load_ort_options, &onnxruntime);
+  if (result != VOICEVOX_RESULT_OK){
+    std::cerr << voicevox_error_result_to_message(result) << std::endl;
+    return 1;
+  }
   OpenJtalkRc* open_jtalk;
-  auto result = voicevox_open_jtalk_rc_new(open_jtalk_dict_path.c_str(),&open_jtalk);
+  result = voicevox_open_jtalk_rc_new(open_jtalk_dict_path.c_str(),&open_jtalk);
   if (result != VOICEVOX_RESULT_OK){
     std::cerr << voicevox_error_result_to_message(result) << std::endl;
     return 1;
   }
   VoicevoxSynthesizer* synthesizer;
-  result = voicevox_synthesizer_new(open_jtalk,initialize_options,&synthesizer);
+  result = voicevox_synthesizer_new(onnxruntime,open_jtalk,initialize_options,&synthesizer);
   if (result != VOICEVOX_RESULT_OK) {
     std::cerr << voicevox_error_result_to_message(result) << std::endl;
     return 1;
diff --git a/example/cpp/windows/simple_tts/simple_tts.cpp b/example/cpp/windows/simple_tts/simple_tts.cpp
index bd070505f..946ef9679 100644
--- a/example/cpp/windows/simple_tts/simple_tts.cpp
+++ b/example/cpp/windows/simple_tts/simple_tts.cpp
@@ -33,14 +33,21 @@ int main() {
   VoicevoxInitializeOptions  initializeOptions = voicevox_make_default_initialize_options();
   std::string dict = GetOpenJTalkDict();
 
+  const VoicevoxOnnxruntime* onnxruntime;
+  auto load_ort_options = voicevox_make_default_load_onnxruntime_options();
+  auto result = voicevox_onnxruntime_load_once(load_ort_options, &onnxruntime);
+  if (result != VoicevoxResultCode::VOICEVOX_RESULT_OK) {
+    OutErrorMessage(result);
+    return 0;
+  }
   OpenJtalkRc* open_jtalk;
-  auto result = voicevox_open_jtalk_rc_new(dict.c_str(),&open_jtalk);
+  result = voicevox_open_jtalk_rc_new(dict.c_str(),&open_jtalk);
   if (result != VoicevoxResultCode::VOICEVOX_RESULT_OK) {
     OutErrorMessage(result);
     return 0;
   }
   VoicevoxSynthesizer* synthesizer;
-  result = voicevox_synthesizer_new(open_jtalk,initializeOptions,&synthesizer);
+  result = voicevox_synthesizer_new(onnxruntime,open_jtalk,initializeOptions,&synthesizer);
   if (result != VoicevoxResultCode::VOICEVOX_RESULT_OK) {
     OutErrorMessage(result);
     return 0;
diff --git a/example/kotlin/README.md b/example/kotlin/README.md
index 3bcdafc94..7dc5b637c 100644
--- a/example/kotlin/README.md
+++ b/example/kotlin/README.md
@@ -47,6 +47,7 @@ Usage: voicevoxcoreexample options_list
 Options:
     --mode [AUTO] -> モード { Value should be one of [auto, cpu, gpu] }
     --vvm -> vvmファイルへのパス (always required) { String }
+    --onnxruntime [libonnxruntime.so.1.17.3] -> ONNX Runtimeのファイル名（モジュール名）もしくはファイルパス { String }
     --dictDir [./open_jtalk_dic_utf_8-1.11] -> Open JTalkの辞書ディレクトリ { String }
     --text [この音声は、ボイスボックスを使用して、出力されています。] -> 読み上げさせたい文章 { String }
     --out [./output.wav] -> 出力wavファイルのパス { String }
@@ -56,9 +57,13 @@ Options:
 
 ## 実行例
 
+<!-- FIXME: `cargo build -p test_util`するように案内するか、製品版のVVMを実行させる -->
+<!-- FIXME: libvoicevox_onnxruntimeになったら`--onnxruntime`を指定するのではなく、`$LD_LIBRARY_PATH`とかに入れて実行するように案内する -->
+
 ```console
-❯ ./gradlew run --args="--vvm ../../crates/test_util/data/model/sample.vvm"
-Inititalizing: AUTO, ./open_jtalk_dic_utf_8-1.11
+❯ # Linuxの場合
+❯ ./gradlew run --args="--vvm ../../crates/test_util/data/model/sample.vvm --onnxruntime ../../crates/test_util/data/lib/libonnxruntime.so.1.17.3"
+Inititalizing: AUTO, ../../crates/test_util/data/lib/libonnxruntime.so.1.17.3, ./open_jtalk_dic_utf_8-1.11
 Loading: ../../crates/test_util/data/model/sample.vvm
 Creating an AudioQuery from the text: この音声は、ボイスボックスを使用して、出力されています。
 Synthesizing...
diff --git a/example/kotlin/app/src/main/kotlin/app/App.kt b/example/kotlin/app/src/main/kotlin/app/App.kt
index 3e76043f4..7f2651020 100644
--- a/example/kotlin/app/src/main/kotlin/app/App.kt
+++ b/example/kotlin/app/src/main/kotlin/app/App.kt
@@ -15,6 +15,10 @@ fun main(args: Array<String>) {
   val mode by parser.option(ArgType.Choice<Mode>(), description = "モード").default(Mode.AUTO)
   val vvmPath by
       parser.option(ArgType.String, fullName = "vvm", description = "vvmファイルへのパス").required()
+  val onnxruntime by
+      parser
+          .option(ArgType.String, description = "ONNX Runtimeのファイル名（モジュール名）もしくはファイルパス")
+          .default(Onnxruntime.LIB_VERSIONED_FILENAME)
   val dictDir by
       parser
           .option(ArgType.String, description = "Open JTalkの辞書ディレクトリ")
@@ -28,10 +32,11 @@ fun main(args: Array<String>) {
 
   parser.parse(args)
 
-  println("Inititalizing: ${mode}, ${dictDir}")
+  println("Inititalizing: ${mode}, ${onnxruntime}, ${dictDir}")
+  val ort = Onnxruntime.loadOnce().filename(onnxruntime).exec()
   val openJtalk = OpenJtalk(dictDir)
   val synthesizer =
-      Synthesizer.builder(openJtalk)
+      Synthesizer.builder(ort, openJtalk)
           .accelerationMode(
               when (mode) {
                 Mode.AUTO -> Synthesizer.AccelerationMode.AUTO
diff --git a/example/python/run-asyncio.py b/example/python/run-asyncio.py
index 70d204a92..b75509183 100644
--- a/example/python/run-asyncio.py
+++ b/example/python/run-asyncio.py
@@ -8,9 +8,8 @@
 from pathlib import Path
 from typing import Tuple
 
-import voicevox_core
 from voicevox_core import AccelerationMode, AudioQuery
-from voicevox_core.asyncio import OpenJtalk, Synthesizer, VoiceModel
+from voicevox_core.asyncio import Onnxruntime, OpenJtalk, Synthesizer, VoiceModel
 
 
 async def main() -> None:
@@ -23,17 +22,23 @@ async def main() -> None:
     (
         acceleration_mode,
         vvm_path,
+        onnxruntime_filename,
         open_jtalk_dict_dir,
         text,
         out,
         style_id,
     ) = parse_args()
 
-    logger.debug("%s", f"{voicevox_core.supported_devices()=}")
+    logger.info("%s", f"Loading ONNX Runtime ({onnxruntime_filename=})")
+    onnxruntime = await Onnxruntime.load_once(filename=onnxruntime_filename)
+
+    logger.debug("%s", f"{onnxruntime.supported_devices()=}")
 
     logger.info("%s", f"Initializing ({acceleration_mode=}, {open_jtalk_dict_dir=})")
     synthesizer = Synthesizer(
-        await OpenJtalk.new(open_jtalk_dict_dir), acceleration_mode=acceleration_mode
+        onnxruntime,
+        await OpenJtalk.new(open_jtalk_dict_dir),
+        acceleration_mode=acceleration_mode,
     )
 
     logger.debug("%s", f"{synthesizer.metas=}")
@@ -53,7 +58,7 @@ async def main() -> None:
     logger.info("%s", f"Wrote `{out}`")
 
 
-def parse_args() -> Tuple[AccelerationMode, Path, Path, str, Path, int]:
+def parse_args() -> Tuple[AccelerationMode, Path, str, Path, str, Path, int]:
     argparser = ArgumentParser()
     argparser.add_argument(
         "--mode",
@@ -66,6 +71,11 @@ def parse_args() -> Tuple[AccelerationMode, Path, Path, str, Path, int]:
         type=Path,
         help="vvmファイルへのパス",
     )
+    argparser.add_argument(
+        "--onnxruntime",
+        default=Onnxruntime.LIB_VERSIONED_FILENAME,
+        help="ONNX Runtimeのライブラリのfilename",
+    )
     argparser.add_argument(
         "--dict-dir",
         default="./open_jtalk_dic_utf_8-1.11",
@@ -90,7 +100,16 @@ def parse_args() -> Tuple[AccelerationMode, Path, Path, str, Path, int]:
         help="話者IDを指定",
     )
     args = argparser.parse_args()
-    return (args.mode, args.vvm, args.dict_dir, args.text, args.out, args.style_id)
+    # FIXME: 流石に多くなってきたので、`dataclass`化する
+    return (
+        args.mode,
+        args.vvm,
+        args.onnxruntime,
+        args.dict_dir,
+        args.text,
+        args.out,
+        args.style_id,
+    )
 
 
 def display_as_json(audio_query: AudioQuery) -> str:
diff --git a/example/python/run.py b/example/python/run.py
index a57139b1c..3a9fdd9e7 100644
--- a/example/python/run.py
+++ b/example/python/run.py
@@ -5,9 +5,8 @@
 from pathlib import Path
 from typing import Tuple
 
-import voicevox_core
 from voicevox_core import AccelerationMode, AudioQuery
-from voicevox_core.blocking import OpenJtalk, Synthesizer, VoiceModel
+from voicevox_core.blocking import Onnxruntime, OpenJtalk, Synthesizer, VoiceModel
 
 
 def main() -> None:
@@ -20,17 +19,23 @@ def main() -> None:
     (
         acceleration_mode,
         vvm_path,
+        onnxruntime_filename,
         open_jtalk_dict_dir,
         text,
         out,
         style_id,
     ) = parse_args()
 
-    logger.debug("%s", f"{voicevox_core.supported_devices()=}")
+    logger.info("%s", f"Loading ONNX Runtime ({onnxruntime_filename=})")
+    onnxruntime = Onnxruntime.load_once(filename=onnxruntime_filename)
+
+    logger.debug("%s", f"{onnxruntime.supported_devices()=}")
 
     logger.info("%s", f"Initializing ({acceleration_mode=}, {open_jtalk_dict_dir=})")
     synthesizer = Synthesizer(
-        OpenJtalk(open_jtalk_dict_dir), acceleration_mode=acceleration_mode
+        onnxruntime,
+        OpenJtalk(open_jtalk_dict_dir),
+        acceleration_mode=acceleration_mode,
     )
 
     logger.debug("%s", f"{synthesizer.metas=}")
@@ -50,7 +55,7 @@ def main() -> None:
     logger.info("%s", f"Wrote `{out}`")
 
 
-def parse_args() -> Tuple[AccelerationMode, Path, Path, str, Path, int]:
+def parse_args() -> Tuple[AccelerationMode, Path, str, Path, str, Path, int]:
     argparser = ArgumentParser()
     argparser.add_argument(
         "--mode",
@@ -63,6 +68,11 @@ def parse_args() -> Tuple[AccelerationMode, Path, Path, str, Path, int]:
         type=Path,
         help="vvmファイルへのパス",
     )
+    argparser.add_argument(
+        "--onnxruntime",
+        default=Onnxruntime.LIB_VERSIONED_FILENAME,
+        help="ONNX Runtimeのライブラリのfilename",
+    )
     argparser.add_argument(
         "--dict-dir",
         default="./open_jtalk_dic_utf_8-1.11",
@@ -87,7 +97,16 @@ def parse_args() -> Tuple[AccelerationMode, Path, Path, str, Path, int]:
         help="話者IDを指定",
     )
     args = argparser.parse_args()
-    return (args.mode, args.vvm, args.dict_dir, args.text, args.out, args.style_id)
+    # FIXME: 流石に多くなってきたので、`dataclass`化する
+    return (
+        args.mode,
+        args.vvm,
+        args.onnxruntime,
+        args.dict_dir,
+        args.text,
+        args.out,
+        args.style_id,
+    )
 
 
 def display_as_json(audio_query: AudioQuery) -> str:

From 2dd2c8700f295fc77d748aa0b0f081d4fefe5254 Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Sun, 7 Jul 2024 12:48:10 +0900
Subject: [PATCH 12/36] =?UTF-8?q?refactor:=20Rust=20API=E3=81=AEAudioQuery?=
 =?UTF-8?q?=E7=B3=BB=E3=81=AE=E5=9E=8B=E5=90=8D=E3=81=8B=E3=82=89=E6=8E=A5?=
 =?UTF-8?q?=E5=B0=BE=E8=BE=9E"Model"=E3=82=92=E5=89=8A=E9=99=A4=20(#805)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* refactor: Rust APIのAudioQuery系の型名から接尾辞"Model"を削除

* doc修正

* fixup! doc修正
---
 .../src/engine/full_context_label.rs          |  64 +++++----
 .../voicevox_core/src/engine/kana_parser.rs   |  25 ++--
 crates/voicevox_core/src/engine/mod.rs        |   2 +-
 crates/voicevox_core/src/engine/model.rs      |  24 ++--
 crates/voicevox_core/src/lib.rs               |   2 +-
 crates/voicevox_core/src/synthesizer.rs       | 125 +++++++++---------
 crates/voicevox_core/src/text_analyzer.rs     |   8 +-
 crates/voicevox_core_c_api/src/helpers.rs     |   8 +-
 crates/voicevox_core_c_api/src/lib.rs         |  10 +-
 .../voicevox_core_java_api/src/synthesizer.rs |   8 +-
 .../voicevox_core_python_api/src/convert.rs   |  17 +--
 crates/voicevox_core_python_api/src/lib.rs    |  12 +-
 12 files changed, 142 insertions(+), 163 deletions(-)

diff --git a/crates/voicevox_core/src/engine/full_context_label.rs b/crates/voicevox_core/src/engine/full_context_label.rs
index 8b87048e5..4f95abbf2 100644
--- a/crates/voicevox_core/src/engine/full_context_label.rs
+++ b/crates/voicevox_core/src/engine/full_context_label.rs
@@ -1,10 +1,10 @@
 use std::str::FromStr;
 
 use crate::{
-    engine::{self, open_jtalk::FullcontextExtractor, MoraModel},
-    AccentPhraseModel,
+    engine::{self, open_jtalk::FullcontextExtractor},
+    AccentPhrase,
 };
-use jlabel::{Label, Mora};
+use jlabel::Label;
 use smallvec::SmallVec;
 
 // FIXME: 入力テキストをここで持って、メッセージに含む
@@ -33,7 +33,7 @@ type Result<T> = std::result::Result<T, FullContextLabelError>;
 pub(crate) fn extract_full_context_label(
     open_jtalk: &impl FullcontextExtractor,
     text: impl AsRef<str>,
-) -> Result<Vec<AccentPhraseModel>> {
+) -> Result<Vec<AccentPhrase>> {
     let labels = open_jtalk
         .extract_fullcontext(text.as_ref())
         .map_err(|source| FullContextLabelError {
@@ -58,7 +58,7 @@ pub(crate) fn extract_full_context_label(
 
 fn generate_accent_phrases(
     utterance: &[Label],
-) -> std::result::Result<Vec<AccentPhraseModel>, ErrorKind> {
+) -> std::result::Result<Vec<AccentPhrase>, ErrorKind> {
     let mut accent_phrases = Vec::with_capacity(
         utterance
             .first()
@@ -88,7 +88,7 @@ fn generate_accent_phrases(
         let pause_mora = if ap_curr.accent_phrase_position_backward == 1
             && bg_curr.breath_group_position_backward != 1
         {
-            Some(MoraModel::new(
+            Some(crate::Mora::new(
                 "、".into(),
                 None,
                 None,
@@ -103,7 +103,7 @@ fn generate_accent_phrases(
         // workaround for VOICEVOX/voicevox_engine#55
         let accent = usize::from(ap_curr.accent_position).min(moras.len());
 
-        accent_phrases.push(AccentPhraseModel::new(
+        accent_phrases.push(AccentPhrase::new(
             moras,
             accent,
             pause_mora,
@@ -113,7 +113,7 @@ fn generate_accent_phrases(
     Ok(accent_phrases)
 }
 
-fn generate_moras(accent_phrase: &[Label]) -> std::result::Result<Vec<MoraModel>, ErrorKind> {
+fn generate_moras(accent_phrase: &[Label]) -> std::result::Result<Vec<crate::Mora>, ErrorKind> {
     let mut moras = Vec::with_capacity(accent_phrase.len());
 
     let split = accent_phrase.chunk_by(|a, b| a.mora == b.mora);
@@ -136,7 +136,7 @@ fn generate_moras(accent_phrase: &[Label]) -> std::result::Result<Vec<MoraModel>
             // position_forwardとposition_backwardが飽和している場合は無視する
             [Label {
                 mora:
-                    Some(Mora {
+                    Some(jlabel::Mora {
                         position_forward: 49,
                         position_backward: 49,
                         ..
@@ -151,10 +151,10 @@ fn generate_moras(accent_phrase: &[Label]) -> std::result::Result<Vec<MoraModel>
     Ok(moras)
 }
 
-fn generate_mora(consonant: Option<&Label>, vowel: &Label) -> MoraModel {
+fn generate_mora(consonant: Option<&Label>, vowel: &Label) -> crate::Mora {
     let consonant_phoneme = consonant.and_then(|c| c.phoneme.c.to_owned());
     let vowel_phoneme = vowel.phoneme.c.as_deref().unwrap();
-    MoraModel::new(
+    crate::Mora::new(
         mora_to_text(consonant_phoneme.as_deref(), vowel_phoneme),
         consonant_phoneme,
         consonant.and(Some(0.0)),
@@ -190,14 +190,14 @@ mod tests {
         engine::{
             full_context_label::{extract_full_context_label, generate_accent_phrases},
             open_jtalk::FullcontextExtractor,
-            MoraModel,
+            Mora,
         },
-        AccentPhraseModel,
+        AccentPhrase,
     };
     use jlabel::Label;
 
-    fn mora(text: &str, consonant: Option<&str>, vowel: &str) -> MoraModel {
-        MoraModel::new(
+    fn mora(text: &str, consonant: Option<&str>, vowel: &str) -> Mora {
+        Mora::new(
             text.into(),
             consonant.map(|c| c.into()),
             consonant.and(Some(0.0)),
@@ -218,7 +218,7 @@ mod tests {
             "y^e-sil+xx=xx/A:xx+xx+xx/B:xx-xx_xx/C:xx_xx+xx/D:xx+xx_xx/E:1_1!0_xx-xx/F:xx_xx#xx_xx@xx_xx|xx_xx/G:xx_xx%xx_xx_xx/H:1_1/I:xx-xx@xx+xx&xx-xx|xx+xx/J:xx_xx/K:1+1-1",
         ],
         &[
-            AccentPhraseModel::new(
+            AccentPhrase::new(
                 vec![mora("イェ", Some("y"), "e")],
                 1,
                 None,
@@ -236,7 +236,7 @@ mod tests {
             "N^cl-sil+xx=xx/A:xx+xx+xx/B:09-xx_xx/C:xx_xx+xx/D:xx+xx_xx/E:3_3!0_xx-xx/F:xx_xx#xx_xx@xx_xx|xx_xx/G:xx_xx%xx_xx_xx/H:1_3/I:xx-xx@xx+xx&xx-xx|xx+xx/J:xx_xx/K:1+1-3",
         ],
         &[
-            AccentPhraseModel::new(
+            AccentPhrase::new(
                 vec![
                     mora("ン", None, "N"),
                     mora("ン", None, "N"),
@@ -271,7 +271,7 @@ mod tests {
             "s^U-sil+xx=xx/A:xx+xx+xx/B:10-7_2/C:xx_xx+xx/D:xx+xx_xx/E:5_1!0_xx-xx/F:xx_xx#xx_xx@xx_xx|xx_xx/G:xx_xx%xx_xx_xx/H:2_8/I:xx-xx@xx+xx&xx-xx|xx+xx/J:xx_xx/K:1+2-8",
         ],
         &[
-            AccentPhraseModel::new(
+            AccentPhrase::new(
                 vec![
                     mora("コ", Some("k"), "o"),
                     mora("レ", Some("r"), "e"),
@@ -281,7 +281,7 @@ mod tests {
                 None,
                 false,
             ),
-            AccentPhraseModel::new(
+            AccentPhrase::new(
                 vec![
                     mora("テ", Some("t"), "e"),
                     mora("ス", Some("s"), "U"),
@@ -324,7 +324,7 @@ mod tests {
             "k^u-sil+xx=xx/A:xx+xx+xx/B:05-xx_xx/C:xx_xx+xx/D:xx+xx_xx/E:4_2!1_xx-xx/F:xx_xx#xx_xx@xx_xx|xx_xx/G:xx_xx%xx_xx_xx/H:1_4/I:xx-xx@xx+xx&xx-xx|xx+xx/J:xx_xx/K:4+4-12",
         ],
         &[
-            AccentPhraseModel::new(
+            AccentPhrase::new(
                 vec![
                     mora("イ", None, "i"),
                     mora("チ", Some("ch"), "i"),
@@ -333,7 +333,7 @@ mod tests {
                 Some(mora("、", None, "pau")),
                 false,
             ),
-            AccentPhraseModel::new(
+            AccentPhrase::new(
                 vec![
                     mora("セ", Some("s"), "e"),
                     mora("ン", None, "N"),
@@ -342,7 +342,7 @@ mod tests {
                 Some(mora("、", None, "pau")),
                 false,
             ),
-            AccentPhraseModel::new(
+            AccentPhrase::new(
                 vec![
                     mora("ヒャ", Some("hy"), "a"),
                     mora("ク", Some("k"), "u"),
@@ -353,7 +353,7 @@ mod tests {
                 Some(mora("、", None, "pau")),
                 false,
             ),
-            AccentPhraseModel::new(
+            AccentPhrase::new(
                 vec![
                     mora("イ", None, "i"),
                     mora("チ", Some("ch"), "i"),
@@ -386,7 +386,7 @@ mod tests {
             "a^a-sil+xx=xx/A:xx+xx+xx/B:09-xx_xx/C:xx_xx+xx/D:xx+xx_xx/E:1_1!0_xx-xx/F:xx_xx#xx_xx@xx_xx|xx_xx/G:xx_xx%xx_xx_xx/H:2_3/I:xx-xx@xx+xx&xx-xx|xx+xx/J:xx_xx/K:2+3-8",
         ],
         &[
-            AccentPhraseModel::new(
+            AccentPhrase::new(
                 vec![
                     mora("クヮ", Some("kw"), "a"),
                     mora("ル", Some("r"), "u"),
@@ -398,7 +398,7 @@ mod tests {
                 Some(mora("、", None, "pau")),
                 false,
             ),
-            AccentPhraseModel::new(
+            AccentPhrase::new(
                 vec![
                     mora("ア", None, "a"),
                     mora("ア", None, "a"),
@@ -407,7 +407,7 @@ mod tests {
                 None,
                 false,
             ),
-            AccentPhraseModel::new(
+            AccentPhrase::new(
                 vec![mora("ア", None, "a")],
                 1,
                 None,
@@ -418,13 +418,13 @@ mod tests {
     fn label_cases(
         #[case] text: &str,
         #[case] labels: &[&str],
-        #[case] accent_phrase: &[AccentPhraseModel],
+        #[case] accent_phrase: &[AccentPhrase],
     ) {
     }
 
     #[apply(label_cases)]
     #[tokio::test]
-    async fn open_jtalk(text: &str, labels: &[&str], _accent_phrase: &[AccentPhraseModel]) {
+    async fn open_jtalk(text: &str, labels: &[&str], _accent_phrase: &[AccentPhrase]) {
         let open_jtalk = crate::tokio::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
             .await
             .unwrap();
@@ -432,7 +432,7 @@ mod tests {
     }
 
     #[apply(label_cases)]
-    fn parse_labels(_text: &str, labels: &[&str], accent_phrase: &[AccentPhraseModel]) {
+    fn parse_labels(_text: &str, labels: &[&str], accent_phrase: &[AccentPhrase]) {
         let parsed_labels = labels
             .iter()
             .map(|s| Label::from_str(s).unwrap())
@@ -446,11 +446,7 @@ mod tests {
 
     #[apply(label_cases)]
     #[tokio::test]
-    async fn extract_fullcontext(
-        text: &str,
-        _labels: &[&str],
-        accent_phrase: &[AccentPhraseModel],
-    ) {
+    async fn extract_fullcontext(text: &str, _labels: &[&str], accent_phrase: &[AccentPhrase]) {
         let open_jtalk = crate::tokio::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
             .await
             .unwrap();
diff --git a/crates/voicevox_core/src/engine/kana_parser.rs b/crates/voicevox_core/src/engine/kana_parser.rs
index eaa3d93c1..42f17dc63 100644
--- a/crates/voicevox_core/src/engine/kana_parser.rs
+++ b/crates/voicevox_core/src/engine/kana_parser.rs
@@ -1,4 +1,4 @@
-use crate::engine::model::{AccentPhraseModel, MoraModel};
+use crate::engine::model::{AccentPhrase, Mora};
 use crate::engine::mora_list::MORA_LIST_MINIMUM;
 use once_cell::sync::Lazy;
 use std::collections::HashMap;
@@ -16,7 +16,7 @@ pub(crate) struct KanaParseError(String);
 
 type KanaParseResult<T> = std::result::Result<T, KanaParseError>;
 
-static TEXT2MORA_WITH_UNVOICE: Lazy<HashMap<String, MoraModel>> = Lazy::new(|| {
+static TEXT2MORA_WITH_UNVOICE: Lazy<HashMap<String, Mora>> = Lazy::new(|| {
     let mut text2mora_with_unvoice = HashMap::new();
     for [text, consonant, vowel] in MORA_LIST_MINIMUM {
         let consonant = if !consonant.is_empty() {
@@ -28,7 +28,7 @@ static TEXT2MORA_WITH_UNVOICE: Lazy<HashMap<String, MoraModel>> = Lazy::new(|| {
 
         if ["a", "i", "u", "e", "o"].contains(vowel) {
             let upper_vowel = vowel.to_uppercase();
-            let unvoice_mora = MoraModel::new(
+            let unvoice_mora = Mora::new(
                 text.to_string(),
                 consonant.clone(),
                 consonant_length,
@@ -39,7 +39,7 @@ static TEXT2MORA_WITH_UNVOICE: Lazy<HashMap<String, MoraModel>> = Lazy::new(|| {
             text2mora_with_unvoice.insert(UNVOICE_SYMBOL.to_string() + text, unvoice_mora);
         }
 
-        let mora = MoraModel::new(
+        let mora = Mora::new(
             text.to_string(),
             consonant,
             consonant_length,
@@ -52,10 +52,10 @@ static TEXT2MORA_WITH_UNVOICE: Lazy<HashMap<String, MoraModel>> = Lazy::new(|| {
     text2mora_with_unvoice
 });
 
-fn text_to_accent_phrase(phrase: &str) -> KanaParseResult<AccentPhraseModel> {
+fn text_to_accent_phrase(phrase: &str) -> KanaParseResult<AccentPhrase> {
     let phrase_vec: Vec<char> = phrase.chars().collect();
     let mut accent_index: Option<usize> = None;
-    let mut moras: Vec<MoraModel> = Vec::new();
+    let mut moras: Vec<Mora> = Vec::new();
     let mut stack = String::new();
     let mut matched_text: Option<String> = None;
     let text2mora = &TEXT2MORA_WITH_UNVOICE;
@@ -107,15 +107,10 @@ fn text_to_accent_phrase(phrase: &str) -> KanaParseResult<AccentPhraseModel> {
             "accent not found in accent phrase: {phrase}"
         )));
     }
-    Ok(AccentPhraseModel::new(
-        moras,
-        accent_index.unwrap(),
-        None,
-        false,
-    ))
+    Ok(AccentPhrase::new(moras, accent_index.unwrap(), None, false))
 }
 
-pub(crate) fn parse_kana(text: &str) -> KanaParseResult<Vec<AccentPhraseModel>> {
+pub(crate) fn parse_kana(text: &str) -> KanaParseResult<Vec<AccentPhrase>> {
     const TERMINATOR: char = '\0';
     let mut parsed_result = Vec::new();
     let chars_of_text = text.chars().chain([TERMINATOR]);
@@ -142,7 +137,7 @@ pub(crate) fn parse_kana(text: &str) -> KanaParseResult<Vec<AccentPhraseModel>>
             let accent_phrase = {
                 let mut accent_phrase = text_to_accent_phrase(&phrase)?;
                 if letter == PAUSE_DELIMITER {
-                    accent_phrase.set_pause_mora(Some(MoraModel::new(
+                    accent_phrase.set_pause_mora(Some(Mora::new(
                         PAUSE_DELIMITER.to_string(),
                         None,
                         None,
@@ -163,7 +158,7 @@ pub(crate) fn parse_kana(text: &str) -> KanaParseResult<Vec<AccentPhraseModel>>
     Ok(parsed_result)
 }
 
-pub(crate) fn create_kana(accent_phrases: &[AccentPhraseModel]) -> String {
+pub(crate) fn create_kana(accent_phrases: &[AccentPhrase]) -> String {
     let mut text = String::new();
     for phrase in accent_phrases {
         let moras = phrase.moras();
diff --git a/crates/voicevox_core/src/engine/mod.rs b/crates/voicevox_core/src/engine/mod.rs
index 95fe3d562..d446a7253 100644
--- a/crates/voicevox_core/src/engine/mod.rs
+++ b/crates/voicevox_core/src/engine/mod.rs
@@ -10,6 +10,6 @@ pub(crate) use self::full_context_label::{
     extract_full_context_label, mora_to_text, FullContextLabelError,
 };
 pub(crate) use self::kana_parser::{create_kana, parse_kana, KanaParseError};
-pub use self::model::{AccentPhraseModel, AudioQueryModel, MoraModel};
+pub use self::model::{AccentPhrase, AudioQuery, Mora};
 pub(crate) use self::mora_list::mora2text;
 pub use self::open_jtalk::FullcontextExtractor;
diff --git a/crates/voicevox_core/src/engine/model.rs b/crates/voicevox_core/src/engine/model.rs
index de0f388f9..09f53b6ee 100644
--- a/crates/voicevox_core/src/engine/model.rs
+++ b/crates/voicevox_core/src/engine/model.rs
@@ -6,7 +6,7 @@ use serde::{Deserialize, Serialize};
 
 /// モーラ（子音＋母音）ごとの情報。
 #[derive(Clone, Debug, new, Getters, Deserialize, Serialize, PartialEq)]
-pub struct MoraModel {
+pub struct Mora {
     /// 文字。
     text: String,
     /// 子音の音素。
@@ -23,20 +23,20 @@ pub struct MoraModel {
 
 /// AccentPhrase (アクセント句ごとの情報)。
 #[derive(Clone, Debug, new, Getters, Deserialize, Serialize, PartialEq)]
-pub struct AccentPhraseModel {
+pub struct AccentPhrase {
     /// モーラの配列。
-    moras: Vec<MoraModel>,
+    moras: Vec<Mora>,
     /// アクセント箇所。
     accent: usize,
     /// 後ろに無音を付けるかどうか。
-    pause_mora: Option<MoraModel>,
+    pause_mora: Option<Mora>,
     /// 疑問系かどうか。
     #[serde(default)]
     is_interrogative: bool,
 }
 
-impl AccentPhraseModel {
-    pub(super) fn set_pause_mora(&mut self, pause_mora: Option<MoraModel>) {
+impl AccentPhrase {
+    pub(super) fn set_pause_mora(&mut self, pause_mora: Option<Mora>) {
         self.pause_mora = pause_mora;
     }
 
@@ -48,9 +48,9 @@ impl AccentPhraseModel {
 /// AudioQuery (音声合成用のクエリ)。
 #[allow(clippy::too_many_arguments)]
 #[derive(Clone, new, Getters, Deserialize, Serialize)]
-pub struct AudioQueryModel {
+pub struct AudioQuery {
     /// アクセント句の配列。
-    accent_phrases: Vec<AccentPhraseModel>,
+    accent_phrases: Vec<AccentPhrase>,
     /// 全体の話速。
     speed_scale: f32,
     /// 全体の音高。
@@ -76,7 +76,7 @@ pub struct AudioQueryModel {
     kana: Option<String>,
 }
 
-impl AudioQueryModel {
+impl AudioQuery {
     pub(crate) fn with_kana(self, kana: Option<String>) -> Self {
         Self { kana, ..self }
     }
@@ -88,12 +88,12 @@ mod tests {
     use rstest::rstest;
     use serde_json::json;
 
-    use super::AudioQueryModel;
+    use super::AudioQuery;
 
     #[rstest]
     fn check_audio_query_model_json_field_snake_case() {
         let audio_query_model =
-            AudioQueryModel::new(vec![], 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0, false, None);
+            AudioQuery::new(vec![], 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0, false, None);
         let val = serde_json::to_value(audio_query_model).unwrap();
         check_json_field_snake_case(&val);
     }
@@ -120,7 +120,7 @@ mod tests {
 
     #[rstest]
     fn it_accepts_json_without_optional_fields() -> anyhow::Result<()> {
-        serde_json::from_value::<AudioQueryModel>(json!({
+        serde_json::from_value::<AudioQuery>(json!({
             "accent_phrases": [
                 {
                     "moras": [
diff --git a/crates/voicevox_core/src/lib.rs b/crates/voicevox_core/src/lib.rs
index 910f9eeef..25ff64f9e 100644
--- a/crates/voicevox_core/src/lib.rs
+++ b/crates/voicevox_core/src/lib.rs
@@ -93,7 +93,7 @@ use rstest_reuse;
 
 pub use self::{
     devices::SupportedDevices,
-    engine::{AccentPhraseModel, AudioQueryModel, FullcontextExtractor},
+    engine::{AccentPhrase, AudioQuery, FullcontextExtractor, Mora},
     error::{Error, ErrorKind},
     metas::{
         RawStyleId, RawStyleVersion, SpeakerMeta, StyleId, StyleMeta, StyleType, StyleVersion,
diff --git a/crates/voicevox_core/src/synthesizer.rs b/crates/voicevox_core/src/synthesizer.rs
index 767d27b1c..4f9576500 100644
--- a/crates/voicevox_core/src/synthesizer.rs
+++ b/crates/voicevox_core/src/synthesizer.rs
@@ -76,7 +76,7 @@ pub(crate) mod blocking {
     use enum_map::enum_map;
 
     use crate::{
-        engine::{create_kana, mora_to_text, MoraModel, OjtPhoneme},
+        engine::{create_kana, mora_to_text, Mora, OjtPhoneme},
         error::ErrorRepr,
         infer::{
             domains::{
@@ -88,8 +88,8 @@ pub(crate) mod blocking {
         },
         status::Status,
         text_analyzer::{KanaAnalyzer, OpenJTalkAnalyzer, TextAnalyzer},
-        AccentPhraseModel, AudioQueryModel, FullcontextExtractor, Result, StyleId,
-        SynthesisOptions, VoiceModelId, VoiceModelMeta,
+        AccentPhrase, AudioQuery, FullcontextExtractor, Result, StyleId, SynthesisOptions,
+        VoiceModelId, VoiceModelMeta,
     };
 
     use super::{AccelerationMode, InitializeOptions, TtsOptions};
@@ -243,7 +243,7 @@ pub(crate) mod blocking {
         /// AudioQueryから音声合成を行う。
         pub fn synthesis(
             &self,
-            audio_query: &AudioQueryModel,
+            audio_query: &AudioQuery,
             style_id: StyleId,
             options: &SynthesisOptions,
         ) -> Result<Vec<u8>> {
@@ -352,12 +352,12 @@ pub(crate) mod blocking {
             return Ok(to_wav(wave, audio_query));
 
             fn adjust_interrogative_accent_phrases(
-                accent_phrases: &[AccentPhraseModel],
-            ) -> Vec<AccentPhraseModel> {
+                accent_phrases: &[AccentPhrase],
+            ) -> Vec<AccentPhrase> {
                 accent_phrases
                     .iter()
                     .map(|accent_phrase| {
-                        AccentPhraseModel::new(
+                        AccentPhrase::new(
                             adjust_interrogative_moras(accent_phrase),
                             *accent_phrase.accent(),
                             accent_phrase.pause_mora().clone(),
@@ -367,13 +367,13 @@ pub(crate) mod blocking {
                     .collect()
             }
 
-            fn adjust_interrogative_moras(accent_phrase: &AccentPhraseModel) -> Vec<MoraModel> {
+            fn adjust_interrogative_moras(accent_phrase: &AccentPhrase) -> Vec<Mora> {
                 let moras = accent_phrase.moras();
                 if *accent_phrase.is_interrogative() && !moras.is_empty() {
                     let last_mora = moras.last().unwrap();
                     let last_mora_pitch = *last_mora.pitch();
                     if last_mora_pitch != 0.0 {
-                        let mut new_moras: Vec<MoraModel> = Vec::with_capacity(moras.len() + 1);
+                        let mut new_moras: Vec<Mora> = Vec::with_capacity(moras.len() + 1);
                         new_moras.extend_from_slice(moras.as_slice());
                         let interrogative_mora = make_interrogative_mora(last_mora);
                         new_moras.push(interrogative_mora);
@@ -383,14 +383,14 @@ pub(crate) mod blocking {
                 moras.clone()
             }
 
-            fn make_interrogative_mora(last_mora: &MoraModel) -> MoraModel {
+            fn make_interrogative_mora(last_mora: &Mora) -> Mora {
                 const FIX_VOWEL_LENGTH: f32 = 0.15;
                 const ADJUST_PITCH: f32 = 0.3;
                 const MAX_PITCH: f32 = 6.5;
 
                 let pitch = (*last_mora.pitch() + ADJUST_PITCH).min(MAX_PITCH);
 
-                MoraModel::new(
+                Mora::new(
                     mora_to_text(None, last_mora.vowel()),
                     None,
                     None,
@@ -400,7 +400,7 @@ pub(crate) mod blocking {
                 )
             }
 
-            fn to_wav(wave: &[f32], audio_query: &AudioQueryModel) -> Vec<u8> {
+            fn to_wav(wave: &[f32], audio_query: &AudioQuery) -> Vec<u8> {
                 let volume_scale = *audio_query.volume_scale();
                 let output_stereo = *audio_query.output_stereo();
                 let output_sampling_rate = *audio_query.output_sampling_rate();
@@ -475,7 +475,7 @@ pub(crate) mod blocking {
             &self,
             kana: &str,
             style_id: StyleId,
-        ) -> Result<Vec<AccentPhraseModel>> {
+        ) -> Result<Vec<AccentPhrase>> {
             let accent_phrases = self.kana_analyzer.analyze(kana)?;
             self.replace_mora_data(&accent_phrases, style_id)
         }
@@ -483,9 +483,9 @@ pub(crate) mod blocking {
         /// AccentPhraseの配列の音高・音素長を、特定の声で生成しなおす。
         pub fn replace_mora_data(
             &self,
-            accent_phrases: &[AccentPhraseModel],
+            accent_phrases: &[AccentPhrase],
             style_id: StyleId,
-        ) -> Result<Vec<AccentPhraseModel>> {
+        ) -> Result<Vec<AccentPhrase>> {
             let accent_phrases = self.replace_phoneme_length(accent_phrases, style_id)?;
             self.replace_mora_pitch(&accent_phrases, style_id)
         }
@@ -493,9 +493,9 @@ pub(crate) mod blocking {
         /// AccentPhraseの配列の音素長を、特定の声で生成しなおす。
         pub fn replace_phoneme_length(
             &self,
-            accent_phrases: &[AccentPhraseModel],
+            accent_phrases: &[AccentPhrase],
             style_id: StyleId,
-        ) -> Result<Vec<AccentPhraseModel>> {
+        ) -> Result<Vec<AccentPhrase>> {
             let (_, phoneme_data_list) = initial_process(accent_phrases);
 
             let (_, _, vowel_indexes_data) = split_mora(&phoneme_data_list);
@@ -510,12 +510,12 @@ pub(crate) mod blocking {
             let new_accent_phrases = accent_phrases
                 .iter()
                 .map(|accent_phrase| {
-                    AccentPhraseModel::new(
+                    AccentPhrase::new(
                         accent_phrase
                             .moras()
                             .iter()
                             .map(|mora| {
-                                let new_mora = MoraModel::new(
+                                let new_mora = Mora::new(
                                     mora.text().clone(),
                                     mora.consonant().clone(),
                                     mora.consonant().as_ref().map(|_| {
@@ -531,7 +531,7 @@ pub(crate) mod blocking {
                             .collect(),
                         *accent_phrase.accent(),
                         accent_phrase.pause_mora().as_ref().map(|pause_mora| {
-                            let new_pause_mora = MoraModel::new(
+                            let new_pause_mora = Mora::new(
                                 pause_mora.text().clone(),
                                 pause_mora.consonant().clone(),
                                 *pause_mora.consonant_length(),
@@ -553,9 +553,9 @@ pub(crate) mod blocking {
         /// AccentPhraseの配列の音高を、特定の声で生成しなおす。
         pub fn replace_mora_pitch(
             &self,
-            accent_phrases: &[AccentPhraseModel],
+            accent_phrases: &[AccentPhrase],
             style_id: StyleId,
-        ) -> Result<Vec<AccentPhraseModel>> {
+        ) -> Result<Vec<AccentPhrase>> {
             let (_, phoneme_data_list) = initial_process(accent_phrases);
 
             let mut base_start_accent_list = vec![0];
@@ -626,12 +626,12 @@ pub(crate) mod blocking {
             let new_accent_phrases = accent_phrases
                 .iter()
                 .map(|accent_phrase| {
-                    AccentPhraseModel::new(
+                    AccentPhrase::new(
                         accent_phrase
                             .moras()
                             .iter()
                             .map(|mora| {
-                                let new_mora = MoraModel::new(
+                                let new_mora = Mora::new(
                                     mora.text().clone(),
                                     mora.consonant().clone(),
                                     *mora.consonant_length(),
@@ -645,7 +645,7 @@ pub(crate) mod blocking {
                             .collect(),
                         *accent_phrase.accent(),
                         accent_phrase.pause_mora().as_ref().map(|pause_mora| {
-                            let new_pause_mora = MoraModel::new(
+                            let new_pause_mora = Mora::new(
                                 pause_mora.text().clone(),
                                 pause_mora.consonant().clone(),
                                 *pause_mora.consonant_length(),
@@ -665,7 +665,7 @@ pub(crate) mod blocking {
 
             fn create_one_accent_list(
                 accent_list: &mut Vec<i64>,
-                accent_phrase: &AccentPhraseModel,
+                accent_phrase: &AccentPhrase,
                 point: i32,
             ) {
                 let mut one_accent_list: Vec<i64> = Vec::new();
@@ -712,15 +712,10 @@ pub(crate) mod blocking {
         /// # }
         /// ```
         ///
-        /// [AudioQuery]: crate::AudioQueryModel
-        pub fn audio_query_from_kana(
-            &self,
-            kana: &str,
-            style_id: StyleId,
-        ) -> Result<AudioQueryModel> {
+        /// [AudioQuery]: crate::AudioQuery
+        pub fn audio_query_from_kana(&self, kana: &str, style_id: StyleId) -> Result<AudioQuery> {
             let accent_phrases = self.create_accent_phrases_from_kana(kana, style_id)?;
-            Ok(AudioQueryModel::from_accent_phrases(accent_phrases)
-                .with_kana(Some(kana.to_owned())))
+            Ok(AudioQuery::from_accent_phrases(accent_phrases).with_kana(Some(kana.to_owned())))
         }
 
         /// AquesTalk風記法から音声合成を行う。
@@ -764,7 +759,7 @@ pub(crate) mod blocking {
             &self,
             text: &str,
             style_id: StyleId,
-        ) -> Result<Vec<AccentPhraseModel>> {
+        ) -> Result<Vec<AccentPhrase>> {
             let accent_phrases = self.open_jtalk_analyzer.analyze(text)?;
             self.replace_mora_data(&accent_phrases, style_id)
         }
@@ -794,10 +789,10 @@ pub(crate) mod blocking {
         /// # }
         /// ```
         ///
-        /// [AudioQuery]: crate::AudioQueryModel
-        pub fn audio_query(&self, text: &str, style_id: StyleId) -> Result<AudioQueryModel> {
+        /// [AudioQuery]: crate::AudioQuery
+        pub fn audio_query(&self, text: &str, style_id: StyleId) -> Result<AudioQuery> {
             let accent_phrases = self.create_accent_phrases(text, style_id)?;
-            Ok(AudioQueryModel::from_accent_phrases(accent_phrases))
+            Ok(AudioQuery::from_accent_phrases(accent_phrases))
         }
 
         /// 日本語のテキストから音声合成を行う。
@@ -1036,7 +1031,7 @@ pub(crate) mod blocking {
         }
     }
 
-    fn initial_process(accent_phrases: &[AccentPhraseModel]) -> (Vec<MoraModel>, Vec<OjtPhoneme>) {
+    fn initial_process(accent_phrases: &[AccentPhrase]) -> (Vec<Mora>, Vec<OjtPhoneme>) {
         let flatten_moras = to_flatten_moras(accent_phrases);
 
         let mut phoneme_strings = vec!["pau".to_string()];
@@ -1052,7 +1047,7 @@ pub(crate) mod blocking {
 
         return (flatten_moras, phoneme_data_list);
 
-        fn to_flatten_moras(accent_phrases: &[AccentPhraseModel]) -> Vec<MoraModel> {
+        fn to_flatten_moras(accent_phrases: &[AccentPhrase]) -> Vec<Mora> {
             let mut flatten_moras = Vec::new();
 
             for accent_phrase in accent_phrases {
@@ -1114,8 +1109,8 @@ pub(crate) mod blocking {
         (consonant_phoneme_list, vowel_phoneme_list, vowel_indexes)
     }
 
-    impl AudioQueryModel {
-        fn from_accent_phrases(accent_phrases: Vec<AccentPhraseModel>) -> Self {
+    impl AudioQuery {
+        fn from_accent_phrases(accent_phrases: Vec<AccentPhrase>) -> Self {
             let kana = create_kana(&accent_phrases);
             Self::new(
                 accent_phrases,
@@ -1137,8 +1132,8 @@ pub(crate) mod tokio {
     use std::sync::Arc;
 
     use crate::{
-        AccentPhraseModel, AudioQueryModel, FullcontextExtractor, Result, StyleId,
-        SynthesisOptions, VoiceModelId, VoiceModelMeta,
+        AccentPhrase, AudioQuery, FullcontextExtractor, Result, StyleId, SynthesisOptions,
+        VoiceModelId, VoiceModelMeta,
     };
 
     use super::{InitializeOptions, TtsOptions};
@@ -1191,7 +1186,7 @@ pub(crate) mod tokio {
 
         pub async fn synthesis(
             &self,
-            audio_query: &AudioQueryModel,
+            audio_query: &AudioQuery,
             style_id: StyleId,
             options: &SynthesisOptions,
         ) -> Result<Vec<u8>> {
@@ -1207,7 +1202,7 @@ pub(crate) mod tokio {
             &self,
             kana: &str,
             style_id: StyleId,
-        ) -> Result<Vec<AccentPhraseModel>> {
+        ) -> Result<Vec<AccentPhrase>> {
             let blocking = self.0.clone();
             let kana = kana.to_owned();
 
@@ -1217,9 +1212,9 @@ pub(crate) mod tokio {
 
         pub async fn replace_mora_data(
             &self,
-            accent_phrases: &[AccentPhraseModel],
+            accent_phrases: &[AccentPhrase],
             style_id: StyleId,
-        ) -> Result<Vec<AccentPhraseModel>> {
+        ) -> Result<Vec<AccentPhrase>> {
             let blocking = self.0.clone();
             let accent_phrases = accent_phrases.to_owned();
 
@@ -1229,9 +1224,9 @@ pub(crate) mod tokio {
 
         pub async fn replace_phoneme_length(
             &self,
-            accent_phrases: &[AccentPhraseModel],
+            accent_phrases: &[AccentPhrase],
             style_id: StyleId,
-        ) -> Result<Vec<AccentPhraseModel>> {
+        ) -> Result<Vec<AccentPhrase>> {
             let blocking = self.0.clone();
             let accent_phrases = accent_phrases.to_owned();
 
@@ -1243,9 +1238,9 @@ pub(crate) mod tokio {
 
         pub async fn replace_mora_pitch(
             &self,
-            accent_phrases: &[AccentPhraseModel],
+            accent_phrases: &[AccentPhrase],
             style_id: StyleId,
-        ) -> Result<Vec<AccentPhraseModel>> {
+        ) -> Result<Vec<AccentPhrase>> {
             let blocking = self.0.clone();
             let accent_phrases = accent_phrases.to_owned();
 
@@ -1257,7 +1252,7 @@ pub(crate) mod tokio {
             &self,
             kana: &str,
             style_id: StyleId,
-        ) -> Result<AudioQueryModel> {
+        ) -> Result<AudioQuery> {
             let blocking = self.0.clone();
             let kana = kana.to_owned();
 
@@ -1283,14 +1278,14 @@ pub(crate) mod tokio {
             &self,
             text: &str,
             style_id: StyleId,
-        ) -> Result<Vec<AccentPhraseModel>> {
+        ) -> Result<Vec<AccentPhrase>> {
             let blocking = self.0.clone();
             let text = text.to_owned();
 
             crate::task::asyncify(move || blocking.create_accent_phrases(&text, style_id)).await
         }
 
-        pub async fn audio_query(&self, text: &str, style_id: StyleId) -> Result<AudioQueryModel> {
+        pub async fn audio_query(&self, text: &str, style_id: StyleId) -> Result<AudioQuery> {
             let blocking = self.0.clone();
             let text = text.to_owned();
 
@@ -1316,9 +1311,7 @@ pub(crate) mod tokio {
 mod tests {
 
     use super::{blocking::PerformInference as _, AccelerationMode, InitializeOptions};
-    use crate::{
-        engine::MoraModel, macros::tests::assert_debug_fmt_eq, AccentPhraseModel, Result, StyleId,
-    };
+    use crate::{engine::Mora, macros::tests::assert_debug_fmt_eq, AccentPhrase, Result, StyleId};
     use ::test_util::OPEN_JTALK_DIC_DIR;
     use rstest::rstest;
 
@@ -1740,7 +1733,7 @@ mod tests {
         assert_eq!(accent_phrases.len(), 5);
 
         // 入力テキストに「、」や「。」などの句読点が含まれていたときに
-        // AccentPhraseModel の pause_mora に期待する値をテスト
+        // AccentPhraseの pause_mora に期待する値をテスト
 
         assert!(
             accent_phrases[0].pause_mora().is_some(),
@@ -1812,7 +1805,7 @@ mod tests {
             any_mora_param_changed(
                 &accent_phrases,
                 &modified_accent_phrases,
-                MoraModel::vowel_length
+                Mora::vowel_length
             ),
             "mora_length() does not work: mora.vowel_length() is not changed."
         );
@@ -1850,7 +1843,7 @@ mod tests {
 
         // NOTE: 一つでも音高が変わっていれば、動作しているとみなす
         assert!(
-            any_mora_param_changed(&accent_phrases, &modified_accent_phrases, MoraModel::pitch),
+            any_mora_param_changed(&accent_phrases, &modified_accent_phrases, Mora::pitch),
             "mora_pitch() does not work: mora.pitch() is not changed."
         );
     }
@@ -1887,7 +1880,7 @@ mod tests {
 
         // NOTE: 一つでも音高が変わっていれば、動作しているとみなす
         assert!(
-            any_mora_param_changed(&accent_phrases, &modified_accent_phrases, MoraModel::pitch),
+            any_mora_param_changed(&accent_phrases, &modified_accent_phrases, Mora::pitch),
             "mora_data() does not work: mora.pitch() is not changed."
         );
         // NOTE: 一つでも母音の長さが変わっていれば、動作しているとみなす
@@ -1895,16 +1888,16 @@ mod tests {
             any_mora_param_changed(
                 &accent_phrases,
                 &modified_accent_phrases,
-                MoraModel::vowel_length
+                Mora::vowel_length
             ),
             "mora_data() does not work: mora.vowel_length() is not changed."
         );
     }
 
     fn any_mora_param_changed<T: PartialEq>(
-        before: &[AccentPhraseModel],
-        after: &[AccentPhraseModel],
-        param: fn(&MoraModel) -> &T,
+        before: &[AccentPhrase],
+        after: &[AccentPhrase],
+        param: fn(&Mora) -> &T,
     ) -> bool {
         std::iter::zip(before, after)
             .flat_map(move |(before, after)| std::iter::zip(before.moras(), after.moras()))
diff --git a/crates/voicevox_core/src/text_analyzer.rs b/crates/voicevox_core/src/text_analyzer.rs
index 8540f26e0..f0811ed91 100644
--- a/crates/voicevox_core/src/text_analyzer.rs
+++ b/crates/voicevox_core/src/text_analyzer.rs
@@ -1,10 +1,10 @@
 use crate::{
     engine::{extract_full_context_label, parse_kana},
-    AccentPhraseModel, FullcontextExtractor, Result,
+    AccentPhrase, FullcontextExtractor, Result,
 };
 
 pub(crate) trait TextAnalyzer {
-    fn analyze(&self, text: &str) -> Result<Vec<AccentPhraseModel>>;
+    fn analyze(&self, text: &str) -> Result<Vec<AccentPhrase>>;
 }
 
 /// AquesTalk風記法からAccentPhraseの配列を生成するTextAnalyzer
@@ -12,7 +12,7 @@ pub(crate) trait TextAnalyzer {
 pub(crate) struct KanaAnalyzer;
 
 impl TextAnalyzer for KanaAnalyzer {
-    fn analyze(&self, text: &str) -> Result<Vec<AccentPhraseModel>> {
+    fn analyze(&self, text: &str) -> Result<Vec<AccentPhrase>> {
         if text.is_empty() {
             return Ok(Vec::new());
         }
@@ -31,7 +31,7 @@ impl<O> OpenJTalkAnalyzer<O> {
 }
 
 impl<O: FullcontextExtractor> TextAnalyzer for OpenJTalkAnalyzer<O> {
-    fn analyze(&self, text: &str) -> Result<Vec<AccentPhraseModel>> {
+    fn analyze(&self, text: &str) -> Result<Vec<AccentPhrase>> {
         if text.is_empty() {
             return Ok(Vec::new());
         }
diff --git a/crates/voicevox_core_c_api/src/helpers.rs b/crates/voicevox_core_c_api/src/helpers.rs
index 5066b643a..af4057d09 100644
--- a/crates/voicevox_core_c_api/src/helpers.rs
+++ b/crates/voicevox_core_c_api/src/helpers.rs
@@ -1,12 +1,12 @@
 use easy_ext::ext;
 use std::{ffi::CStr, fmt::Debug, iter};
 use uuid::Uuid;
-use voicevox_core::{AudioQueryModel, UserDictWord, VoiceModelId};
+use voicevox_core::{AudioQuery, UserDictWord, VoiceModelId};
 
 use thiserror::Error;
 use tracing::error;
 
-use voicevox_core::AccentPhraseModel;
+use voicevox_core::AccentPhrase;
 
 use crate::{
     result_code::VoicevoxResultCode, VoicevoxAccelerationMode, VoicevoxInitializeOptions,
@@ -80,11 +80,11 @@ pub(crate) enum CApiError {
     InvalidUuid(uuid::Error),
 }
 
-pub(crate) fn audio_query_model_to_json(audio_query_model: &AudioQueryModel) -> String {
+pub(crate) fn audio_query_model_to_json(audio_query_model: &AudioQuery) -> String {
     serde_json::to_string(audio_query_model).expect("should be always valid")
 }
 
-pub(crate) fn accent_phrases_to_json(audio_query_model: &[AccentPhraseModel]) -> String {
+pub(crate) fn accent_phrases_to_json(audio_query_model: &[AccentPhrase]) -> String {
     serde_json::to_string(audio_query_model).expect("should be always valid")
 }
 
diff --git a/crates/voicevox_core_c_api/src/lib.rs b/crates/voicevox_core_c_api/src/lib.rs
index 964e635ab..3904698fc 100644
--- a/crates/voicevox_core_c_api/src/lib.rs
+++ b/crates/voicevox_core_c_api/src/lib.rs
@@ -33,7 +33,7 @@ use tracing_subscriber::fmt::format::Writer;
 use tracing_subscriber::EnvFilter;
 use uuid::Uuid;
 use voicevox_core::__internal::interop::IdRef as _;
-use voicevox_core::{AccentPhraseModel, AudioQueryModel, TtsOptions, UserDictWord};
+use voicevox_core::{AccentPhrase, AudioQuery, TtsOptions, UserDictWord};
 use voicevox_core::{StyleId, SynthesisOptions};
 
 fn init_logger_once() {
@@ -906,7 +906,7 @@ pub unsafe extern "C" fn voicevox_synthesizer_replace_mora_data(
 ) -> VoicevoxResultCode {
     init_logger_once();
     into_result_code_with_error((|| {
-        let accent_phrases: Vec<AccentPhraseModel> =
+        let accent_phrases: Vec<AccentPhrase> =
             serde_json::from_str(ensure_utf8(CStr::from_ptr(accent_phrases_json))?)
                 .map_err(CApiError::InvalidAccentPhrase)?;
         let accent_phrases = synthesizer
@@ -946,7 +946,7 @@ pub unsafe extern "C" fn voicevox_synthesizer_replace_phoneme_length(
 ) -> VoicevoxResultCode {
     init_logger_once();
     into_result_code_with_error((|| {
-        let accent_phrases: Vec<AccentPhraseModel> =
+        let accent_phrases: Vec<AccentPhrase> =
             serde_json::from_str(ensure_utf8(CStr::from_ptr(accent_phrases_json))?)
                 .map_err(CApiError::InvalidAccentPhrase)?;
         let accent_phrases = synthesizer
@@ -986,7 +986,7 @@ pub unsafe extern "C" fn voicevox_synthesizer_replace_mora_pitch(
 ) -> VoicevoxResultCode {
     init_logger_once();
     into_result_code_with_error((|| {
-        let accent_phrases: Vec<AccentPhraseModel> =
+        let accent_phrases: Vec<AccentPhrase> =
             serde_json::from_str(ensure_utf8(CStr::from_ptr(accent_phrases_json))?)
                 .map_err(CApiError::InvalidAccentPhrase)?;
         let accent_phrases = synthesizer
@@ -1049,7 +1049,7 @@ pub unsafe extern "C" fn voicevox_synthesizer_synthesis(
         let audio_query_json = CStr::from_ptr(audio_query_json)
             .to_str()
             .map_err(|_| CApiError::InvalidUtf8Input)?;
-        let audio_query: AudioQueryModel =
+        let audio_query: AudioQuery =
             serde_json::from_str(audio_query_json).map_err(CApiError::InvalidAudioQuery)?;
         let wav = synthesizer.synthesizer().synthesis(
             &audio_query,
diff --git a/crates/voicevox_core_java_api/src/synthesizer.rs b/crates/voicevox_core_java_api/src/synthesizer.rs
index b2605e8ae..9ebd98e47 100644
--- a/crates/voicevox_core_java_api/src/synthesizer.rs
+++ b/crates/voicevox_core_java_api/src/synthesizer.rs
@@ -288,7 +288,7 @@ unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_Synthesizer_rsReplaceMo
 ) -> jobject {
     throw_if_err(env, std::ptr::null_mut(), |env| {
         let accent_phrases_json: String = env.get_string(&accent_phrases_json)?.into();
-        let accent_phrases: Vec<voicevox_core::AccentPhraseModel> =
+        let accent_phrases: Vec<voicevox_core::AccentPhrase> =
             serde_json::from_str(&accent_phrases_json).map_err(JavaApiError::DeJson)?;
         let style_id = style_id as u32;
 
@@ -319,7 +319,7 @@ unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_Synthesizer_rsReplacePh
 ) -> jobject {
     throw_if_err(env, std::ptr::null_mut(), |env| {
         let accent_phrases_json: String = env.get_string(&accent_phrases_json)?.into();
-        let accent_phrases: Vec<voicevox_core::AccentPhraseModel> =
+        let accent_phrases: Vec<voicevox_core::AccentPhrase> =
             serde_json::from_str(&accent_phrases_json).map_err(JavaApiError::DeJson)?;
         let style_id = style_id as u32;
 
@@ -348,7 +348,7 @@ unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_Synthesizer_rsReplaceMo
 ) -> jobject {
     throw_if_err(env, std::ptr::null_mut(), |env| {
         let accent_phrases_json: String = env.get_string(&accent_phrases_json)?.into();
-        let accent_phrases: Vec<voicevox_core::AccentPhraseModel> =
+        let accent_phrases: Vec<voicevox_core::AccentPhrase> =
             serde_json::from_str(&accent_phrases_json).map_err(JavaApiError::DeJson)?;
         let style_id = style_id as u32;
 
@@ -378,7 +378,7 @@ unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_Synthesizer_rsSynthesis
 ) -> jobject {
     throw_if_err(env, std::ptr::null_mut(), |env| {
         let audio_query: String = env.get_string(&query_json)?.into();
-        let audio_query: voicevox_core::AudioQueryModel =
+        let audio_query: voicevox_core::AudioQuery =
             serde_json::from_str(&audio_query).map_err(JavaApiError::DeJson)?;
         let style_id = style_id as u32;
 
diff --git a/crates/voicevox_core_python_api/src/convert.rs b/crates/voicevox_core_python_api/src/convert.rs
index 0eee14a5b..b625f70b5 100644
--- a/crates/voicevox_core_python_api/src/convert.rs
+++ b/crates/voicevox_core_python_api/src/convert.rs
@@ -10,9 +10,7 @@ use pyo3::{
 use serde::{de::DeserializeOwned, Serialize};
 use serde_json::json;
 use uuid::Uuid;
-use voicevox_core::{
-    AccelerationMode, AccentPhraseModel, StyleId, UserDictWordType, VoiceModelMeta,
-};
+use voicevox_core::{AccelerationMode, AccentPhrase, StyleId, UserDictWordType, VoiceModelMeta};
 
 use crate::{
     ExtractFullContextLabelError, GetSupportedDevicesError, GpuSupportError, InferenceFailedError,
@@ -86,15 +84,12 @@ pub(crate) fn blocking_modify_accent_phrases<'py>(
     accent_phrases: &'py PyList,
     speaker_id: StyleId,
     py: Python<'py>,
-    method: impl FnOnce(
-        Vec<AccentPhraseModel>,
-        StyleId,
-    ) -> voicevox_core::Result<Vec<AccentPhraseModel>>,
+    method: impl FnOnce(Vec<AccentPhrase>, StyleId) -> voicevox_core::Result<Vec<AccentPhrase>>,
 ) -> PyResult<Vec<&'py PyAny>> {
     let rust_accent_phrases = accent_phrases
         .iter()
         .map(from_dataclass)
-        .collect::<PyResult<Vec<AccentPhraseModel>>>()?;
+        .collect::<PyResult<Vec<AccentPhrase>>>()?;
 
     method(rust_accent_phrases, speaker_id)
         .into_py_result(py)?
@@ -115,13 +110,13 @@ pub(crate) fn async_modify_accent_phrases<'py, Fun, Fut>(
     method: Fun,
 ) -> PyResult<&'py PyAny>
 where
-    Fun: FnOnce(Vec<AccentPhraseModel>, StyleId) -> Fut + Send + 'static,
-    Fut: Future<Output = voicevox_core::Result<Vec<AccentPhraseModel>>> + Send + 'static,
+    Fun: FnOnce(Vec<AccentPhrase>, StyleId) -> Fut + Send + 'static,
+    Fut: Future<Output = voicevox_core::Result<Vec<AccentPhrase>>> + Send + 'static,
 {
     let rust_accent_phrases = accent_phrases
         .iter()
         .map(from_dataclass)
-        .collect::<PyResult<Vec<AccentPhraseModel>>>()?;
+        .collect::<PyResult<Vec<AccentPhrase>>>()?;
     pyo3_asyncio::tokio::future_into_py_with_locals(
         py,
         pyo3_asyncio::tokio::get_current_locals(py)?,
diff --git a/crates/voicevox_core_python_api/src/lib.rs b/crates/voicevox_core_python_api/src/lib.rs
index 0da82f9ca..e301f1042 100644
--- a/crates/voicevox_core_python_api/src/lib.rs
+++ b/crates/voicevox_core_python_api/src/lib.rs
@@ -151,8 +151,8 @@ mod blocking {
     };
     use uuid::Uuid;
     use voicevox_core::{
-        AccelerationMode, AudioQueryModel, InitializeOptions, StyleId, SynthesisOptions,
-        TtsOptions, UserDictWord,
+        AccelerationMode, AudioQuery, InitializeOptions, StyleId, SynthesisOptions, TtsOptions,
+        UserDictWord,
     };
 
     use crate::{convert::VoicevoxCoreResultExt as _, Closable};
@@ -497,7 +497,7 @@ mod blocking {
         ))]
         fn synthesis<'py>(
             &self,
-            #[pyo3(from_py_with = "crate::convert::from_dataclass")] audio_query: AudioQueryModel,
+            #[pyo3(from_py_with = "crate::convert::from_dataclass")] audio_query: AudioQuery,
             style_id: u32,
             enable_interrogative_upspeak: bool,
             py: Python<'py>,
@@ -651,8 +651,8 @@ mod asyncio {
     };
     use uuid::Uuid;
     use voicevox_core::{
-        AccelerationMode, AudioQueryModel, InitializeOptions, StyleId, SynthesisOptions,
-        TtsOptions, UserDictWord,
+        AccelerationMode, AudioQuery, InitializeOptions, StyleId, SynthesisOptions, TtsOptions,
+        UserDictWord,
     };
 
     use crate::{convert::VoicevoxCoreResultExt as _, Closable};
@@ -1045,7 +1045,7 @@ mod asyncio {
         #[pyo3(signature=(audio_query,style_id,enable_interrogative_upspeak = TtsOptions::default().enable_interrogative_upspeak))]
         fn synthesis<'py>(
             &self,
-            #[pyo3(from_py_with = "crate::convert::from_dataclass")] audio_query: AudioQueryModel,
+            #[pyo3(from_py_with = "crate::convert::from_dataclass")] audio_query: AudioQuery,
             style_id: u32,
             enable_interrogative_upspeak: bool,
             py: Python<'py>,

From e14f785890d706733a7f58f7035ef0a0f555e63f Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Sun, 7 Jul 2024 23:09:28 +0900
Subject: [PATCH 13/36] chore: `tool.maturin.skip-auditwheel = false` (#806)

---
 crates/voicevox_core_python_api/pyproject.toml | 1 -
 1 file changed, 1 deletion(-)

diff --git a/crates/voicevox_core_python_api/pyproject.toml b/crates/voicevox_core_python_api/pyproject.toml
index 428e7695f..4ae2da74a 100644
--- a/crates/voicevox_core_python_api/pyproject.toml
+++ b/crates/voicevox_core_python_api/pyproject.toml
@@ -28,7 +28,6 @@ executionEnvironments = [{ root = "python/test" }, { root = "python" }]
 [tool.maturin]
 module-name = "voicevox_core._rust"
 bindings = "pyo3"
-skip-auditwheel = true # Linuxでlibonnxruntime.so.*の不在を許してもらう
 python-source = "python"
 
 [tool.poetry]

From d66a8b0c1422ae7b8b07aca7da18cce988d4b8d6 Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Thu, 11 Jul 2024 16:16:56 +0900
Subject: [PATCH 14/36] =?UTF-8?q?refactor:=20Rust=20API=E3=81=AB=E3=81=8A?=
 =?UTF-8?q?=E3=81=91=E3=82=8Bgetter=E3=82=92=E3=83=91=E3=83=96=E3=83=AA?=
 =?UTF-8?q?=E3=83=83=E3=82=AFAPI=E3=81=A8=E3=81=97=E3=81=A6=E6=95=B4?=
 =?UTF-8?q?=E3=81=88=E3=82=8B=20(#807)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 crates/voicevox_core/src/devices.rs           |   3 +-
 .../src/engine/full_context_label.rs          | 188 ++++-----
 .../voicevox_core/src/engine/kana_parser.rs   |  69 ++--
 crates/voicevox_core/src/engine/model.rs      |  65 +--
 crates/voicevox_core/src/metas.rs             |  23 +-
 crates/voicevox_core/src/status.rs            |  27 +-
 crates/voicevox_core/src/synthesizer.rs       | 390 +++++++++---------
 crates/voicevox_core/src/user_dict/word.rs    |  40 +-
 crates/voicevox_core/src/voice_model.rs       |  23 +-
 .../src/compatible_engine.rs                  |   4 +-
 crates/voicevox_core_c_api/src/lib.rs         |   8 +-
 .../voicevox_core_java_api/src/voice_model.rs |   2 +-
 crates/voicevox_core_python_api/src/lib.rs    |   4 +-
 13 files changed, 437 insertions(+), 409 deletions(-)

diff --git a/crates/voicevox_core/src/devices.rs b/crates/voicevox_core/src/devices.rs
index 140105962..dfe8d7e64 100644
--- a/crates/voicevox_core/src/devices.rs
+++ b/crates/voicevox_core/src/devices.rs
@@ -1,11 +1,10 @@
-use derive_getters::Getters;
 use serde::{Deserialize, Serialize};
 
 /// このライブラリで利用可能なデバイスの情報。
 ///
 /// あくまで本ライブラリが対応しているデバイスの情報であることに注意。GPUが使える環境ではなかったと
 /// しても`cuda`や`dml`は`true`を示しうる。
-#[derive(Getters, Debug, Serialize, Deserialize)]
+#[derive(Debug, Serialize, Deserialize)]
 pub struct SupportedDevices {
     /// CPUが利用可能。
     ///
diff --git a/crates/voicevox_core/src/engine/full_context_label.rs b/crates/voicevox_core/src/engine/full_context_label.rs
index 4f95abbf2..92617a8c1 100644
--- a/crates/voicevox_core/src/engine/full_context_label.rs
+++ b/crates/voicevox_core/src/engine/full_context_label.rs
@@ -88,14 +88,14 @@ fn generate_accent_phrases(
         let pause_mora = if ap_curr.accent_phrase_position_backward == 1
             && bg_curr.breath_group_position_backward != 1
         {
-            Some(crate::Mora::new(
-                "、".into(),
-                None,
-                None,
-                "pau".into(),
-                0.,
-                0.,
-            ))
+            Some(crate::Mora {
+                text: "、".into(),
+                consonant: None,
+                consonant_length: None,
+                vowel: "pau".into(),
+                vowel_length: 0.,
+                pitch: 0.,
+            })
         } else {
             None
         };
@@ -103,12 +103,12 @@ fn generate_accent_phrases(
         // workaround for VOICEVOX/voicevox_engine#55
         let accent = usize::from(ap_curr.accent_position).min(moras.len());
 
-        accent_phrases.push(AccentPhrase::new(
+        accent_phrases.push(AccentPhrase {
             moras,
             accent,
             pause_mora,
-            ap_curr.is_interrogative,
-        ))
+            is_interrogative: ap_curr.is_interrogative,
+        })
     }
     Ok(accent_phrases)
 }
@@ -153,15 +153,15 @@ fn generate_moras(accent_phrase: &[Label]) -> std::result::Result<Vec<crate::Mor
 
 fn generate_mora(consonant: Option<&Label>, vowel: &Label) -> crate::Mora {
     let consonant_phoneme = consonant.and_then(|c| c.phoneme.c.to_owned());
-    let vowel_phoneme = vowel.phoneme.c.as_deref().unwrap();
-    crate::Mora::new(
-        mora_to_text(consonant_phoneme.as_deref(), vowel_phoneme),
-        consonant_phoneme,
-        consonant.and(Some(0.0)),
-        vowel_phoneme.to_string(),
-        0.0,
-        0.0,
-    )
+    let vowel = vowel.phoneme.c.clone().unwrap();
+    crate::Mora {
+        text: mora_to_text(consonant_phoneme.as_deref(), &vowel),
+        consonant: consonant_phoneme,
+        consonant_length: consonant.and(Some(0.0)),
+        vowel,
+        vowel_length: 0.0,
+        pitch: 0.0,
+    }
 }
 
 pub fn mora_to_text(consonant: Option<&str>, vowel: &str) -> String {
@@ -197,14 +197,14 @@ mod tests {
     use jlabel::Label;
 
     fn mora(text: &str, consonant: Option<&str>, vowel: &str) -> Mora {
-        Mora::new(
-            text.into(),
-            consonant.map(|c| c.into()),
-            consonant.and(Some(0.0)),
-            vowel.into(),
-            0.0,
-            0.0,
-        )
+        Mora {
+            text: text.into(),
+            consonant: consonant.map(|c| c.into()),
+            consonant_length: consonant.and(Some(0.0)),
+            vowel: vowel.into(),
+            vowel_length: 0.0,
+            pitch: 0.0,
+        }
     }
 
     #[template]
@@ -218,12 +218,12 @@ mod tests {
             "y^e-sil+xx=xx/A:xx+xx+xx/B:xx-xx_xx/C:xx_xx+xx/D:xx+xx_xx/E:1_1!0_xx-xx/F:xx_xx#xx_xx@xx_xx|xx_xx/G:xx_xx%xx_xx_xx/H:1_1/I:xx-xx@xx+xx&xx-xx|xx+xx/J:xx_xx/K:1+1-1",
         ],
         &[
-            AccentPhrase::new(
-                vec![mora("イェ", Some("y"), "e")],
-                1,
-                None,
-                false,
-            )
+            AccentPhrase {
+                moras: vec![mora("イェ", Some("y"), "e")],
+                accent: 1,
+                pause_mora: None,
+                is_interrogative: false,
+            }
         ]
     )]
     #[case(
@@ -236,16 +236,16 @@ mod tests {
             "N^cl-sil+xx=xx/A:xx+xx+xx/B:09-xx_xx/C:xx_xx+xx/D:xx+xx_xx/E:3_3!0_xx-xx/F:xx_xx#xx_xx@xx_xx|xx_xx/G:xx_xx%xx_xx_xx/H:1_3/I:xx-xx@xx+xx&xx-xx|xx+xx/J:xx_xx/K:1+1-3",
         ],
         &[
-            AccentPhrase::new(
-                vec![
+            AccentPhrase {
+                moras: vec![
                     mora("ン", None, "N"),
                     mora("ン", None, "N"),
                     mora("ッ", None, "cl"),
                 ],
-                3,
-                None,
-                false,
-            ),
+                accent: 3,
+                pause_mora: None,
+                is_interrogative: false,
+            },
         ]
     )]
     #[case(
@@ -271,28 +271,28 @@ mod tests {
             "s^U-sil+xx=xx/A:xx+xx+xx/B:10-7_2/C:xx_xx+xx/D:xx+xx_xx/E:5_1!0_xx-xx/F:xx_xx#xx_xx@xx_xx|xx_xx/G:xx_xx%xx_xx_xx/H:2_8/I:xx-xx@xx+xx&xx-xx|xx+xx/J:xx_xx/K:1+2-8",
         ],
         &[
-            AccentPhrase::new(
-                vec![
+            AccentPhrase {
+                moras: vec![
                     mora("コ", Some("k"), "o"),
                     mora("レ", Some("r"), "e"),
                     mora("ワ", Some("w"), "a"),
                 ],
-                3,
-                None,
-                false,
-            ),
-            AccentPhrase::new(
-                vec![
+                accent: 3,
+                pause_mora: None,
+                is_interrogative: false,
+            },
+            AccentPhrase {
+                moras: vec![
                     mora("テ", Some("t"), "e"),
                     mora("ス", Some("s"), "U"),
                     mora("ト", Some("t"), "o"),
                     mora("デ", Some("d"), "e"),
                     mora("ス", Some("s"), "U"),
                 ],
-                1,
-                None,
-                false,
-            ),
+                accent: 1,
+                pause_mora: None,
+                is_interrogative: false,
+            },
         ]
     )]
     #[case(
@@ -324,46 +324,46 @@ mod tests {
             "k^u-sil+xx=xx/A:xx+xx+xx/B:05-xx_xx/C:xx_xx+xx/D:xx+xx_xx/E:4_2!1_xx-xx/F:xx_xx#xx_xx@xx_xx|xx_xx/G:xx_xx%xx_xx_xx/H:1_4/I:xx-xx@xx+xx&xx-xx|xx+xx/J:xx_xx/K:4+4-12",
         ],
         &[
-            AccentPhrase::new(
-                vec![
+            AccentPhrase {
+                moras: vec![
                     mora("イ", None, "i"),
                     mora("チ", Some("ch"), "i"),
                 ],
-                2,
-                Some(mora("、", None, "pau")),
-                false,
-            ),
-            AccentPhrase::new(
-                vec![
+                accent: 2,
+                pause_mora: Some(mora("、", None, "pau")),
+                is_interrogative: false,
+            },
+            AccentPhrase {
+                moras: vec![
                     mora("セ", Some("s"), "e"),
                     mora("ン", None, "N"),
                 ],
-                1,
-                Some(mora("、", None, "pau")),
-                false,
-            ),
-            AccentPhrase::new(
-                vec![
+                accent: 1,
+                pause_mora: Some(mora("、", None, "pau")),
+                is_interrogative: false,
+            },
+            AccentPhrase {
+                moras: vec![
                     mora("ヒャ", Some("hy"), "a"),
                     mora("ク", Some("k"), "u"),
                     mora("マ", Some("m"), "a"),
                     mora("ン", None, "N"),
                 ],
-                3,
-                Some(mora("、", None, "pau")),
-                false,
-            ),
-            AccentPhrase::new(
-                vec![
+                accent: 3,
+                pause_mora: Some(mora("、", None, "pau")),
+                is_interrogative: false,
+            },
+            AccentPhrase {
+                moras: vec![
                     mora("イ", None, "i"),
                     mora("チ", Some("ch"), "i"),
                     mora("オ", None, "o"),
                     mora("ク", Some("k"), "u"),
                 ],
-                2,
-                None,
-                true,
-            ),
+                accent: 2,
+                pause_mora: None,
+                is_interrogative: true,
+            },
         ]
     )]
     #[case(
@@ -386,33 +386,33 @@ mod tests {
             "a^a-sil+xx=xx/A:xx+xx+xx/B:09-xx_xx/C:xx_xx+xx/D:xx+xx_xx/E:1_1!0_xx-xx/F:xx_xx#xx_xx@xx_xx|xx_xx/G:xx_xx%xx_xx_xx/H:2_3/I:xx-xx@xx+xx&xx-xx|xx+xx/J:xx_xx/K:2+3-8",
         ],
         &[
-            AccentPhrase::new(
-                vec![
+            AccentPhrase {
+                moras: vec![
                     mora("クヮ", Some("kw"), "a"),
                     mora("ル", Some("r"), "u"),
                     mora("テ", Some("t"), "e"),
                     mora("ッ", None, "cl"),
                     mora("ト", Some("t"), "o"),
                 ],
-                3,
-                Some(mora("、", None, "pau")),
-                false,
-            ),
-            AccentPhrase::new(
-                vec![
+                accent: 3,
+                pause_mora: Some(mora("、", None, "pau")),
+                is_interrogative: false,
+            },
+            AccentPhrase {
+                moras: vec![
                     mora("ア", None, "a"),
                     mora("ア", None, "a"),
                 ],
-                1,
-                None,
-                false,
-            ),
-            AccentPhrase::new(
-                vec![mora("ア", None, "a")],
-                1,
-                None,
-                false,
-            ),
+                accent: 1,
+                pause_mora: None,
+                is_interrogative: false,
+            },
+            AccentPhrase {
+                moras: vec![mora("ア", None, "a")],
+                accent: 1,
+                pause_mora: None,
+                is_interrogative: false,
+            },
         ]
     )]
     fn label_cases(
diff --git a/crates/voicevox_core/src/engine/kana_parser.rs b/crates/voicevox_core/src/engine/kana_parser.rs
index 42f17dc63..9397376f6 100644
--- a/crates/voicevox_core/src/engine/kana_parser.rs
+++ b/crates/voicevox_core/src/engine/kana_parser.rs
@@ -27,26 +27,27 @@ static TEXT2MORA_WITH_UNVOICE: Lazy<HashMap<String, Mora>> = Lazy::new(|| {
         let consonant_length = if consonant.is_some() { Some(0.0) } else { None };
 
         if ["a", "i", "u", "e", "o"].contains(vowel) {
-            let upper_vowel = vowel.to_uppercase();
-            let unvoice_mora = Mora::new(
-                text.to_string(),
-                consonant.clone(),
+            let vowel = vowel.to_uppercase();
+
+            let unvoice_mora = Mora {
+                text: text.to_string(),
+                consonant: consonant.clone(),
                 consonant_length,
-                upper_vowel,
-                0.,
-                0.,
-            );
+                vowel,
+                vowel_length: 0.,
+                pitch: 0.,
+            };
             text2mora_with_unvoice.insert(UNVOICE_SYMBOL.to_string() + text, unvoice_mora);
         }
 
-        let mora = Mora::new(
-            text.to_string(),
+        let mora = Mora {
+            text: text.to_string(),
             consonant,
             consonant_length,
-            vowel.to_string(),
-            0.,
-            0.,
-        );
+            vowel: vowel.to_string(),
+            vowel_length: 0.,
+            pitch: 0.,
+        };
         text2mora_with_unvoice.insert(text.to_string(), mora);
     }
     text2mora_with_unvoice
@@ -107,7 +108,12 @@ fn text_to_accent_phrase(phrase: &str) -> KanaParseResult<AccentPhrase> {
             "accent not found in accent phrase: {phrase}"
         )));
     }
-    Ok(AccentPhrase::new(moras, accent_index.unwrap(), None, false))
+    Ok(AccentPhrase {
+        moras,
+        accent: accent_index.unwrap(),
+        pause_mora: None,
+        is_interrogative: false,
+    })
 }
 
 pub(crate) fn parse_kana(text: &str) -> KanaParseResult<Vec<AccentPhrase>> {
@@ -137,14 +143,14 @@ pub(crate) fn parse_kana(text: &str) -> KanaParseResult<Vec<AccentPhrase>> {
             let accent_phrase = {
                 let mut accent_phrase = text_to_accent_phrase(&phrase)?;
                 if letter == PAUSE_DELIMITER {
-                    accent_phrase.set_pause_mora(Some(Mora::new(
-                        PAUSE_DELIMITER.to_string(),
-                        None,
-                        None,
-                        "pau".to_string(),
-                        0.,
-                        0.,
-                    )));
+                    accent_phrase.set_pause_mora(Some(Mora {
+                        text: PAUSE_DELIMITER.to_string(),
+                        consonant: None,
+                        consonant_length: None,
+                        vowel: "pau".to_string(),
+                        vowel_length: 0.,
+                        pitch: 0.,
+                    }));
                 }
                 accent_phrase.set_is_interrogative(is_interrogative);
                 accent_phrase
@@ -161,20 +167,19 @@ pub(crate) fn parse_kana(text: &str) -> KanaParseResult<Vec<AccentPhrase>> {
 pub(crate) fn create_kana(accent_phrases: &[AccentPhrase]) -> String {
     let mut text = String::new();
     for phrase in accent_phrases {
-        let moras = phrase.moras();
-        for (index, mora) in moras.iter().enumerate() {
-            if ["A", "E", "I", "O", "U"].contains(&(*mora.vowel()).as_ref()) {
+        for (index, mora) in phrase.moras.iter().enumerate() {
+            if ["A", "E", "I", "O", "U"].contains(&&*mora.vowel) {
                 text.push(UNVOICE_SYMBOL);
             }
-            text.push_str(mora.text());
-            if index + 1 == *phrase.accent() {
+            text.push_str(&mora.text);
+            if index + 1 == phrase.accent {
                 text.push(ACCENT_SYMBOL);
             }
         }
-        if *phrase.is_interrogative() {
+        if phrase.is_interrogative {
             text.push(WIDE_INTERROGATION_MARK);
         }
-        text.push(if phrase.pause_mora().is_some() {
+        text.push(if phrase.pause_mora.is_some() {
             PAUSE_DELIMITER
         } else {
             NOPAUSE_DELIMITER
@@ -207,10 +212,10 @@ mod tests {
         assert_eq!(mora.is_some(), res.is_some());
         if let Some(res) = res {
             let mut m = String::new();
-            if let Some(ref c) = *res.consonant() {
+            if let Some(c) = &res.consonant {
                 m.push_str(c);
             }
-            m.push_str(res.vowel());
+            m.push_str(&res.vowel);
             assert_eq!(m, mora.unwrap());
         }
     }
diff --git a/crates/voicevox_core/src/engine/model.rs b/crates/voicevox_core/src/engine/model.rs
index 09f53b6ee..20203feb3 100644
--- a/crates/voicevox_core/src/engine/model.rs
+++ b/crates/voicevox_core/src/engine/model.rs
@@ -1,38 +1,36 @@
-use derive_getters::Getters;
-use derive_new::new;
 use serde::{Deserialize, Serialize};
 
 /* 各フィールドのjsonフィールド名はsnake_caseとする*/
 
 /// モーラ（子音＋母音）ごとの情報。
-#[derive(Clone, Debug, new, Getters, Deserialize, Serialize, PartialEq)]
+#[derive(Clone, Debug, Deserialize, Serialize, PartialEq)]
 pub struct Mora {
     /// 文字。
-    text: String,
+    pub text: String,
     /// 子音の音素。
-    consonant: Option<String>,
+    pub consonant: Option<String>,
     /// 子音の音長。
-    consonant_length: Option<f32>,
+    pub consonant_length: Option<f32>,
     /// 母音の音素。
-    vowel: String,
+    pub vowel: String,
     /// 母音の音長。
-    vowel_length: f32,
+    pub vowel_length: f32,
     /// 音高。
-    pitch: f32,
+    pub pitch: f32,
 }
 
 /// AccentPhrase (アクセント句ごとの情報)。
-#[derive(Clone, Debug, new, Getters, Deserialize, Serialize, PartialEq)]
+#[derive(Clone, Debug, Deserialize, Serialize, PartialEq)]
 pub struct AccentPhrase {
     /// モーラの配列。
-    moras: Vec<Mora>,
+    pub moras: Vec<Mora>,
     /// アクセント箇所。
-    accent: usize,
+    pub accent: usize,
     /// 後ろに無音を付けるかどうか。
-    pause_mora: Option<Mora>,
+    pub pause_mora: Option<Mora>,
     /// 疑問系かどうか。
     #[serde(default)]
-    is_interrogative: bool,
+    pub is_interrogative: bool,
 }
 
 impl AccentPhrase {
@@ -46,34 +44,33 @@ impl AccentPhrase {
 }
 
 /// AudioQuery (音声合成用のクエリ)。
-#[allow(clippy::too_many_arguments)]
-#[derive(Clone, new, Getters, Deserialize, Serialize)]
+#[derive(Clone, Deserialize, Serialize)]
 pub struct AudioQuery {
     /// アクセント句の配列。
-    accent_phrases: Vec<AccentPhrase>,
+    pub accent_phrases: Vec<AccentPhrase>,
     /// 全体の話速。
-    speed_scale: f32,
+    pub speed_scale: f32,
     /// 全体の音高。
-    pitch_scale: f32,
+    pub pitch_scale: f32,
     /// 全体の抑揚。
-    intonation_scale: f32,
+    pub intonation_scale: f32,
     /// 全体の音量。
-    volume_scale: f32,
+    pub volume_scale: f32,
     /// 音声の前の無音時間。
-    pre_phoneme_length: f32,
+    pub pre_phoneme_length: f32,
     /// 音声の後の無音時間。
-    post_phoneme_length: f32,
+    pub post_phoneme_length: f32,
     /// 音声データの出力サンプリングレート。
-    output_sampling_rate: u32,
+    pub output_sampling_rate: u32,
     /// 音声データをステレオ出力するか否か。
-    output_stereo: bool,
+    pub output_stereo: bool,
     /// \[読み取り専用\] AquesTalk風記法。
     ///
     /// [`Synthesizer::audio_query`]が返すもののみ`Some`となる。入力としてのAudioQueryでは無視され
     /// る。
     ///
-    /// [`Synthesizer::audio_query`]: crate::Synthesizer::audio_query
-    kana: Option<String>,
+    /// [`Synthesizer::audio_query`]: crate::blocking::Synthesizer::audio_query
+    pub kana: Option<String>,
 }
 
 impl AudioQuery {
@@ -92,8 +89,18 @@ mod tests {
 
     #[rstest]
     fn check_audio_query_model_json_field_snake_case() {
-        let audio_query_model =
-            AudioQuery::new(vec![], 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0, false, None);
+        let audio_query_model = AudioQuery {
+            accent_phrases: vec![],
+            speed_scale: 0.0,
+            pitch_scale: 0.0,
+            intonation_scale: 0.0,
+            volume_scale: 0.0,
+            pre_phoneme_length: 0.0,
+            post_phoneme_length: 0.0,
+            output_sampling_rate: 0,
+            output_stereo: false,
+            kana: None,
+        };
         let val = serde_json::to_value(audio_query_model).unwrap();
         check_json_field_snake_case(&val);
     }
diff --git a/crates/voicevox_core/src/metas.rs b/crates/voicevox_core/src/metas.rs
index b9f274c48..1fb4a7f9d 100644
--- a/crates/voicevox_core/src/metas.rs
+++ b/crates/voicevox_core/src/metas.rs
@@ -1,6 +1,5 @@
 use std::fmt::{Debug, Display};
 
-use derive_getters::Getters;
 use derive_new::new;
 use indexmap::IndexMap;
 use itertools::Itertools as _;
@@ -102,20 +101,20 @@ impl Display for StyleVersion {
 pub type VoiceModelMeta = Vec<SpeakerMeta>;
 
 /// **話者**(_speaker_)のメタ情報。
-#[derive(Deserialize, Serialize, Getters, Clone)]
+#[derive(Deserialize, Serialize, Clone)]
 pub struct SpeakerMeta {
     /// 話者名。
-    name: String,
+    pub name: String,
     /// 話者に属するスタイル。
-    styles: Vec<StyleMeta>,
+    pub styles: Vec<StyleMeta>,
     /// 話者のバージョン。
-    version: StyleVersion,
+    pub version: StyleVersion,
     /// 話者のUUID。
-    speaker_uuid: String,
+    pub speaker_uuid: String,
     /// 話者の順番。
     ///
     /// `SpeakerMeta`の列は、この値に対して昇順に並んでいるべきである。
-    order: Option<u32>,
+    pub order: Option<u32>,
 }
 
 impl SpeakerMeta {
@@ -161,19 +160,19 @@ impl SpeakerMeta {
 }
 
 /// **スタイル**(_style_)のメタ情報。
-#[derive(Deserialize, Serialize, Getters, Clone)]
+#[derive(Deserialize, Serialize, Clone)]
 pub struct StyleMeta {
     /// スタイルID。
-    id: StyleId,
+    pub id: StyleId,
     /// スタイル名。
-    name: String,
+    pub name: String,
     /// スタイルに対応するモデルの種類。
     #[serde(default)]
-    r#type: StyleType,
+    pub r#type: StyleType,
     /// スタイルの順番。
     ///
     /// [`SpeakerMeta::styles`]は、この値に対して昇順に並んでいるべきである。
-    order: Option<u32>,
+    pub order: Option<u32>,
 }
 
 /// **スタイル**(_style_)に対応するモデルの種類。
diff --git a/crates/voicevox_core/src/status.rs b/crates/voicevox_core/src/status.rs
index 475031f1c..8c75d64d9 100644
--- a/crates/voicevox_core/src/status.rs
+++ b/crates/voicevox_core/src/status.rs
@@ -149,9 +149,10 @@ impl<R: InferenceRuntime> LoadedModels<R> {
             .0
             .iter()
             .find(|(_, LoadedModel { metas, .. })| {
-                metas.iter().flat_map(SpeakerMeta::styles).any(|style| {
-                    *style.id() == style_id && D::style_types().contains(style.r#type())
-                })
+                metas
+                    .iter()
+                    .flat_map(|SpeakerMeta { styles, .. }| styles)
+                    .any(|style| style.id == style_id && D::style_types().contains(&style.r#type))
             })
             .ok_or(ErrorRepr::StyleNotFound {
                 style_id,
@@ -200,7 +201,7 @@ impl<R: InferenceRuntime> LoadedModels<R> {
     }
 
     fn contains_style(&self, style_id: StyleId) -> bool {
-        self.styles().any(|style| *style.id() == style_id)
+        self.styles().any(|style| style.id == style_id)
     }
 
     /// 音声モデルを受け入れ可能かをチェックする。
@@ -232,22 +233,21 @@ impl<R: InferenceRuntime> LoadedModels<R> {
         let loaded = self.speakers();
         let external = model_header.metas.iter();
         for (loaded, external) in iproduct!(loaded, external) {
-            if loaded.speaker_uuid() == external.speaker_uuid() {
+            if loaded.speaker_uuid == external.speaker_uuid {
                 loaded.warn_diff_except_styles(external);
             }
         }
 
-        let loaded = self.styles();
+        let loaded = self.styles().map(|&StyleMeta { id, .. }| id);
         let external = model_header
             .metas
             .iter()
-            .flat_map(|speaker| speaker.styles());
-        if let Some((style, _)) =
-            iproduct!(loaded, external).find(|(loaded, external)| loaded.id() == external.id())
+            .flat_map(|speaker| &speaker.styles)
+            .map(|&StyleMeta { id, .. }| id);
+        if let Some((id, _)) =
+            iproduct!(loaded, external).find(|(loaded, external)| loaded == external)
         {
-            return Err(error(LoadModelErrorKind::StyleAlreadyLoaded {
-                id: *style.id(),
-            }));
+            return Err(error(LoadModelErrorKind::StyleAlreadyLoaded { id }));
         }
         Ok(())
     }
@@ -282,7 +282,8 @@ impl<R: InferenceRuntime> LoadedModels<R> {
     }
 
     fn styles(&self) -> impl Iterator<Item = &StyleMeta> {
-        self.speakers().flat_map(|speaker| speaker.styles())
+        self.speakers()
+            .flat_map(|SpeakerMeta { styles, .. }| styles)
     }
 }
 
diff --git a/crates/voicevox_core/src/synthesizer.rs b/crates/voicevox_core/src/synthesizer.rs
index 4f9576500..a11af2d5b 100644
--- a/crates/voicevox_core/src/synthesizer.rs
+++ b/crates/voicevox_core/src/synthesizer.rs
@@ -155,9 +155,9 @@ pub(crate) mod blocking {
                     let supported_devices = onnxruntime.supported_devices()?;
 
                     if cfg!(feature = "directml") {
-                        *supported_devices.dml()
+                        supported_devices.dml
                     } else {
-                        *supported_devices.cuda()
+                        supported_devices.cuda
                     }
                 }
                 AccelerationMode::Cpu => false,
@@ -198,9 +198,9 @@ pub(crate) mod blocking {
                 let supported_devices = onnxruntime.supported_devices()?;
 
                 if cfg!(feature = "directml") {
-                    Ok(*supported_devices.dml())
+                    Ok(supported_devices.dml)
                 } else {
-                    Ok(*supported_devices.cuda())
+                    Ok(supported_devices.cuda)
                 }
             }
         }
@@ -247,38 +247,44 @@ pub(crate) mod blocking {
             style_id: StyleId,
             options: &SynthesisOptions,
         ) -> Result<Vec<u8>> {
-            let speed_scale = *audio_query.speed_scale();
-            let pitch_scale = *audio_query.pitch_scale();
-            let intonation_scale = *audio_query.intonation_scale();
-            let pre_phoneme_length = *audio_query.pre_phoneme_length();
-            let post_phoneme_length = *audio_query.post_phoneme_length();
+            let AudioQuery {
+                accent_phrases,
+                speed_scale,
+                pitch_scale,
+                intonation_scale,
+                pre_phoneme_length,
+                post_phoneme_length,
+                ..
+            } = audio_query;
 
             let accent_phrases = if options.enable_interrogative_upspeak {
-                adjust_interrogative_accent_phrases(audio_query.accent_phrases().as_slice())
+                adjust_interrogative_accent_phrases(accent_phrases)
             } else {
-                audio_query.accent_phrases().clone()
+                accent_phrases.clone()
             };
 
             let (flatten_moras, phoneme_data_list) = initial_process(&accent_phrases);
 
-            let mut phoneme_length_list = vec![pre_phoneme_length];
+            let mut phoneme_length_list = vec![*pre_phoneme_length];
             let mut f0_list = vec![0.];
             let mut voiced_list = vec![false];
             {
                 let mut sum_of_f0_bigger_than_zero = 0.;
                 let mut count_of_f0_bigger_than_zero = 0;
 
-                for mora in flatten_moras {
-                    let consonant_length = *mora.consonant_length();
-                    let vowel_length = *mora.vowel_length();
-                    let pitch = *mora.pitch();
-
+                for Mora {
+                    consonant_length,
+                    vowel_length,
+                    pitch,
+                    ..
+                } in flatten_moras
+                {
                     if let Some(consonant_length) = consonant_length {
                         phoneme_length_list.push(consonant_length);
                     }
                     phoneme_length_list.push(vowel_length);
 
-                    let f0_single = pitch * 2.0_f32.powf(pitch_scale);
+                    let f0_single = pitch * 2.0_f32.powf(*pitch_scale);
                     f0_list.push(f0_single);
 
                     let bigger_than_zero = f0_single > 0.;
@@ -289,7 +295,7 @@ pub(crate) mod blocking {
                         count_of_f0_bigger_than_zero += 1;
                     }
                 }
-                phoneme_length_list.push(post_phoneme_length);
+                phoneme_length_list.push(*post_phoneme_length);
                 f0_list.push(0.);
                 voiced_list.push(false);
                 let mean_f0 = sum_of_f0_bigger_than_zero / (count_of_f0_bigger_than_zero as f32);
@@ -356,23 +362,23 @@ pub(crate) mod blocking {
             ) -> Vec<AccentPhrase> {
                 accent_phrases
                     .iter()
-                    .map(|accent_phrase| {
-                        AccentPhrase::new(
-                            adjust_interrogative_moras(accent_phrase),
-                            *accent_phrase.accent(),
-                            accent_phrase.pause_mora().clone(),
-                            *accent_phrase.is_interrogative(),
-                        )
+                    .map(|accent_phrase| AccentPhrase {
+                        moras: adjust_interrogative_moras(accent_phrase),
+                        ..accent_phrase.clone()
                     })
                     .collect()
             }
 
-            fn adjust_interrogative_moras(accent_phrase: &AccentPhrase) -> Vec<Mora> {
-                let moras = accent_phrase.moras();
-                if *accent_phrase.is_interrogative() && !moras.is_empty() {
+            fn adjust_interrogative_moras(
+                AccentPhrase {
+                    moras,
+                    is_interrogative,
+                    ..
+                }: &AccentPhrase,
+            ) -> Vec<Mora> {
+                if *is_interrogative && !moras.is_empty() {
                     let last_mora = moras.last().unwrap();
-                    let last_mora_pitch = *last_mora.pitch();
-                    if last_mora_pitch != 0.0 {
+                    if last_mora.pitch != 0.0 {
                         let mut new_moras: Vec<Mora> = Vec::with_capacity(moras.len() + 1);
                         new_moras.extend_from_slice(moras.as_slice());
                         let interrogative_mora = make_interrogative_mora(last_mora);
@@ -388,23 +394,27 @@ pub(crate) mod blocking {
                 const ADJUST_PITCH: f32 = 0.3;
                 const MAX_PITCH: f32 = 6.5;
 
-                let pitch = (*last_mora.pitch() + ADJUST_PITCH).min(MAX_PITCH);
+                let pitch = (last_mora.pitch + ADJUST_PITCH).min(MAX_PITCH);
 
-                Mora::new(
-                    mora_to_text(None, last_mora.vowel()),
-                    None,
-                    None,
-                    last_mora.vowel().clone(),
-                    FIX_VOWEL_LENGTH,
+                Mora {
+                    text: mora_to_text(None, &last_mora.vowel),
+                    consonant: None,
+                    consonant_length: None,
+                    vowel: last_mora.vowel.clone(),
+                    vowel_length: FIX_VOWEL_LENGTH,
                     pitch,
-                )
+                }
             }
 
-            fn to_wav(wave: &[f32], audio_query: &AudioQuery) -> Vec<u8> {
-                let volume_scale = *audio_query.volume_scale();
-                let output_stereo = *audio_query.output_stereo();
-                let output_sampling_rate = *audio_query.output_sampling_rate();
-
+            fn to_wav(
+                wave: &[f32],
+                &AudioQuery {
+                    volume_scale,
+                    output_sampling_rate,
+                    output_stereo,
+                    ..
+                }: &AudioQuery,
+            ) -> Vec<u8> {
                 // TODO: 44.1kHzなどの対応
 
                 let num_channels: u16 = if output_stereo { 2 } else { 1 };
@@ -509,41 +519,32 @@ pub(crate) mod blocking {
             let mut index = 0;
             let new_accent_phrases = accent_phrases
                 .iter()
-                .map(|accent_phrase| {
-                    AccentPhrase::new(
-                        accent_phrase
-                            .moras()
-                            .iter()
-                            .map(|mora| {
-                                let new_mora = Mora::new(
-                                    mora.text().clone(),
-                                    mora.consonant().clone(),
-                                    mora.consonant().as_ref().map(|_| {
-                                        phoneme_length[vowel_indexes_data[index + 1] as usize - 1]
-                                    }),
-                                    mora.vowel().clone(),
-                                    phoneme_length[vowel_indexes_data[index + 1] as usize],
-                                    *mora.pitch(),
-                                );
-                                index += 1;
-                                new_mora
-                            })
-                            .collect(),
-                        *accent_phrase.accent(),
-                        accent_phrase.pause_mora().as_ref().map(|pause_mora| {
-                            let new_pause_mora = Mora::new(
-                                pause_mora.text().clone(),
-                                pause_mora.consonant().clone(),
-                                *pause_mora.consonant_length(),
-                                pause_mora.vowel().clone(),
-                                phoneme_length[vowel_indexes_data[index + 1] as usize],
-                                *pause_mora.pitch(),
-                            );
+                .map(|accent_phrase| AccentPhrase {
+                    moras: accent_phrase
+                        .moras
+                        .iter()
+                        .map(|mora| {
+                            let new_mora = Mora {
+                                consonant_length: mora.consonant.as_ref().map(|_| {
+                                    phoneme_length[vowel_indexes_data[index + 1] as usize - 1]
+                                }),
+                                vowel_length: phoneme_length
+                                    [vowel_indexes_data[index + 1] as usize],
+                                ..mora.clone()
+                            };
                             index += 1;
-                            new_pause_mora
-                        }),
-                        *accent_phrase.is_interrogative(),
-                    )
+                            new_mora
+                        })
+                        .collect(),
+                    pause_mora: accent_phrase.pause_mora.as_ref().map(|pause_mora| {
+                        let new_pause_mora = Mora {
+                            vowel_length: phoneme_length[vowel_indexes_data[index + 1] as usize],
+                            ..pause_mora.clone()
+                        };
+                        index += 1;
+                        new_pause_mora
+                    }),
+                    ..accent_phrase.clone()
                 })
                 .collect();
 
@@ -563,10 +564,10 @@ pub(crate) mod blocking {
             let mut base_start_accent_phrase_list = vec![0];
             let mut base_end_accent_phrase_list = vec![0];
             for accent_phrase in accent_phrases {
-                let mut accent = usize::from(*accent_phrase.accent() != 1);
+                let mut accent = usize::from(accent_phrase.accent != 1);
                 create_one_accent_list(&mut base_start_accent_list, accent_phrase, accent as i32);
 
-                accent = *accent_phrase.accent() - 1;
+                accent = accent_phrase.accent - 1;
                 create_one_accent_list(&mut base_end_accent_list, accent_phrase, accent as i32);
                 create_one_accent_list(&mut base_start_accent_phrase_list, accent_phrase, 0);
                 create_one_accent_list(&mut base_end_accent_phrase_list, accent_phrase, -1);
@@ -625,39 +626,28 @@ pub(crate) mod blocking {
             let mut index = 0;
             let new_accent_phrases = accent_phrases
                 .iter()
-                .map(|accent_phrase| {
-                    AccentPhrase::new(
-                        accent_phrase
-                            .moras()
-                            .iter()
-                            .map(|mora| {
-                                let new_mora = Mora::new(
-                                    mora.text().clone(),
-                                    mora.consonant().clone(),
-                                    *mora.consonant_length(),
-                                    mora.vowel().clone(),
-                                    *mora.vowel_length(),
-                                    f0_list[index + 1],
-                                );
-                                index += 1;
-                                new_mora
-                            })
-                            .collect(),
-                        *accent_phrase.accent(),
-                        accent_phrase.pause_mora().as_ref().map(|pause_mora| {
-                            let new_pause_mora = Mora::new(
-                                pause_mora.text().clone(),
-                                pause_mora.consonant().clone(),
-                                *pause_mora.consonant_length(),
-                                pause_mora.vowel().clone(),
-                                *pause_mora.vowel_length(),
-                                f0_list[index + 1],
-                            );
+                .map(|accent_phrase| AccentPhrase {
+                    moras: accent_phrase
+                        .moras
+                        .iter()
+                        .map(|mora| {
+                            let new_mora = Mora {
+                                pitch: f0_list[index + 1],
+                                ..mora.clone()
+                            };
                             index += 1;
-                            new_pause_mora
-                        }),
-                        *accent_phrase.is_interrogative(),
-                    )
+                            new_mora
+                        })
+                        .collect(),
+                    pause_mora: accent_phrase.pause_mora.as_ref().map(|pause_mora| {
+                        let new_pause_mora = Mora {
+                            pitch: f0_list[index + 1],
+                            ..pause_mora.clone()
+                        };
+                        index += 1;
+                        new_pause_mora
+                    }),
+                    ..accent_phrase.clone()
                 })
                 .collect();
 
@@ -670,17 +660,16 @@ pub(crate) mod blocking {
             ) {
                 let mut one_accent_list: Vec<i64> = Vec::new();
 
-                for (i, mora) in accent_phrase.moras().iter().enumerate() {
+                for (i, mora) in accent_phrase.moras.iter().enumerate() {
                     let value = (i as i32 == point
-                        || (point < 0
-                            && i == (accent_phrase.moras().len() as i32 + point) as usize))
+                        || (point < 0 && i == (accent_phrase.moras.len() as i32 + point) as usize))
                         .into();
                     one_accent_list.push(value);
-                    if mora.consonant().is_some() {
+                    if mora.consonant.is_some() {
                         one_accent_list.push(value);
                     }
                 }
-                if accent_phrase.pause_mora().is_some() {
+                if accent_phrase.pause_mora.is_some() {
                     one_accent_list.push(0);
                 }
                 accent_list.extend(one_accent_list)
@@ -1036,10 +1025,10 @@ pub(crate) mod blocking {
 
         let mut phoneme_strings = vec!["pau".to_string()];
         for mora in flatten_moras.iter() {
-            if let Some(consonant) = mora.consonant() {
+            if let Some(consonant) = &mora.consonant {
                 phoneme_strings.push(consonant.clone())
             }
-            phoneme_strings.push(mora.vowel().clone());
+            phoneme_strings.push(mora.vowel.clone());
         }
         phoneme_strings.push("pau".to_string());
 
@@ -1050,12 +1039,14 @@ pub(crate) mod blocking {
         fn to_flatten_moras(accent_phrases: &[AccentPhrase]) -> Vec<Mora> {
             let mut flatten_moras = Vec::new();
 
-            for accent_phrase in accent_phrases {
-                let moras = accent_phrase.moras();
+            for AccentPhrase {
+                moras, pause_mora, ..
+            } in accent_phrases
+            {
                 for mora in moras {
                     flatten_moras.push(mora.clone());
                 }
-                if let Some(pause_mora) = accent_phrase.pause_mora() {
+                if let Some(pause_mora) = pause_mora {
                     flatten_moras.push(pause_mora.clone());
                 }
             }
@@ -1112,18 +1103,18 @@ pub(crate) mod blocking {
     impl AudioQuery {
         fn from_accent_phrases(accent_phrases: Vec<AccentPhrase>) -> Self {
             let kana = create_kana(&accent_phrases);
-            Self::new(
+            Self {
                 accent_phrases,
-                1.,
-                0.,
-                1.,
-                1.,
-                0.1,
-                0.1,
-                DEFAULT_SAMPLING_RATE,
-                false,
-                Some(kana),
-            )
+                speed_scale: 1.,
+                pitch_scale: 0.,
+                intonation_scale: 1.,
+                volume_scale: 1.,
+                pre_phoneme_length: 0.1,
+                post_phoneme_length: 0.1,
+                output_sampling_rate: DEFAULT_SAMPLING_RATE,
+                output_stereo: false,
+                kana: Some(kana),
+            }
         }
     }
 }
@@ -1594,41 +1585,39 @@ mod tests {
         .unwrap();
 
         assert_eq!(
-            query.accent_phrases().len(),
+            query.accent_phrases.len(),
             expected_text_consonant_vowel_data.len()
         );
 
-        for (accent_phrase, (text_consonant_vowel_slice, accent_pos)) in
-            std::iter::zip(query.accent_phrases(), expected_text_consonant_vowel_data)
-        {
-            assert_eq!(
-                accent_phrase.moras().len(),
-                text_consonant_vowel_slice.len()
-            );
-            assert_eq!(accent_phrase.accent(), accent_pos);
+        for (accent_phrase, (text_consonant_vowel_slice, accent_pos)) in std::iter::zip(
+            query.accent_phrases,
+            expected_text_consonant_vowel_data.iter().copied(),
+        ) {
+            assert_eq!(accent_phrase.moras.len(), text_consonant_vowel_slice.len());
+            assert_eq!(accent_phrase.accent, accent_pos);
 
-            for (mora, (text, consonant, vowel)) in
-                std::iter::zip(accent_phrase.moras(), *text_consonant_vowel_slice)
-            {
-                assert_eq!(mora.text(), text);
+            for (mora, (text, consonant, vowel)) in std::iter::zip(
+                accent_phrase.moras,
+                text_consonant_vowel_slice.iter().copied(),
+            ) {
+                assert_eq!(mora.text, text);
                 // NOTE: 子音の長さが必ず非ゼロになるテストケースを想定している
                 assert_ne!(
-                    mora.consonant_length(),
-                    &Some(0.),
+                    mora.consonant_length,
+                    Some(0.),
                     "expected mora.consonant_length is not Some(0.0), but got Some(0.0)."
                 );
-                assert_eq!(mora.consonant(), &Some(consonant.to_string()));
-                assert_eq!(mora.vowel(), vowel);
+                assert_eq!(mora.consonant, Some(consonant.to_string()));
+                assert_eq!(mora.vowel, vowel);
                 // NOTE: 母音の長さが必ず非ゼロになるテストケースを想定している
                 assert_ne!(
-                    mora.vowel_length(),
-                    &0.,
+                    mora.vowel_length, 0.,
                     "expected mora.vowel_length is not 0.0, but got 0.0."
                 );
             }
         }
 
-        assert_eq!(query.kana().as_deref(), Some(expected_kana_text));
+        assert_eq!(query.kana.as_deref(), Some(expected_kana_text));
     }
 
     #[rstest]
@@ -1675,31 +1664,29 @@ mod tests {
             expected_text_consonant_vowel_data.len()
         );
 
-        for (accent_phrase, (text_consonant_vowel_slice, accent_pos)) in
-            std::iter::zip(accent_phrases, expected_text_consonant_vowel_data)
-        {
-            assert_eq!(
-                accent_phrase.moras().len(),
-                text_consonant_vowel_slice.len()
-            );
-            assert_eq!(accent_phrase.accent(), accent_pos);
+        for (accent_phrase, (text_consonant_vowel_slice, accent_pos)) in std::iter::zip(
+            accent_phrases,
+            expected_text_consonant_vowel_data.iter().copied(),
+        ) {
+            assert_eq!(accent_phrase.moras.len(), text_consonant_vowel_slice.len());
+            assert_eq!(accent_phrase.accent, accent_pos);
 
-            for (mora, (text, consonant, vowel)) in
-                std::iter::zip(accent_phrase.moras(), *text_consonant_vowel_slice)
-            {
-                assert_eq!(mora.text(), text);
+            for (mora, (text, consonant, vowel)) in std::iter::zip(
+                accent_phrase.moras,
+                text_consonant_vowel_slice.iter().copied(),
+            ) {
+                assert_eq!(mora.text, text);
                 // NOTE: 子音の長さが必ず非ゼロになるテストケースを想定している
                 assert_ne!(
-                    mora.consonant_length(),
-                    &Some(0.),
+                    mora.consonant_length,
+                    Some(0.),
                     "expected mora.consonant_length is not Some(0.0), but got Some(0.0)."
                 );
-                assert_eq!(mora.consonant(), &Some(consonant.to_string()));
-                assert_eq!(mora.vowel(), vowel);
+                assert_eq!(mora.consonant, Some(consonant.to_string()));
+                assert_eq!(mora.vowel, vowel);
                 // NOTE: 母音の長さが必ず非ゼロになるテストケースを想定している
                 assert_ne!(
-                    mora.vowel_length(),
-                    &0.,
+                    mora.vowel_length, 0.,
                     "expected mora.vowel_length is not 0.0, but got 0.0."
                 );
             }
@@ -1736,36 +1723,35 @@ mod tests {
         // AccentPhraseの pause_mora に期待する値をテスト
 
         assert!(
-            accent_phrases[0].pause_mora().is_some(),
-            "accent_phrases[0].pause_mora() is None"
+            accent_phrases[0].pause_mora.is_some(),
+            "accent_phrases[0].pause_mora is None"
         );
         assert!(
-            accent_phrases[1].pause_mora().is_some(),
-            "accent_phrases[1].pause_mora() is None"
+            accent_phrases[1].pause_mora.is_some(),
+            "accent_phrases[1].pause_mora is None"
         );
         assert!(
-            accent_phrases[2].pause_mora().is_some(),
-            "accent_phrases[2].pause_mora() is None"
+            accent_phrases[2].pause_mora.is_some(),
+            "accent_phrases[2].pause_mora is None"
         );
         assert!(
-            accent_phrases[3].pause_mora().is_some(),
-            "accent_phrases[3].pause_mora() is None"
+            accent_phrases[3].pause_mora.is_some(),
+            "accent_phrases[3].pause_mora is None"
         );
         assert!(
-            accent_phrases[4].pause_mora().is_none(), // 文末の句読点は削除される
-            "accent_phrases[4].pause_mora() is not None"
+            accent_phrases[4].pause_mora.is_none(), // 文末の句読点は削除される
+            "accent_phrases[4].pause_mora is not None"
         );
 
         for accent_phrase in accent_phrases.iter().take(4) {
-            let pause_mora = accent_phrase.pause_mora().clone().unwrap();
-            assert_eq!(pause_mora.text(), "、");
-            assert_eq!(pause_mora.consonant(), &None);
-            assert_eq!(pause_mora.consonant_length(), &None);
-            assert_eq!(pause_mora.vowel(), "pau");
+            let pause_mora = accent_phrase.pause_mora.clone().unwrap();
+            assert_eq!(pause_mora.text, "、");
+            assert_eq!(pause_mora.consonant, None);
+            assert_eq!(pause_mora.consonant_length, None);
+            assert_eq!(pause_mora.vowel, "pau");
             assert_ne!(
-                pause_mora.vowel_length(),
-                &0.0,
-                "pause_mora.vowel_length() should not be 0.0"
+                pause_mora.vowel_length, 0.0,
+                "pause_mora.vowel_length should not be 0.0",
             );
         }
     }
@@ -1805,9 +1791,9 @@ mod tests {
             any_mora_param_changed(
                 &accent_phrases,
                 &modified_accent_phrases,
-                Mora::vowel_length
+                |Mora { vowel_length, .. }| vowel_length,
             ),
-            "mora_length() does not work: mora.vowel_length() is not changed."
+            "mora_length() does not work: mora.vowel_length is not changed.",
         );
     }
 
@@ -1843,8 +1829,12 @@ mod tests {
 
         // NOTE: 一つでも音高が変わっていれば、動作しているとみなす
         assert!(
-            any_mora_param_changed(&accent_phrases, &modified_accent_phrases, Mora::pitch),
-            "mora_pitch() does not work: mora.pitch() is not changed."
+            any_mora_param_changed(
+                &accent_phrases,
+                &modified_accent_phrases,
+                |Mora { pitch, .. }| pitch
+            ),
+            "mora_pitch() does not work: mora.pitch is not changed.",
         );
     }
 
@@ -1880,17 +1870,21 @@ mod tests {
 
         // NOTE: 一つでも音高が変わっていれば、動作しているとみなす
         assert!(
-            any_mora_param_changed(&accent_phrases, &modified_accent_phrases, Mora::pitch),
-            "mora_data() does not work: mora.pitch() is not changed."
+            any_mora_param_changed(
+                &accent_phrases,
+                &modified_accent_phrases,
+                |Mora { pitch, .. }| pitch,
+            ),
+            "mora_data() does not work: mora.pitch is not changed.",
         );
         // NOTE: 一つでも母音の長さが変わっていれば、動作しているとみなす
         assert!(
             any_mora_param_changed(
                 &accent_phrases,
                 &modified_accent_phrases,
-                Mora::vowel_length
+                |Mora { vowel_length, .. }| vowel_length,
             ),
-            "mora_data() does not work: mora.vowel_length() is not changed."
+            "mora_data() does not work: mora.vowel_length is not changed.",
         );
     }
 
@@ -1900,7 +1894,7 @@ mod tests {
         param: fn(&Mora) -> &T,
     ) -> bool {
         std::iter::zip(before, after)
-            .flat_map(move |(before, after)| std::iter::zip(before.moras(), after.moras()))
+            .flat_map(|(before, after)| std::iter::zip(&before.moras, &after.moras))
             .any(|(before, after)| param(before) != param(after))
     }
 
diff --git a/crates/voicevox_core/src/user_dict/word.rs b/crates/voicevox_core/src/user_dict/word.rs
index 7ed98a949..96a47dcc4 100644
--- a/crates/voicevox_core/src/user_dict/word.rs
+++ b/crates/voicevox_core/src/user_dict/word.rs
@@ -5,25 +5,24 @@ use crate::{
         priority2cost, MAX_PRIORITY, MIN_PRIORITY, PART_OF_SPEECH_DETAIL,
     },
 };
-use derive_getters::Getters;
 use once_cell::sync::Lazy;
 use regex::Regex;
 use serde::{de::Error as _, Deserialize, Serialize};
 use std::ops::RangeToInclusive;
 
 /// ユーザー辞書の単語。
-#[derive(Clone, Debug, Getters, Serialize)]
+#[derive(Clone, Debug, Serialize)]
 pub struct UserDictWord {
     /// 単語の表記。
-    pub surface: String,
+    surface: String,
     /// 単語の読み。
-    pub pronunciation: String,
+    pronunciation: String,
     /// アクセント型。
-    pub accent_type: usize,
+    accent_type: usize,
     /// 単語の種類。
-    pub word_type: UserDictWordType,
+    word_type: UserDictWordType,
     /// 単語の優先度。
-    pub priority: u32,
+    priority: u32,
 
     /// モーラ数。
     mora_count: usize,
@@ -127,6 +126,31 @@ impl UserDictWord {
             mora_count,
         })
     }
+
+    /// 単語の表記。
+    pub fn surface(&self) -> &str {
+        &self.surface
+    }
+
+    /// 単語の読み。
+    pub fn pronunciation(&self) -> &str {
+        &self.pronunciation
+    }
+
+    /// アクセント型。
+    pub fn accent_type(&self) -> usize {
+        self.accent_type
+    }
+
+    /// 単語の種類。
+    pub fn word_type(&self) -> UserDictWordType {
+        self.word_type
+    }
+
+    /// 単語の優先度。
+    pub fn priority(&self) -> u32 {
+        self.priority
+    }
 }
 
 /// カタカナの文字列が発音として有効かどうかを判定する。
@@ -203,7 +227,7 @@ pub(crate) fn to_zenkaku(surface: &str) -> String {
         .collect()
 }
 /// ユーザー辞書の単語の種類。
-#[derive(Clone, Debug, PartialEq, Eq, Serialize, Deserialize, Hash)]
+#[derive(Clone, Copy, Debug, PartialEq, Eq, Serialize, Deserialize, Hash)]
 #[serde(rename_all = "SCREAMING_SNAKE_CASE")]
 pub enum UserDictWordType {
     /// 固有名詞。
diff --git a/crates/voicevox_core/src/voice_model.rs b/crates/voicevox_core/src/voice_model.rs
index f5e862854..027747ab7 100644
--- a/crates/voicevox_core/src/voice_model.rs
+++ b/crates/voicevox_core/src/voice_model.rs
@@ -3,9 +3,7 @@
 //! VVM ファイルの定義と形式は[ドキュメント](../../../docs/vvm.md)を参照。
 
 use anyhow::anyhow;
-use derive_getters::Getters;
 use derive_more::From;
-use derive_new::new;
 use easy_ext::ext;
 use enum_map::EnumMap;
 use itertools::Itertools as _;
@@ -41,15 +39,16 @@ pub(crate) type ModelBytesWithInnerVoiceIdsByDomain =
     Hash,
     PartialOrd,
     Deserialize,
-    new,
-    Getters,
     derive_more::Display,
     Debug,
     From,
 )]
-#[serde(transparent)]
-pub struct VoiceModelId {
-    raw_voice_model_id: RawVoiceModelId,
+pub struct VoiceModelId(RawVoiceModelId);
+
+impl VoiceModelId {
+    pub fn raw_voice_model_id(self) -> RawVoiceModelId {
+        self.0
+    }
 }
 
 // FIXME: "header"といいつつ、VVMのファイルパスを持っている状態になっている。
@@ -106,9 +105,8 @@ impl ManifestDomains {
     fn check_acceptable(&self, metas: &[SpeakerMeta]) -> std::result::Result<(), StyleType> {
         let err = metas
             .iter()
-            .flat_map(SpeakerMeta::styles)
-            .map(StyleMeta::r#type)
-            .copied()
+            .flat_map(|SpeakerMeta { styles, .. }| styles)
+            .map(|StyleMeta { r#type, .. }| *r#type)
             .unique()
             .find(|&style_type| !self.accepts(style_type));
 
@@ -153,6 +151,7 @@ pub(crate) mod blocking {
     use ouroboros::self_referencing;
     use rayon::iter::{IntoParallelIterator as _, ParallelIterator as _};
     use serde::de::DeserializeOwned;
+    use uuid::Uuid;
 
     use crate::{
         error::{LoadModelError, LoadModelErrorKind, LoadModelResult},
@@ -288,8 +287,8 @@ pub(crate) mod blocking {
 
     #[ext(IdRef)]
     pub impl VoiceModel {
-        fn id_ref(&self) -> &VoiceModelId {
-            &self.header.manifest.id
+        fn id_ref(&self) -> &Uuid {
+            &self.header.manifest.id.0
         }
     }
 }
diff --git a/crates/voicevox_core_c_api/src/compatible_engine.rs b/crates/voicevox_core_c_api/src/compatible_engine.rs
index bd66210e2..70fa83710 100644
--- a/crates/voicevox_core_c_api/src/compatible_engine.rs
+++ b/crates/voicevox_core_c_api/src/compatible_engine.rs
@@ -51,8 +51,8 @@ static VOICE_MODEL_SET: Lazy<VoiceModelSet> = Lazy::new(|| {
     let mut style_model_map = BTreeMap::default();
     for vvm in all_vvms.iter() {
         for meta in vvm.metas().iter() {
-            for style in meta.styles().iter() {
-                style_model_map.insert(*style.id(), vvm.id());
+            for style in meta.styles.iter() {
+                style_model_map.insert(style.id, vvm.id());
             }
         }
     }
diff --git a/crates/voicevox_core_c_api/src/lib.rs b/crates/voicevox_core_c_api/src/lib.rs
index 3904698fc..38c06cd4f 100644
--- a/crates/voicevox_core_c_api/src/lib.rs
+++ b/crates/voicevox_core_c_api/src/lib.rs
@@ -449,7 +449,7 @@ pub unsafe extern "C" fn voicevox_voice_model_new_from_path(
 #[no_mangle]
 pub extern "C" fn voicevox_voice_model_id(model: &VoicevoxVoiceModel) -> VoicevoxVoiceModelId<'_> {
     init_logger_once();
-    model.model.id_ref().raw_voice_model_id().as_bytes()
+    model.model.id_ref().as_bytes()
 }
 
 /// ::VoicevoxVoiceModel からメタ情報を取得する。
@@ -1281,9 +1281,9 @@ pub extern "C" fn voicevox_user_dict_word_make(
     VoicevoxUserDictWord {
         surface,
         pronunciation,
-        accent_type: UserDictWord::default().accent_type,
-        word_type: UserDictWord::default().word_type.into(),
-        priority: UserDictWord::default().priority,
+        accent_type: UserDictWord::default().accent_type(),
+        word_type: UserDictWord::default().word_type().into(),
+        priority: UserDictWord::default().priority(),
     }
 }
 
diff --git a/crates/voicevox_core_java_api/src/voice_model.rs b/crates/voicevox_core_java_api/src/voice_model.rs
index 546ab9bf6..1ea90ba8c 100644
--- a/crates/voicevox_core_java_api/src/voice_model.rs
+++ b/crates/voicevox_core_java_api/src/voice_model.rs
@@ -35,7 +35,7 @@ unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_VoiceModel_rsGetId<'loc
             .get_rust_field::<_, _, Arc<voicevox_core::blocking::VoiceModel>>(&this, "handle")?
             .clone();
 
-        let id = env.new_uuid(*internal.id().raw_voice_model_id())?;
+        let id = env.new_uuid(internal.id().raw_voice_model_id())?;
 
         Ok(id.into_raw())
     })
diff --git a/crates/voicevox_core_python_api/src/lib.rs b/crates/voicevox_core_python_api/src/lib.rs
index e301f1042..001df0713 100644
--- a/crates/voicevox_core_python_api/src/lib.rs
+++ b/crates/voicevox_core_python_api/src/lib.rs
@@ -173,7 +173,7 @@ mod blocking {
 
         #[getter]
         fn id(&self, py: Python<'_>) -> PyResult<PyObject> {
-            let id = *self.model.id().raw_voice_model_id();
+            let id = self.model.id().raw_voice_model_id();
             crate::convert::to_py_uuid(py, id)
         }
 
@@ -676,7 +676,7 @@ mod asyncio {
 
         #[getter]
         fn id(&self, py: Python<'_>) -> PyResult<PyObject> {
-            let id = *self.model.id().raw_voice_model_id();
+            let id = self.model.id().raw_voice_model_id();
             crate::convert::to_py_uuid(py, id)
         }
 

From e22ec4714495bc502387155c911efa4972ef5aea Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Tue, 23 Jul 2024 08:59:06 +0900
Subject: [PATCH 15/36] =?UTF-8?q?chore:=20sphinx-autoapi=E3=82=92v3.1.0?=
 =?UTF-8?q?=E3=81=AB=E4=B8=8A=E3=81=92=E3=82=8B=20(#808)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* chore: sphinx-autoapiをv3.1.0に上げる

* poetry.lockを修正

* poetry.lockをGHAの`ubuntu-22.04`が吐くやつに合わせる

* `exclude_patterns`にコメント
---
 .github/workflows/generate_document.yml       |  3 ---
 crates/voicevox_core_python_api/poetry.lock   | 22 +++++--------------
 .../voicevox_core_python_api/pyproject.toml   |  2 +-
 docs/apis/python_api/conf.py                  |  2 +-
 4 files changed, 7 insertions(+), 22 deletions(-)

diff --git a/.github/workflows/generate_document.yml b/.github/workflows/generate_document.yml
index c4af6b80b..d63a2f819 100644
--- a/.github/workflows/generate_document.yml
+++ b/.github/workflows/generate_document.yml
@@ -65,9 +65,6 @@ jobs:
           working-directory: "docs/apis/c_api/doxygen"
       - name: Build voicevox_core_python_api
         run: maturin develop --manifest-path ./crates/voicevox_core_python_api/Cargo.toml --locked
-      # https://github.com/readthedocs/sphinx-autoapi/issues/405
-      - name: Workaround to make Sphinx recognize `_rust` as a module
-        run: touch ./crates/voicevox_core_python_api/python/voicevox_core/_rust/__init__.py
       - name: Generate Sphinx document
         run: sphinx-build docs/apis/python_api public/apis/python_api
       - name: Generate Javadoc
diff --git a/crates/voicevox_core_python_api/poetry.lock b/crates/voicevox_core_python_api/poetry.lock
index 0decb2a6a..911dfafc2 100644
--- a/crates/voicevox_core_python_api/poetry.lock
+++ b/crates/voicevox_core_python_api/poetry.lock
@@ -1,4 +1,4 @@
-# This file is automatically @generated by Poetry 1.7.1 and should not be changed by hand.
+# This file is automatically @generated by Poetry 1.8.3 and should not be changed by hand.
 
 [[package]]
 name = "accessible-pygments"
@@ -39,17 +39,6 @@ files = [
 [package.dependencies]
 typing-extensions = {version = ">=4.0.0", markers = "python_version < \"3.9\""}
 
-[[package]]
-name = "anyascii"
-version = "0.3.2"
-description = "Unicode to ASCII transliteration"
-optional = false
-python-versions = ">=3.3"
-files = [
-    {file = "anyascii-0.3.2-py3-none-any.whl", hash = "sha256:3b3beef6fc43d9036d3b0529050b0c48bfad8bc960e9e562d7223cfb94fe45d4"},
-    {file = "anyascii-0.3.2.tar.gz", hash = "sha256:9d5d32ef844fe225b8bc7cba7f950534fae4da27a9bf3a6bea2cb0ea46ce4730"},
-]
-
 [[package]]
 name = "astroid"
 version = "3.0.1"
@@ -923,17 +912,16 @@ test = ["cython", "filelock", "html5lib", "pytest (>=4.6)"]
 
 [[package]]
 name = "sphinx-autoapi"
-version = "3.0.0"
+version = "3.1.0"
 description = "Sphinx API documentation generator"
 optional = false
 python-versions = ">=3.8"
 files = [
-    {file = "sphinx-autoapi-3.0.0.tar.gz", hash = "sha256:09ebd674a32b44467222b0fb8a917b97c89523f20dbf05b52cb8a3f0e15714de"},
-    {file = "sphinx_autoapi-3.0.0-py2.py3-none-any.whl", hash = "sha256:ea207793cba1feff7b2ded0e29364f2995a4d157303a98603cee0ce94cea2688"},
+    {file = "sphinx_autoapi-3.1.0-py2.py3-none-any.whl", hash = "sha256:b102ded12ff5397ff6f9536065644c0a01a203b1d53dac07419c267fd771367f"},
+    {file = "sphinx_autoapi-3.1.0.tar.gz", hash = "sha256:c5455191c36af19e0de73dd52e15feb04a37ca4439fa5e8d77f1941768c15d32"},
 ]
 
 [package.dependencies]
-anyascii = "*"
 astroid = [
     {version = ">=2.7", markers = "python_version < \"3.12\""},
     {version = ">=3.0.0a1", markers = "python_version >= \"3.12\""},
@@ -1091,4 +1079,4 @@ testing = ["big-O", "jaraco.functools", "jaraco.itertools", "more-itertools", "p
 [metadata]
 lock-version = "2.0"
 python-versions = ">=3.8,<3.13"
-content-hash = "42faee9d02ea5ad43eaef485f2127f0ffd77a5f8951ef71529eb1e85249e9c04"
+content-hash = "68fffc23b63507c95b965429a6a54f161f8c6a94fe98b6dcad001475f690b6a3"
diff --git a/crates/voicevox_core_python_api/pyproject.toml b/crates/voicevox_core_python_api/pyproject.toml
index 4ae2da74a..ac9dba7b3 100644
--- a/crates/voicevox_core_python_api/pyproject.toml
+++ b/crates/voicevox_core_python_api/pyproject.toml
@@ -44,7 +44,7 @@ pydantic = ">=2.5.2,<3"
 [tool.poetry.group.docs.dependencies]
 sphinx = "6.2.1"
 pydata-sphinx-theme = "0.14.1"
-sphinx-autoapi = "3.0.0"
+sphinx-autoapi = "3.1.0"
 
 [tool.poetry.group.dev.dependencies]
 maturin = "1.3.1"
diff --git a/docs/apis/python_api/conf.py b/docs/apis/python_api/conf.py
index b1695b750..60f9df90e 100644
--- a/docs/apis/python_api/conf.py
+++ b/docs/apis/python_api/conf.py
@@ -32,7 +32,7 @@
 ]
 
 # templates_path = ['_templates']
-exclude_patterns = []
+exclude_patterns = ["autoapi/*/_rust/*"] # パブリックAPIを意図した部分ではなく、またorphan扱いとなって警告が出るため
 
 
 # -- Options for HTML output -------------------------------------------------

From 21290d0ae30a17e6fec7e41c817533616827ebf9 Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Sat, 3 Aug 2024 22:35:15 +0900
Subject: [PATCH 16/36] chore(deps): update dependency rust to v1.80.0 (#809)

* chore(deps): update dependency rust to v1.80.0

* Fix Clippy lints

---------

Co-authored-by: renovate[bot] <29139614+renovate[bot]@users.noreply.github.com>
Co-authored-by: Ryo Yamashita <qryxip@gmail.com>
---
 crates/voicevox_core/src/user_dict/word.rs | 2 ++
 crates/voicevox_core_c_api/src/lib.rs      | 8 +++++---
 rust-toolchain                             | 2 +-
 3 files changed, 8 insertions(+), 4 deletions(-)

diff --git a/crates/voicevox_core/src/user_dict/word.rs b/crates/voicevox_core/src/user_dict/word.rs
index 96a47dcc4..f6bbc182f 100644
--- a/crates/voicevox_core/src/user_dict/word.rs
+++ b/crates/voicevox_core/src/user_dict/word.rs
@@ -212,8 +212,10 @@ fn calculate_mora_count(pronunciation: &str, accent_type: usize) -> InvalidWordR
 /// 一部の種類の文字を、全角文字に置き換える。
 ///
 /// 具体的には
+///
 /// - "!"から"~"までの範囲の文字(数字やアルファベット)は、対応する全角文字に
 /// - " "などの目に見えない文字は、まとめて全角スペース(0x3000)に
+///
 /// 変換する。
 pub(crate) fn to_zenkaku(surface: &str) -> String {
     // 元実装：https://github.com/VOICEVOX/voicevox/blob/69898f5dd001d28d4de355a25766acb0e0833ec2/src/components/DictionaryManageDialog.vue#L379-L387
diff --git a/crates/voicevox_core_c_api/src/lib.rs b/crates/voicevox_core_c_api/src/lib.rs
index 38c06cd4f..a634e6ae8 100644
--- a/crates/voicevox_core_c_api/src/lib.rs
+++ b/crates/voicevox_core_c_api/src/lib.rs
@@ -1,6 +1,8 @@
-// ここにあるRustdocはcbindgen向けのものである。safety documentation自体は書くが、Doxygenの慣習に従
-// い`<dt>`で書く。
-#![allow(clippy::missing_safety_doc)]
+// ここにある`#[doc]`はすべてrustdocではなくDoxygen向けのものである。
+#![allow(
+    clippy::doc_lazy_continuation,
+    clippy::missing_safety_doc // safety documentation自体は書くが、Doxygenの慣習に従い`<dt>`で書く
+)]
 
 mod c_impls;
 /// cbindgen:ignore
diff --git a/rust-toolchain b/rust-toolchain
index b3a8c61e6..aaceec04e 100644
--- a/rust-toolchain
+++ b/rust-toolchain
@@ -1 +1 @@
-1.79.0
+1.80.0

From bf8cdb87ee478177252a516b1e98a8172ddc37a2 Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Mon, 5 Aug 2024 00:18:03 +0900
Subject: [PATCH 17/36] change: rework GPU features (#810)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* change: rework GPU features

* `body`に対してコメント

* `<table>`の組み立てを`build-spec-table`に集約する

* fixup! `<table>`の組み立てを`build-spec-table`に集約する

* `GpuSpec::defaults`の網羅性をテスト

* `DeviceAvailabilities`の表示を日本語にする

* デフォルトを`VOICEVOX/onnxruntime-builder`宛てにする

* `if cfg!(…)`の形にする

* `load-onnxruntime`でCUDAとDirectMLが使えることに言及
---
 .github/workflows/build_and_deploy.yml        | 104 +--
 .github/workflows/download_test.yml           |   8 +-
 .github/workflows/test.yml                    |  28 +-
 Cargo.lock                                    | 672 +++++++++++++++++-
 Cargo.toml                                    |   2 +
 crates/downloader/Cargo.toml                  |   3 +
 crates/downloader/src/main.rs                 | 216 ++++--
 crates/voicevox_core/Cargo.toml               |   7 +-
 crates/voicevox_core/src/devices.rs           | 213 +++++-
 crates/voicevox_core/src/error.rs             |   7 +-
 crates/voicevox_core/src/infer.rs             |  15 +-
 .../src/infer/runtimes/onnxruntime.rs         |  46 +-
 crates/voicevox_core/src/lib.rs               |  28 +-
 crates/voicevox_core/src/status.rs            |  25 +-
 crates/voicevox_core/src/synthesizer.rs       |  69 +-
 crates/voicevox_core_c_api/Cargo.toml         |   2 -
 .../include/voicevox_core.h                   |   4 +-
 crates/voicevox_core_c_api/src/lib.rs         |   4 +-
 .../voicevox_core_c_api/tests/e2e/log_mask.rs |   2 +-
 .../tests/e2e/snapshots.toml                  |  10 +
 crates/voicevox_core_java_api/Cargo.toml      |   4 -
 .../jp/hiroshiba/voicevoxcore/GlobalInfo.java |   6 +-
 crates/voicevox_core_python_api/Cargo.toml    |   4 -
 .../python/voicevox_core/_models.py           |   4 +-
 docs/downloader.md                            |   6 +-
 docs/usage.md                                 |   4 +-
 example/cpp/windows/README.md                 |   2 +-
 example/python/README.md                      |   2 +
 28 files changed, 1221 insertions(+), 276 deletions(-)

diff --git a/.github/workflows/build_and_deploy.yml b/.github/workflows/build_and_deploy.yml
index e9b5e9eb5..9283b273d 100644
--- a/.github/workflows/build_and_deploy.yml
+++ b/.github/workflows/build_and_deploy.yml
@@ -61,123 +61,90 @@ jobs:
           includes='[
             {
               "os": "windows-2019",
-              "features": "",
               "target": "x86_64-pc-windows-msvc",
-              "artifact_name": "windows-x64-cpu",
+              "artifact_name": "windows-x64",
               "c_release_format": "plain-cdylib",
-              "whl_local_version": "cpu",
-              "can_skip_in_simple_test": true
-            },
-            {
-              "os": "windows-2019",
-              "features": "directml",
-              "target": "x86_64-pc-windows-msvc",
-              "artifact_name": "windows-x64-directml",
-              "c_release_format": "plain-cdylib",
-              "whl_local_version": "directml",
+              "python_whl": true,
               "can_skip_in_simple_test": false
             },
             {
               "os": "windows-2019",
-              "features": "cuda",
-              "target": "x86_64-pc-windows-msvc",
-              "artifact_name": "windows-x64-cuda",
-              "c_release_format": "plain-cdylib",
-              "whl_local_version": "cuda",
-              "can_skip_in_simple_test": true
-            },
-            {
-              "os": "windows-2019",
-              "features": "",
               "target": "i686-pc-windows-msvc",
-              "artifact_name": "windows-x86-cpu",
-              "c_release_format": "plain-cdylib",
-              "whl_local_version": "cpu",
-              "can_skip_in_simple_test": true
-            },
-            {
-              "os": "ubuntu-20.04",
-              "features": "",
-              "target": "x86_64-unknown-linux-gnu",
-              "artifact_name": "linux-x64-cpu",
+              "artifact_name": "windows-x86",
               "c_release_format": "plain-cdylib",
-              "whl_local_version": "cpu",
+              "python_whl": true,
               "can_skip_in_simple_test": true
             },
             {
               "os": "ubuntu-20.04",
-              "features": "cuda",
               "target": "x86_64-unknown-linux-gnu",
-              "artifact_name": "linux-x64-gpu",
+              "artifact_name": "linux-x64",
               "c_release_format": "plain-cdylib",
-              "whl_local_version": "cuda",
+              "python_whl": true,
               "can_skip_in_simple_test": false
             },
             {
               "os": "ubuntu-20.04",
-              "features": "",
               "target": "aarch64-unknown-linux-gnu",
-              "artifact_name": "linux-arm64-cpu",
+              "artifact_name": "linux-arm64",
               "c_release_format": "plain-cdylib",
-              "whl_local_version": "cpu",
+              "python_whl": true,
               "can_skip_in_simple_test": true
             },
             {
               "os": "ubuntu-20.04",
-              "features": "",
               "target": "aarch64-linux-android",
-              "artifact_name": "android-arm64-cpu",
+              "artifact_name": "android-arm64",
               "c_release_format": "plain-cdylib",
+              "python_whl": false,
               "can_skip_in_simple_test": true
             },
             {
               "os": "ubuntu-20.04",
-              "features": "",
               "target": "x86_64-linux-android",
-              "artifact_name": "android-x86_64-cpu",
+              "artifact_name": "android-x86_64",
               "c_release_format": "plain-cdylib",
+              "python_whl": false,
               "can_skip_in_simple_test": true
             },
             {
               "os": "macos-12",
-              "features": "",
               "target": "aarch64-apple-darwin",
-              "artifact_name": "osx-arm64-cpu",
+              "artifact_name": "osx-arm64",
               "c_release_format": "plain-cdylib",
-              "whl_local_version": "cpu",
+              "python_whl": true,
               "can_skip_in_simple_test": false
             },
             {
               "os": "macos-12",
-              "features": "",
               "target": "x86_64-apple-darwin",
-              "artifact_name": "osx-x64-cpu",
+              "artifact_name": "osx-x64",
               "c_release_format": "plain-cdylib",
-              "whl_local_version": "cpu",
+              "python_whl": true,
               "can_skip_in_simple_test": true
             },
             {
               "os": "macos-12",
-              "features": "",
               "target": "aarch64-apple-ios",
               "artifact_name": "ios-arm64-cpu",
               "c_release_format": "ios-xcframework",
+              "python_whl": false,
               "can_skip_in_simple_test": true
             },
             {
               "os": "macos-12",
-              "features": "",
               "target": "aarch64-apple-ios-sim",
               "artifact_name": "ios-arm64-cpu-sim",
               "c_release_format": "ios-xcframework",
+              "python_whl": false,
               "can_skip_in_simple_test": true
             },
             {
               "os": "macos-12",
-              "features": "",
               "target": "x86_64-apple-ios",
               "artifact_name": "ios-x64-cpu",
               "c_release_format": "ios-xcframework",
+              "python_whl": false,
               "can_skip_in_simple_test": true
             }
           ]'
@@ -216,7 +183,7 @@ jobs:
             git -c user.name=dummy -c user.email=dummy@dummy.dummy merge FETCH_HEAD
           ) > /dev/null 2>&1
       - name: Set up Python 3.8
-        if: matrix.whl_local_version
+        if: matrix.python_whl
         uses: actions/setup-python@v5
         with:
           python-version: "3.8"
@@ -258,7 +225,7 @@ jobs:
       - name: set cargo version
         run: |
           cargo set-version "$VERSION" --exclude voicevox_core_python_api --exclude downloader --exclude xtask
-          if ${{ !!matrix.whl_local_version }}; then cargo set-version "$VERSION+"${{ matrix.whl_local_version }} -p voicevox_core_python_api; fi
+          if ${{ matrix.python_whl }}; then cargo set-version "$VERSION" -p voicevox_core_python_api; fi
       - name: cache target
         uses: Swatinem/rust-cache@v2
         if: ${{ !inputs.is_production }}
@@ -270,7 +237,7 @@ jobs:
             ios-xcframework) linking=link-onnxruntime ;;
           esac
           function build() {
-            cargo build -p voicevox_core_c_api -vv --features "$linking",${{ matrix.features }} --target ${{ matrix.target }} --release
+            cargo build -p voicevox_core_c_api -vv --features "$linking" --target ${{ matrix.target }} --release
           }
           if ${{ !inputs.is_production }}; then
             build
@@ -280,7 +247,7 @@ jobs:
         env:
           RUSTFLAGS: -C panic=abort
       - name: build voicevox_core_python_api
-        if: matrix.whl_local_version
+        if: matrix.python_whl
         id: build-voicevox-core-python-api
         run: |
           rm -rf ./target/wheels
@@ -288,7 +255,7 @@ jobs:
           poetry config virtualenvs.create false
           (cd crates/voicevox_core_python_api && poetry install --with dev)
           function build() {
-            maturin build --manifest-path ./crates/voicevox_core_python_api/Cargo.toml --features ${{ matrix.features }}, --target ${{ matrix.target }} --release
+            maturin build --manifest-path ./crates/voicevox_core_python_api/Cargo.toml --target ${{ matrix.target }} --release
           }
           if ${{ !inputs.is_production }}; then
             build
@@ -300,7 +267,7 @@ jobs:
         if: contains(matrix.target, 'android')
         run: |
           function build() {
-            cargo build -p voicevox_core_java_api -vv --features ${{ matrix.features }}, --target ${{ matrix.target }} --release
+            cargo build -p voicevox_core_java_api -vv --target ${{ matrix.target }} --release
           }
           if ${{ !inputs.is_production }}; then
             build
@@ -318,9 +285,6 @@ jobs:
             > "artifact/${{ env.ASSET_NAME }}/voicevox_core.h"
           cp -v target/${{ matrix.target }}/release/*voicevox_core.{dll,so,dylib} "artifact/${{ env.ASSET_NAME }}" || true
           cp -v target/${{ matrix.target }}/release/voicevox_core.dll.lib "artifact/${{ env.ASSET_NAME }}/voicevox_core.lib" || true
-          cp -v -n target/${{ matrix.target }}/release/{,lib}onnxruntime*.{dll,so.*,so,dylib} "artifact/${{ env.ASSET_NAME }}" || true
-          # libonnxruntimeについてはバージョン付のshared libraryを使用するためバージョンがついてないものを削除する
-          rm -f artifact/${{ env.ASSET_NAME }}/libonnxruntime.{so,dylib}
           cp -v README.md "artifact/${{ env.ASSET_NAME }}/README.txt"
           echo "${{ env.VERSION }}" > "artifact/${{ env.ASSET_NAME }}/VERSION"
 
@@ -354,7 +318,7 @@ jobs:
             ${{ env.ASSET_NAME }}.zip
           target_commitish: ${{ github.sha }}
       - name: Upload Python whl to Release
-        if: fromJson(needs.config.outputs.deploy) && matrix.whl_local_version
+        if: fromJson(needs.config.outputs.deploy) && matrix.python_whl
         uses: softprops/action-gh-release@v2
         with:
           prerelease: true
@@ -475,17 +439,17 @@ jobs:
         run:
           cargo set-version "$VERSION" -p voicevox_core_java_api
 
-      - name: "Download artifact (android-arm64-cpu)"
+      - name: "Download artifact (android-arm64)"
         uses: actions/download-artifact@v4
         with:
-          name: voicevox_core_java_api-android-arm64-cpu
-          path: artifact/android-arm64-cpu
+          name: voicevox_core_java_api-android-arm64
+          path: artifact/android-arm64
 
-      - name: "Download artifact (android-x86_64-cpu)"
+      - name: "Download artifact (android-x86_64)"
         uses: actions/download-artifact@v4
         with:
-          name: voicevox_core_java_api-android-x86_64-cpu
-          path: artifact/android-x86_64-cpu
+          name: voicevox_core_java_api-android-x86_64
+          path: artifact/android-x86_64
 
       - name: Print tree
         run: tree artifact
@@ -494,8 +458,8 @@ jobs:
         run: |
           rm -rf crates/voicevox_core_java_api/lib/src/main/resources/dll
           cat <<EOF | while read -r line; do
-          android-arm64-cpu|arm64-v8a
-          android-x86_64-cpu|x86_64
+          android-arm64|arm64-v8a
+          android-x86_64|x86_64
           EOF
             IFS='|' read -r artifact_name target <<< "$line"
             mkdir "crates/voicevox_core_java_api/lib/src/main/resources/jniLibs/${target}/"
diff --git a/.github/workflows/download_test.yml b/.github/workflows/download_test.yml
index 9f953534a..ebdd25813 100644
--- a/.github/workflows/download_test.yml
+++ b/.github/workflows/download_test.yml
@@ -102,7 +102,7 @@ jobs:
               open_jtalk_dic_utf_8-1.11
           - name: DirectML option確認
             os: windows-latest
-            download_command: cargo run -vv -p downloader -- --device directml
+            download_command: cargo run -vv -p downloader -- --devices directml
             download_dir: voicevox_core
             check_items: |
               voicevox_core.dll
@@ -121,7 +121,7 @@ jobs:
               *curand*
           - name: DirectMLかつMin option確認
             os: windows-latest
-            download_command: cargo run -vv -p downloader -- --device directml --min
+            download_command: cargo run -vv -p downloader -- --devices directml --min
             download_dir: voicevox_core
             check_items: |
               voicevox_core.dll
@@ -139,7 +139,7 @@ jobs:
               open_jtalk_dic_utf_8-1.11
           - name: cuda option確認
             os: windows-latest
-            download_command: cargo run -vv -p downloader -- --device cuda
+            download_command: cargo run -vv -p downloader -- --devices cuda
             download_dir: voicevox_core
             check_items: |
               voicevox_core.dll
@@ -161,7 +161,7 @@ jobs:
               *directml*
           - name: cudaかつmin option確認
             os: windows-latest
-            download_command: cargo run -vv -p downloader -- --device cuda --min
+            download_command: cargo run -vv -p downloader -- --devices cuda --min
             download_dir: voicevox_core
             check_items: |
               voicevox_core.dll
diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml
index 8550fbfca..d84d16442 100644
--- a/.github/workflows/test.yml
+++ b/.github/workflows/test.yml
@@ -72,10 +72,10 @@ jobs:
         with:
           python-version: "3.8"
       - uses: Swatinem/rust-cache@v2
-      - run: cargo clippy -vv --features directml,cuda --tests -- -D clippy::all -D warnings --no-deps
-      - run: cargo clippy -vv --features directml,cuda -- -D clippy::all -D warnings --no-deps
-      - run: cargo clippy -vv -p voicevox_core -p voicevox_core_c_api --features link-onnxruntime,directml,cuda --tests -- -D clippy::all -D warnings --no-deps
-      - run: cargo clippy -vv -p voicevox_core -p voicevox_core_c_api --features link-onnxruntime,directml,cuda -- -D clippy::all -D warnings --no-deps
+      - run: cargo clippy -vv --tests -- -D clippy::all -D warnings --no-deps
+      - run: cargo clippy -vv -- -D clippy::all -D warnings --no-deps
+      - run: cargo clippy -vv -p voicevox_core -p voicevox_core_c_api --features link-onnxruntime --tests -- -D clippy::all -D warnings --no-deps
+      - run: cargo clippy -vv -p voicevox_core -p voicevox_core_c_api --features link-onnxruntime -- -D clippy::all -D warnings --no-deps
       - run: cargo fmt -- --check
 
   rust-unit-test:
@@ -88,7 +88,7 @@ jobs:
         with:
           key: "cargo-unit-test-cache"
       - name: Run cargo unit test
-        run: RUST_BACKTRACE=full cargo test --lib --bins -vv --features , -- --include-ignored
+        run: RUST_BACKTRACE=full cargo test --lib --bins -vv -- --include-ignored
       - name: Run cargo documentation test
         run: RUST_BACKTRACE=full cargo test --doc -vv
 
@@ -101,14 +101,12 @@ jobs:
         id: strategy-matrix
         run: |
           includes='[
-            { "os": "windows-2019", "features": "", "can_skip_in_simple_test": true },
-            { "os": "windows-2022", "features": "", "can_skip_in_simple_test": true },
-            { "os": "windows-2019", "features": "directml", "can_skip_in_simple_test": false },
-            { "os": "windows-2022", "features": "directml", "can_skip_in_simple_test": true },
-            { "os": "macos-12", "features": "", "can_skip_in_simple_test": false },
-            { "os": "macos-13", "features": "", "can_skip_in_simple_test": true },
-            { "os": "ubuntu-20.04", "features": "", "can_skip_in_simple_test": false },
-            { "os": "ubuntu-22.04", "features": "", "can_skip_in_simple_test": true }
+            { "os": "windows-2019", "can_skip_in_simple_test": true },
+            { "os": "windows-2022", "can_skip_in_simple_test": true },
+            { "os": "macos-12", "can_skip_in_simple_test": false },
+            { "os": "macos-13", "can_skip_in_simple_test": true },
+            { "os": "ubuntu-20.04", "can_skip_in_simple_test": false },
+            { "os": "ubuntu-22.04", "can_skip_in_simple_test": true }
           ]'
 
           # FIXME: composite action に切り出す
@@ -135,9 +133,9 @@ jobs:
         uses: ./.github/actions/rust-toolchain-from-file
       - uses: Swatinem/rust-cache@v2
         with:
-          key: "cargo-integration-test-cache-${{ matrix.features }}-${{ matrix.os }}"
+          key: "cargo-integration-test-cache-${{ matrix.os }}"
       - name: Run cargo integration test (load-onnxruntime)
-        run: RUST_BACKTRACE=full cargo test --test "*" -vv --features ,${{ matrix.features }} -- --include-ignored
+        run: RUST_BACKTRACE=full cargo test --test "*" -vv -- --include-ignored
 
   c-header:
     runs-on: ubuntu-latest
diff --git a/Cargo.lock b/Cargo.lock
index a612d57e6..9fdf8f695 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -29,6 +29,19 @@ dependencies = [
  "opaque-debug",
 ]
 
+[[package]]
+name = "ahash"
+version = "0.8.11"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e89da841a80418a9b391ebaea17f5c112ffaaa96f621d2c285b5174da76b9011"
+dependencies = [
+ "cfg-if",
+ "getrandom",
+ "once_cell",
+ "version_check",
+ "zerocopy",
+]
+
 [[package]]
 name = "aho-corasick"
 version = "1.1.2"
@@ -86,6 +99,7 @@ dependencies = [
  "anstyle",
  "anstyle-parse",
  "anstyle-query",
+ "anstyle-wincon",
  "colorchoice",
  "utf8parse",
 ]
@@ -114,6 +128,16 @@ dependencies = [
  "windows-sys 0.48.0",
 ]
 
+[[package]]
+name = "anstyle-wincon"
+version = "2.1.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "58f54d10c6dfa51283a066ceab3ec1ab78d13fae00aa49243a45e4571fb79dfd"
+dependencies = [
+ "anstyle",
+ "windows-sys 0.48.0",
+]
+
 [[package]]
 name = "anyhow"
 version = "1.0.65"
@@ -229,6 +253,15 @@ version = "1.0.1"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "8a32fd6af2b5827bce66c29053ba0e7c42b9dcab01835835058558c10851a46b"
 
+[[package]]
+name = "bincode"
+version = "1.3.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b1f45e9417d87227c7a56d22e471c6206462cba514c7590c09aff4cf6d1ddcad"
+dependencies = [
+ "serde",
+]
+
 [[package]]
 name = "bindgen"
 version = "0.62.0"
@@ -285,6 +318,21 @@ dependencies = [
  "xattr",
 ]
 
+[[package]]
+name = "bit-set"
+version = "0.5.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0700ddab506f33b20a03b13996eccd309a48e5ff77d0d95926aa0210fb4e95f1"
+dependencies = [
+ "bit-vec",
+]
+
+[[package]]
+name = "bit-vec"
+version = "0.6.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "349f9b6a179ed607305526ca489b34ad0a41aed5f7980fa90eb03160b69598fb"
+
 [[package]]
 name = "bitflags"
 version = "1.3.2"
@@ -389,6 +437,16 @@ dependencies = [
  "thiserror",
 ]
 
+[[package]]
+name = "caseless"
+version = "0.2.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "808dab3318747be122cb31d36de18d4d1c81277a76f8332a02b81a3d73463d7f"
+dependencies = [
+ "regex",
+ "unicode-normalization",
+]
+
 [[package]]
 name = "cbindgen"
 version = "0.24.3"
@@ -482,37 +540,44 @@ dependencies = [
  "bitflags 1.3.2",
  "clap_lex 0.2.4",
  "indexmap 1.9.1",
- "strsim",
+ "strsim 0.10.0",
  "termcolor",
  "textwrap",
 ]
 
 [[package]]
 name = "clap"
-version = "4.0.10"
+version = "4.4.3"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "3b1a0a4208c6c483b952ad35c6eed505fc13b46f08f631b81e828084a9318d74"
+checksum = "84ed82781cea27b43c9b106a979fe450a13a31aab0500595fb3fc06616de08e6"
 dependencies = [
- "atty",
- "bitflags 1.3.2",
+ "clap_builder",
  "clap_derive",
- "clap_lex 0.3.0",
- "once_cell",
- "strsim",
- "termcolor",
+]
+
+[[package]]
+name = "clap_builder"
+version = "4.4.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "2bb9faaa7c2ef94b2743a21f5a29e6f0010dff4caa69ac8e9d6cf8b6fa74da08"
+dependencies = [
+ "anstream",
+ "anstyle",
+ "clap_lex 0.5.1",
+ "strsim 0.10.0",
+ "terminal_size",
 ]
 
 [[package]]
 name = "clap_derive"
-version = "4.0.10"
+version = "4.4.2"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "db342ce9fda24fb191e2ed4e102055a4d381c1086a06630174cd8da8d5d917ce"
+checksum = "0862016ff20d69b84ef8247369fabf5c008a7417002411897d40ee1f4532b873"
 dependencies = [
  "heck",
- "proc-macro-error",
  "proc-macro2",
  "quote",
- "syn 1.0.102",
+ "syn 2.0.48",
 ]
 
 [[package]]
@@ -526,12 +591,9 @@ dependencies = [
 
 [[package]]
 name = "clap_lex"
-version = "0.3.0"
+version = "0.5.1"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "0d4198f73e42b4936b35b5bb248d81d2b595ecb170da0bac7655c54eedfa8da8"
-dependencies = [
- "os_str_bytes",
-]
+checksum = "cd7cc57abe963c6d3b9d8be5b06ba7c8957a930305ca90304f24ef040aa6f961"
 
 [[package]]
 name = "cmake"
@@ -595,6 +657,27 @@ dependencies = [
  "memchr",
 ]
 
+[[package]]
+name = "comrak"
+version = "0.26.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "395ab67843c57df5a4ee29d610740828dbc928cc64ecf0f2a1d5cd0e98e107a9"
+dependencies = [
+ "caseless",
+ "clap 4.4.3",
+ "derive_builder",
+ "entities",
+ "memchr",
+ "once_cell",
+ "regex",
+ "shell-words",
+ "slug",
+ "syntect",
+ "typed-arena",
+ "unicode_categories",
+ "xdg",
+]
+
 [[package]]
 name = "concolor"
 version = "0.0.11"
@@ -740,6 +823,29 @@ dependencies = [
  "typenum",
 ]
 
+[[package]]
+name = "cssparser"
+version = "0.31.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "5b3df4f93e5fbbe73ec01ec8d3f68bba73107993a5b1e7519273c32db9b0d5be"
+dependencies = [
+ "cssparser-macros",
+ "dtoa-short",
+ "itoa",
+ "phf 0.11.2",
+ "smallvec",
+]
+
+[[package]]
+name = "cssparser-macros"
+version = "0.6.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "13b588ba4ac1a99f7f2964d24b3d896ddc6bf847ee3855dbd4366f058cfcd331"
+dependencies = [
+ "quote",
+ "syn 2.0.48",
+]
+
 [[package]]
 name = "cstr"
 version = "0.2.11"
@@ -806,9 +912,9 @@ dependencies = [
 
 [[package]]
 name = "darling"
-version = "0.20.3"
+version = "0.20.10"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "0209d94da627ab5605dcccf08bb18afa5009cfbef48d8a8b7d7bdbc79be25c5e"
+checksum = "6f63b86c8a8826a49b8c21f08a2d07338eec8d900540f8630dc76284be802989"
 dependencies = [
  "darling_core",
  "darling_macro",
@@ -816,23 +922,23 @@ dependencies = [
 
 [[package]]
 name = "darling_core"
-version = "0.20.3"
+version = "0.20.10"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "177e3443818124b357d8e76f53be906d60937f0d3a90773a664fa63fa253e621"
+checksum = "95133861a8032aaea082871032f5815eb9e98cef03fa916ab4500513994df9e5"
 dependencies = [
  "fnv",
  "ident_case",
  "proc-macro2",
  "quote",
- "strsim",
+ "strsim 0.11.1",
  "syn 2.0.48",
 ]
 
 [[package]]
 name = "darling_macro"
-version = "0.20.3"
+version = "0.20.10"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "836a9bbc7ad63342d6d6e7b815ccab164bc77a2d95d84bc3117a8c0d5c98e2d5"
+checksum = "d336a2a514f6ccccaa3e09b02d41d35330c07ddf03a62165fcec10bb561c7806"
 dependencies = [
  "darling_core",
  "quote",
@@ -861,6 +967,37 @@ dependencies = [
  "syn 1.0.102",
 ]
 
+[[package]]
+name = "derive_builder"
+version = "0.20.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0350b5cb0331628a5916d6c5c0b72e97393b8b6b03b47a9284f4e7f5a405ffd7"
+dependencies = [
+ "derive_builder_macro",
+]
+
+[[package]]
+name = "derive_builder_core"
+version = "0.20.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d48cda787f839151732d396ac69e3473923d54312c070ee21e9effcaa8ca0b1d"
+dependencies = [
+ "darling",
+ "proc-macro2",
+ "quote",
+ "syn 2.0.48",
+]
+
+[[package]]
+name = "derive_builder_macro"
+version = "0.20.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "206868b8242f27cecce124c19fd88157fbd0dd334df2587f36417bafbc85097b"
+dependencies = [
+ "derive_builder_core",
+ "syn 2.0.48",
+]
+
 [[package]]
 name = "derive_more"
 version = "0.99.17"
@@ -874,6 +1011,12 @@ dependencies = [
  "syn 1.0.102",
 ]
 
+[[package]]
+name = "deunicode"
+version = "1.6.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "339544cc9e2c4dc3fc7149fd630c5f22263a4fdf18a98afd0075784968b5cf00"
+
 [[package]]
 name = "diff"
 version = "0.1.13"
@@ -910,18 +1053,21 @@ dependencies = [
  "anyhow",
  "binstall-tar",
  "bytes",
- "clap 4.0.10",
+ "clap 4.4.3",
+ "comrak",
  "flate2",
  "fs-err",
  "futures-core",
  "futures-util",
  "indicatif",
+ "itertools 0.10.5",
  "octocrab",
  "once_cell",
  "parse-display",
  "rayon",
  "reqwest",
  "rstest",
+ "scraper",
  "strum",
  "tokio",
  "tracing",
@@ -930,6 +1076,21 @@ dependencies = [
  "zip",
 ]
 
+[[package]]
+name = "dtoa"
+version = "1.0.9"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "dcbb2bf8e87535c23f7a8a321e364ce21462d0ff10cb6407820e8e96dfff6653"
+
+[[package]]
+name = "dtoa-short"
+version = "0.3.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "cd1511a7b6a56299bd043a9c167a6d2bfb37bf84a6dfceaba651168adfb43c87"
+dependencies = [
+ "dtoa",
+]
+
 [[package]]
 name = "duct"
 version = "0.13.6"
@@ -970,6 +1131,12 @@ dependencies = [
  "syn 1.0.102",
 ]
 
+[[package]]
+name = "ego-tree"
+version = "0.6.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "3a68a4904193147e0a8dec3314640e6db742afd5f6e634f428a6af230d9b3591"
+
 [[package]]
 name = "either"
 version = "1.8.0"
@@ -991,6 +1158,12 @@ dependencies = [
  "cfg-if",
 ]
 
+[[package]]
+name = "entities"
+version = "1.0.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b5320ae4c3782150d900b79807611a59a99fc9a1d61d686faafc24b93fc8d7ca"
+
 [[package]]
 name = "enum-map"
 version = "3.0.0-beta.1"
@@ -1091,6 +1264,16 @@ dependencies = [
  "once_cell",
 ]
 
+[[package]]
+name = "fancy-regex"
+version = "0.11.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b95f7c0680e4142284cf8b22c14a476e87d61b004a3a0861872b32ef7ead40a2"
+dependencies = [
+ "bit-set",
+ "regex",
+]
+
 [[package]]
 name = "fastrand"
 version = "1.8.0"
@@ -1154,6 +1337,16 @@ dependencies = [
  "tokio",
 ]
 
+[[package]]
+name = "futf"
+version = "0.1.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "df420e2e84819663797d1ec6544b13c5be84629e7bb00dc960d6917db2987843"
+dependencies = [
+ "mac",
+ "new_debug_unreachable",
+]
+
 [[package]]
 name = "futures"
 version = "0.3.28"
@@ -1262,6 +1455,15 @@ dependencies = [
  "slab",
 ]
 
+[[package]]
+name = "fxhash"
+version = "0.2.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c31b6d751ae2c7f11320402d34e41349dd1016f8d5d45e48c4312bc8625af50c"
+dependencies = [
+ "byteorder",
+]
+
 [[package]]
 name = "generic-array"
 version = "0.14.6"
@@ -1272,6 +1474,15 @@ dependencies = [
  "version_check",
 ]
 
+[[package]]
+name = "getopts"
+version = "0.2.21"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "14dbbfd5c71d70241ecf9e6f13737f7b5ce823821063188d7e46c41d371eebd5"
+dependencies = [
+ "unicode-width",
+]
+
 [[package]]
 name = "getrandom"
 version = "0.2.7"
@@ -1392,6 +1603,20 @@ dependencies = [
  "digest",
 ]
 
+[[package]]
+name = "html5ever"
+version = "0.27.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c13771afe0e6e846f1e67d038d4cb29998a6779f93c809212e4e9c32efd244d4"
+dependencies = [
+ "log",
+ "mac",
+ "markup5ever",
+ "proc-macro2",
+ "quote",
+ "syn 2.0.48",
+]
+
 [[package]]
 name = "http"
 version = "0.2.8"
@@ -1744,11 +1969,20 @@ version = "0.6.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "d7b603516767d1ab23d0de09d023e62966c3322f7148297c35cf3d97aa8b37fa"
 dependencies = [
- "clap 4.0.10",
+ "clap 4.4.3",
  "termcolor",
  "threadpool",
 ]
 
+[[package]]
+name = "line-wrap"
+version = "0.1.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f30344350a2a51da54c1d53be93fade8a237e545dbcc4bdbe635413f2117cab9"
+dependencies = [
+ "safemem",
+]
+
 [[package]]
 name = "link-cplusplus"
 version = "1.0.7"
@@ -1758,6 +1992,12 @@ dependencies = [
  "cc",
 ]
 
+[[package]]
+name = "linked-hash-map"
+version = "0.5.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0717cef1bc8b636c6e1c1bbdefc09e6322da8a9321966e8928ef80d20f7f770f"
+
 [[package]]
 name = "linux-raw-sys"
 version = "0.1.4"
@@ -1789,6 +2029,26 @@ dependencies = [
  "cfg-if",
 ]
 
+[[package]]
+name = "mac"
+version = "0.1.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c41e0c4fef86961ac6d6f8a82609f55f31b05e4fce149ac5710e439df7619ba4"
+
+[[package]]
+name = "markup5ever"
+version = "0.12.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "16ce3abbeba692c8b8441d036ef91aea6df8da2c6b6e21c7e14d3c18e526be45"
+dependencies = [
+ "log",
+ "phf 0.11.2",
+ "phf_codegen 0.11.2",
+ "string_cache",
+ "string_cache_codegen",
+ "tendril",
+]
+
 [[package]]
 name = "matchers"
 version = "0.1.0"
@@ -1907,6 +2167,12 @@ dependencies = [
  "rand",
 ]
 
+[[package]]
+name = "new_debug_unreachable"
+version = "1.0.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "650eef8c711430f1a879fdd01d4745a7deea475becfb90269c06775983bbf086"
+
 [[package]]
 name = "noisy_float"
 version = "0.2.0"
@@ -2051,6 +2317,28 @@ version = "1.19.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "3fdb12b2476b595f9358c5161aa467c2438859caa136dec86c26fdd2efe17b92"
 
+[[package]]
+name = "onig"
+version = "6.4.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8c4b31c8722ad9171c6d77d3557db078cab2bd50afcc9d09c8b315c59df8ca4f"
+dependencies = [
+ "bitflags 1.3.2",
+ "libc",
+ "once_cell",
+ "onig_sys",
+]
+
+[[package]]
+name = "onig_sys"
+version = "69.8.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7b829e3d7e9cc74c7e315ee8edb185bf4190da5acde74afd7fc59c35b1f086e7"
+dependencies = [
+ "cc",
+ "pkg-config",
+]
+
 [[package]]
 name = "opaque-debug"
 version = "0.3.0"
@@ -2238,6 +2526,96 @@ version = "2.1.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "d4fd5641d01c8f18a23da7b6fe29298ff4b55afcccdf78973b24cf3175fee32e"
 
+[[package]]
+name = "phf"
+version = "0.10.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "fabbf1ead8a5bcbc20f5f8b939ee3f5b0f6f281b6ad3468b84656b658b455259"
+dependencies = [
+ "phf_shared 0.10.0",
+]
+
+[[package]]
+name = "phf"
+version = "0.11.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ade2d8b8f33c7333b51bcf0428d37e217e9f32192ae4772156f65063b8ce03dc"
+dependencies = [
+ "phf_macros",
+ "phf_shared 0.11.2",
+]
+
+[[package]]
+name = "phf_codegen"
+version = "0.10.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "4fb1c3a8bc4dd4e5cfce29b44ffc14bedd2ee294559a294e2a4d4c9e9a6a13cd"
+dependencies = [
+ "phf_generator 0.10.0",
+ "phf_shared 0.10.0",
+]
+
+[[package]]
+name = "phf_codegen"
+version = "0.11.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e8d39688d359e6b34654d328e262234662d16cc0f60ec8dcbe5e718709342a5a"
+dependencies = [
+ "phf_generator 0.11.2",
+ "phf_shared 0.11.2",
+]
+
+[[package]]
+name = "phf_generator"
+version = "0.10.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "5d5285893bb5eb82e6aaf5d59ee909a06a16737a8970984dd7746ba9283498d6"
+dependencies = [
+ "phf_shared 0.10.0",
+ "rand",
+]
+
+[[package]]
+name = "phf_generator"
+version = "0.11.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "48e4cc64c2ad9ebe670cb8fd69dd50ae301650392e81c05f9bfcb2d5bdbc24b0"
+dependencies = [
+ "phf_shared 0.11.2",
+ "rand",
+]
+
+[[package]]
+name = "phf_macros"
+version = "0.11.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "3444646e286606587e49f3bcf1679b8cef1dc2c5ecc29ddacaffc305180d464b"
+dependencies = [
+ "phf_generator 0.11.2",
+ "phf_shared 0.11.2",
+ "proc-macro2",
+ "quote",
+ "syn 2.0.48",
+]
+
+[[package]]
+name = "phf_shared"
+version = "0.10.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b6796ad771acdc0123d2a88dc428b5e38ef24456743ddb1744ed628f9815c096"
+dependencies = [
+ "siphasher",
+]
+
+[[package]]
+name = "phf_shared"
+version = "0.11.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "90fcb95eef784c2ac79119d1dd819e162b5da872ce6f3c3abe1e8ca1c082f72b"
+dependencies = [
+ "siphasher",
+]
+
 [[package]]
 name = "pin-project"
 version = "1.0.12"
@@ -2276,6 +2654,20 @@ version = "0.3.25"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "1df8c4ec4b0627e53bdf214615ad287367e482558cf84b109250b37464dc03ae"
 
+[[package]]
+name = "plist"
+version = "1.5.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9a4a0cfc5fb21a09dc6af4bf834cf10d4a32fccd9e2ea468c4b1751a097487aa"
+dependencies = [
+ "base64 0.21.0",
+ "indexmap 1.9.1",
+ "line-wrap",
+ "quick-xml",
+ "serde",
+ "time",
+]
+
 [[package]]
 name = "portable-atomic"
 version = "0.3.19"
@@ -2294,6 +2686,12 @@ version = "0.2.16"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "eb9f9e6e233e5c4a35559a617bf40a4ec447db2e84c20b55a6f83167b7e57872"
 
+[[package]]
+name = "precomputed-hash"
+version = "0.1.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "925383efa346730478fb4838dbe9137d2a47675ad789c546d150a6e1dd4ab31c"
+
 [[package]]
 name = "predicates"
 version = "2.1.5"
@@ -2474,6 +2872,15 @@ dependencies = [
  "syn 2.0.48",
 ]
 
+[[package]]
+name = "quick-xml"
+version = "0.30.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "eff6510e86862b57b210fd8cbe8ed3f0d7d600b9c2863cd4549a2e033c66e956"
+dependencies = [
+ "memchr",
+]
+
 [[package]]
 name = "quote"
 version = "1.0.35"
@@ -2825,6 +3232,12 @@ version = "1.0.11"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "4501abdff3ae82a1c1b477a17252eb69cee9e66eb915c1abaa4f44d873df9f09"
 
+[[package]]
+name = "safemem"
+version = "0.3.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ef703b7cb59335eae2eb93ceb664c0eb7ea6bf567079d843e09420219668e072"
+
 [[package]]
 name = "same-file"
 version = "1.0.6"
@@ -2840,6 +3253,22 @@ version = "1.1.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "d29ab0c6d3fc0ee92fe66e2d99f700eab17a8d57d1c1d3b748380fb20baa78cd"
 
+[[package]]
+name = "scraper"
+version = "0.19.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "761fb705fdf625482d2ed91d3f0559dcfeab2798fe2771c69560a774865d0802"
+dependencies = [
+ "ahash",
+ "cssparser",
+ "ego-tree",
+ "getopts",
+ "html5ever",
+ "once_cell",
+ "selectors",
+ "tendril",
+]
+
 [[package]]
 name = "scratch"
 version = "1.0.3"
@@ -2865,6 +3294,25 @@ dependencies = [
  "zeroize",
 ]
 
+[[package]]
+name = "selectors"
+version = "0.25.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "4eb30575f3638fc8f6815f448d50cb1a2e255b0897985c8c59f4d37b72a07b06"
+dependencies = [
+ "bitflags 2.5.0",
+ "cssparser",
+ "derive_more",
+ "fxhash",
+ "log",
+ "new_debug_unreachable",
+ "phf 0.10.1",
+ "phf_codegen 0.10.0",
+ "precomputed-hash",
+ "servo_arc",
+ "smallvec",
+]
+
 [[package]]
 name = "semver"
 version = "1.0.14"
@@ -2965,6 +3413,15 @@ dependencies = [
  "syn 2.0.48",
 ]
 
+[[package]]
+name = "servo_arc"
+version = "0.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d036d71a959e00c77a63538b90a6c2390969f9772b096ea837205c6bd0491a44"
+dependencies = [
+ "stable_deref_trait",
+]
+
 [[package]]
 name = "sha1"
 version = "0.10.5"
@@ -3006,6 +3463,12 @@ dependencies = [
  "winapi",
 ]
 
+[[package]]
+name = "shell-words"
+version = "1.1.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "24188a676b6ae68c3b2cb3a01be17fbf7240ce009799bb56d5b1409051e78fde"
+
 [[package]]
 name = "shlex"
 version = "1.1.0"
@@ -3024,6 +3487,12 @@ dependencies = [
  "time",
 ]
 
+[[package]]
+name = "siphasher"
+version = "0.3.11"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "38b58827f4464d87d377d175e90bf58eb00fd8716ff0a62f80356b5e61555d0d"
+
 [[package]]
 name = "slab"
 version = "0.4.7"
@@ -3033,6 +3502,16 @@ dependencies = [
  "autocfg",
 ]
 
+[[package]]
+name = "slug"
+version = "0.1.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "3bd94acec9c8da640005f8e135a39fc0372e74535e6b368b7a04b875f784c8c4"
+dependencies = [
+ "deunicode",
+ "wasm-bindgen",
+]
+
 [[package]]
 name = "smallvec"
 version = "1.13.1"
@@ -3078,18 +3557,56 @@ version = "0.5.2"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "6e63cff320ae2c57904679ba7cb63280a3dc4613885beafb148ee7bf9aa9042d"
 
+[[package]]
+name = "stable_deref_trait"
+version = "1.2.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "a8f112729512f8e442d81f95a8a7ddf2b7c6b8a1a6f509a95864142b30cab2d3"
+
 [[package]]
 name = "static_assertions"
 version = "1.1.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "a2eb9349b6444b326872e140eb1cf5e7c522154d69e7a0ffb0fb81c06b37543f"
 
+[[package]]
+name = "string_cache"
+version = "0.8.7"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f91138e76242f575eb1d3b38b4f1362f10d3a43f47d182a5b359af488a02293b"
+dependencies = [
+ "new_debug_unreachable",
+ "once_cell",
+ "parking_lot",
+ "phf_shared 0.10.0",
+ "precomputed-hash",
+ "serde",
+]
+
+[[package]]
+name = "string_cache_codegen"
+version = "0.5.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "6bb30289b722be4ff74a408c3cc27edeaad656e06cb1fe8fa9231fa59c728988"
+dependencies = [
+ "phf_generator 0.10.0",
+ "phf_shared 0.10.0",
+ "proc-macro2",
+ "quote",
+]
+
 [[package]]
 name = "strsim"
 version = "0.10.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "73473c0e59e6d5812c5dfe2a064a6444949f089e20eec9a2e5506596494e4623"
 
+[[package]]
+name = "strsim"
+version = "0.11.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7da8b5736845d9f2fcb837ea5d9e2628564b3b043a70948a3f0b778838c5fb4f"
+
 [[package]]
 name = "structmeta"
 version = "0.2.0"
@@ -3163,6 +3680,29 @@ dependencies = [
  "unicode-ident",
 ]
 
+[[package]]
+name = "syntect"
+version = "5.2.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "874dcfa363995604333cf947ae9f751ca3af4522c60886774c4963943b4746b1"
+dependencies = [
+ "bincode",
+ "bitflags 1.3.2",
+ "fancy-regex",
+ "flate2",
+ "fnv",
+ "once_cell",
+ "onig",
+ "plist",
+ "regex-syntax 0.8.1",
+ "serde",
+ "serde_derive",
+ "serde_json",
+ "thiserror",
+ "walkdir",
+ "yaml-rust",
+]
+
 [[package]]
 name = "tar"
 version = "0.4.38"
@@ -3194,6 +3734,17 @@ dependencies = [
  "windows-sys 0.48.0",
 ]
 
+[[package]]
+name = "tendril"
+version = "0.4.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d24a120c5fc464a3458240ee02c299ebcb9d67b5249c8848b09d639dca8d7bb0"
+dependencies = [
+ "futf",
+ "mac",
+ "utf-8",
+]
+
 [[package]]
 name = "termcolor"
 version = "1.1.3"
@@ -3203,6 +3754,16 @@ dependencies = [
  "winapi-util",
 ]
 
+[[package]]
+name = "terminal_size"
+version = "0.2.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8e6bf6f19e9f8ed8d4048dc22981458ebcf406d67e94cd422e5ecd73d63b3237"
+dependencies = [
+ "rustix 0.37.19",
+ "windows-sys 0.48.0",
+]
+
 [[package]]
 name = "termtree"
 version = "0.4.0"
@@ -3490,6 +4051,12 @@ version = "0.2.4"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "3528ecfd12c466c6f163363caf2d02a71161dd5e1cc6ae7b34207ea2d42d81ed"
 
+[[package]]
+name = "typed-arena"
+version = "2.0.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "6af6ae20167a9ece4bcb41af5b80f8a1f1df981f6391189ce00fd257af04126a"
+
 [[package]]
 name = "typenum"
 version = "1.15.0"
@@ -3553,6 +4120,12 @@ version = "0.2.4"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "f962df74c8c05a667b5ee8bcf162993134c104e96440b663c8daa176dc772d8c"
 
+[[package]]
+name = "unicode_categories"
+version = "0.1.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "39ec24b3121d976906ece63c9daad25b85969647682eee313cb5779fdd69e14e"
+
 [[package]]
 name = "unindent"
 version = "0.2.3"
@@ -3592,6 +4165,12 @@ dependencies = [
  "serde",
 ]
 
+[[package]]
+name = "utf-8"
+version = "0.7.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "09cc8ee72d2a9becf2f2febe0205bbed8fc6615b7cb429ad062dc7b7ddd036a9"
+
 [[package]]
 name = "utf8parse"
 version = "0.2.1"
@@ -3707,7 +4286,7 @@ dependencies = [
  "assert_cmd",
  "camino",
  "chrono",
- "clap 4.0.10",
+ "clap 4.4.3",
  "colorchoice",
  "const_format",
  "cstr",
@@ -4190,23 +4769,58 @@ dependencies = [
  "libc",
 ]
 
+[[package]]
+name = "xdg"
+version = "2.5.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "213b7324336b53d2414b2db8537e56544d981803139155afa84f76eeebb7a546"
+
 [[package]]
 name = "xtask"
 version = "0.0.0"
 dependencies = [
  "cbindgen",
- "clap 4.0.10",
+ "clap 4.4.3",
  "color-eyre",
  "eyre",
  "fs-err",
 ]
 
+[[package]]
+name = "yaml-rust"
+version = "0.4.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "56c1936c4cc7a1c9ab21a1ebb602eb942ba868cbd44a99cb7cdc5892335e1c85"
+dependencies = [
+ "linked-hash-map",
+]
+
 [[package]]
 name = "yansi"
 version = "0.5.1"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "09041cd90cf85f7f8b2df60c646f853b7f535ce68f85244eb6731cf89fa498ec"
 
+[[package]]
+name = "zerocopy"
+version = "0.7.35"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1b9b4fd18abc82b8136838da5d50bae7bdea537c574d8dc1a34ed098d6c166f0"
+dependencies = [
+ "zerocopy-derive",
+]
+
+[[package]]
+name = "zerocopy-derive"
+version = "0.7.35"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "fa4f8080344d4671fb4e831a13ad1e68092748387dfc4f55e356242fae12ce3e"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.48",
+]
+
 [[package]]
 name = "zeroize"
 version = "1.5.7"
diff --git a/Cargo.toml b/Cargo.toml
index b467c583e..2ada5cbb5 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -19,6 +19,7 @@ chrono = { version = "0.4.26", default-features = false }
 clap = "4.0.10"
 color-eyre = "0.6.2"
 colorchoice = "1.0.0"
+comrak = "0.26.0"
 const_format = "0.2.32"
 cstr = "0.2.11" # https://github.com/dtolnay/syn/issues/1502
 derive-getters = "0.2.0"
@@ -67,6 +68,7 @@ regex = "1.10.0"
 reqwest = { version = "0.11.13", default-features = false }
 rstest = "0.15.0"
 rstest_reuse = "0.6.0"
+scraper = "0.19.1"
 serde = "1.0.203"
 serde_json = "1.0.85"
 serde_with = "3.3.0"
diff --git a/crates/downloader/Cargo.toml b/crates/downloader/Cargo.toml
index 20d90e087..c60afd3b6 100644
--- a/crates/downloader/Cargo.toml
+++ b/crates/downloader/Cargo.toml
@@ -11,16 +11,19 @@ anyhow.workspace = true
 binstall-tar.workspace = true
 bytes.workspace = true
 clap = { workspace = true, features = ["derive"] }
+comrak.workspace = true
 flate2.workspace = true
 fs-err = { workspace = true, features = ["tokio"] }
 futures-core.workspace = true
 futures-util.workspace = true
 indicatif.workspace = true
+itertools.workspace = true
 octocrab = { workspace = true, default-features = false, features = ["rustls-tls", "stream"] }
 once_cell.workspace = true
 parse-display.workspace = true
 rayon.workspace = true
 reqwest = { workspace = true, default-features = false, features = ["rustls-tls", "stream"] }
+scraper.workspace = true
 strum = { workspace = true, features = ["derive"] }
 tokio = { workspace = true, features = ["macros", "rt", "rt-multi-thread", "sync"] }
 tracing.workspace = true
diff --git a/crates/downloader/src/main.rs b/crates/downloader/src/main.rs
index 03a426478..0432ea0a9 100644
--- a/crates/downloader/src/main.rs
+++ b/crates/downloader/src/main.rs
@@ -1,6 +1,6 @@
 use std::{
     borrow::Cow,
-    collections::HashSet,
+    collections::{BTreeSet, HashSet},
     env,
     future::Future,
     io::{self, Cursor, Read},
@@ -9,13 +9,14 @@ use std::{
     time::Duration,
 };
 
-use anyhow::{bail, Context as _};
+use anyhow::{anyhow, bail, Context as _};
 use bytes::Bytes;
 use clap::{Parser as _, ValueEnum};
 use flate2::read::GzDecoder;
 use futures_core::Stream;
-use futures_util::{future::OptionFuture, StreamExt as _, TryStreamExt as _};
+use futures_util::{stream::FuturesOrdered, StreamExt as _, TryStreamExt as _};
 use indicatif::{MultiProgress, ProgressBar, ProgressStyle};
+use itertools::Itertools as _;
 use octocrab::{
     models::{
         repos::{Asset, Release},
@@ -39,6 +40,7 @@ const DEFAULT_OUTPUT: &str = if cfg!(windows) {
 
 const LIB_NAME: &str = "voicevox_core";
 const DEFAULT_CORE_REPO: &str = "VOICEVOX/voicevox_core";
+const DEFAULT_ONNXRUNTIME_BUILDER_REPO: &str = "VOICEVOX/onnxruntime-builder";
 const DEFAULT_ADDITIONAL_LIBRARIES_REPO: &str = "VOICEVOX/voicevox_additional_libraries";
 
 static OPEN_JTALK_DIC_URL: Lazy<Url> = Lazy::new(|| {
@@ -74,13 +76,17 @@ struct Args {
     #[arg(short, long, value_name("GIT_TAG_OR_LATEST"), default_value("latest"))]
     version: String,
 
+    /// ダウンロードするONNX Runtimeのバージョンの指定
+    #[arg(long, value_name("GIT_TAG_OR_LATEST"), default_value("latest"))]
+    onnxruntime_version: String,
+
     /// 追加でダウンロードするライブラリのバージョン
     #[arg(long, value_name("GIT_TAG_OR_LATEST"), default_value("latest"))]
     additional_libraries_version: String,
 
     /// ダウンロードするデバイスを指定する(cudaはlinuxのみ)
-    #[arg(value_enum, long, default_value(<&str>::from(Device::default())))]
-    device: Device,
+    #[arg(value_enum, long, num_args(1..), default_value(<&str>::from(Device::default())))]
+    devices: Vec<Device>,
 
     /// ダウンロードするcpuのアーキテクチャを指定する
     #[arg(value_enum, long, default_value(CpuArch::default_opt().map(<&str>::from)))]
@@ -93,6 +99,13 @@ struct Args {
     #[arg(long, value_name("REPOSITORY"), default_value(DEFAULT_CORE_REPO))]
     core_repo: RepoName,
 
+    #[arg(
+        long,
+        value_name("REPOSITORY"),
+        default_value(DEFAULT_ONNXRUNTIME_BUILDER_REPO)
+    )]
+    onnxruntime_builder_repo: RepoName,
+
     #[arg(
         long,
         value_name("REPOSITORY"),
@@ -105,11 +118,14 @@ struct Args {
 enum DownloadTarget {
     Core,
     Models,
+    Onnxruntime,
     AdditionalLibraries,
     Dict,
 }
 
-#[derive(Default, ValueEnum, Display, IntoStaticStr, Clone, Copy, PartialEq)]
+#[derive(
+    Default, ValueEnum, Display, IntoStaticStr, Clone, Copy, PartialEq, Eq, PartialOrd, Ord,
+)]
 #[strum(serialize_all = "kebab-case")]
 enum Device {
     #[default]
@@ -156,7 +172,7 @@ impl Os {
 }
 
 #[derive(parse_display::FromStr, parse_display::Display, Clone)]
-#[from_str(regex = "(?<owner>[a-zA-Z0-9_]+)/(?<repo>[a-zA-Z0-9_]+)")]
+#[from_str(regex = "(?<owner>[a-zA-Z0-9_-]+)/(?<repo>[a-zA-Z0-9_-]+)")]
 #[display("{owner}/{repo}")]
 struct RepoName {
     owner: String,
@@ -173,13 +189,16 @@ async fn main() -> anyhow::Result<()> {
         min,
         output,
         version,
+        onnxruntime_version,
         additional_libraries_version,
-        device,
+        devices,
         cpu_arch,
         os,
         core_repo,
+        onnxruntime_builder_repo,
         additional_libraries_repo,
     } = Args::parse();
+    let devices = devices.into_iter().collect::<BTreeSet<_>>();
 
     let targets: HashSet<_> = if !only.is_empty() {
         assert!(exclude.is_empty() && !min);
@@ -224,9 +243,9 @@ async fn main() -> anyhow::Result<()> {
                  `additional-libraries-version`はダウンロード対象から除外されています",
             );
         }
-        if device == Device::Cpu {
+        if devices == [Device::Cpu].into() {
             warn!(
-                "`--device`が指定されていない、もしくは`--device=cpu`が指定されていますが、\
+                "`--devices`が指定されていない、もしくは`--devices=cpu`が指定されていますが、\
                  `additional-libraries-version`はダウンロード対象から除外されています",
             );
         }
@@ -234,44 +253,67 @@ async fn main() -> anyhow::Result<()> {
 
     let octocrab = &octocrab()?;
 
-    let core = find_gh_asset(octocrab, &core_repo, &version, |tag| {
-        let device = match (os, device) {
-            (Os::Linux, Device::Cuda) => "gpu",
-            (_, device) => device.into(),
-        };
-        format!("{LIB_NAME}-{os}-{cpu_arch}-{device}-{tag}.zip")
+    let core = find_gh_asset(octocrab, &core_repo, &version, |tag, _| {
+        Ok(format!("{LIB_NAME}-{os}-{cpu_arch}-{tag}.zip"))
     })
     .await?;
 
-    let model = find_gh_asset(octocrab, &core_repo, &version, |tag| {
-        format!("model-{tag}.zip")
+    let model = find_gh_asset(octocrab, &core_repo, &version, |tag, _| {
+        Ok(format!("model-{tag}.zip"))
     })
     .await?;
 
-    let additional_libraries = OptionFuture::from((device != Device::Cpu).then(|| {
-        find_gh_asset(
-            octocrab,
-            &additional_libraries_repo,
-            &additional_libraries_version,
-            |_| {
-                let device = match device {
-                    Device::Cpu => unreachable!(),
-                    Device::Cuda => "CUDA",
-                    Device::Directml => "DirectML",
-                };
-                format!("{device}-{os}-{cpu_arch}.zip")
-            },
-        )
-    }))
-    .await
-    .transpose()?;
+    let onnxruntime = find_gh_asset(
+        octocrab,
+        &onnxruntime_builder_repo,
+        &onnxruntime_version,
+        |_, body| {
+            let body = body.with_context(|| "リリースノートがありません")?;
+            find_onnxruntime(body, os, cpu_arch, &devices)
+        },
+    )
+    .await?;
+
+    let additional_libraries = devices
+        .iter()
+        .filter(|&&device| device != Device::Cpu)
+        .map(|&device| {
+            find_gh_asset(
+                octocrab,
+                &additional_libraries_repo,
+                &additional_libraries_version,
+                move |_, _| {
+                    Ok({
+                        let device = match device {
+                            Device::Cpu => unreachable!(),
+                            Device::Cuda => "CUDA",
+                            Device::Directml => "DirectML",
+                        };
+                        format!("{device}-{os}-{cpu_arch}.zip")
+                    })
+                },
+            )
+        })
+        .collect::<FuturesOrdered<_>>()
+        .try_collect::<Vec<_>>()
+        .await?;
 
     info!("対象OS: {os}");
     info!("対象CPUアーキテクチャ: {cpu_arch}");
-    info!("ダウンロードデバイスタイプ: {device}");
+    info!(
+        "ダウンロードデバイスタイプ: {}",
+        devices.iter().format(", "),
+    );
     info!("ダウンロード{LIB_NAME}バージョン: {}", core.tag);
-    if let Some(GhAsset { tag, .. }) = &additional_libraries {
-        info!("ダウンロード追加ライブラリバージョン: {tag}");
+    info!("ダウンロードONNX Runtimeバージョン: {}", onnxruntime.tag);
+    if !additional_libraries.is_empty() {
+        info!(
+            "ダウンロード追加ライブラリバージョン: {}",
+            additional_libraries
+                .iter()
+                .map(|GhAsset { tag, .. }| tag)
+                .format(", "),
+        );
     }
 
     let progresses = MultiProgress::new();
@@ -294,8 +336,16 @@ async fn main() -> anyhow::Result<()> {
             &progresses,
         )?);
     }
+    if targets.contains(&DownloadTarget::Onnxruntime) {
+        tasks.spawn(download_and_extract_from_gh(
+            onnxruntime,
+            Stripping::FirstDir,
+            &output.join("onnxruntime"),
+            &progresses,
+        )?);
+    }
     if targets.contains(&DownloadTarget::AdditionalLibraries) {
-        if let Some(additional_libraries) = additional_libraries {
+        for additional_libraries in additional_libraries {
             tasks.spawn(download_and_extract_from_gh(
                 additional_libraries,
                 Stripping::FirstDir,
@@ -348,11 +398,15 @@ async fn find_gh_asset(
     octocrab: &Arc<Octocrab>,
     repo: &RepoName,
     git_tag_or_latest: &str,
-    asset_name: impl FnOnce(&str) -> String,
+    asset_name: impl FnOnce(
+        &str,         // タグ名
+        Option<&str>, // リリースノートの内容
+    ) -> anyhow::Result<String>,
 ) -> anyhow::Result<GhAsset> {
     let Release {
         html_url,
         tag_name,
+        body,
         assets,
         ..
     } = {
@@ -364,7 +418,11 @@ async fn find_gh_asset(
         }?
     };
 
-    let asset_name = asset_name(&tag_name);
+    let asset_name = asset_name(&tag_name, body.as_deref()).with_context(|| {
+        format!(
+            "`{repo}`の`{tag_name}`の中から条件に合致するビルドが見つけることができませんでした",
+        )
+    })?;
     let Asset { id, name, size, .. } = assets
         .into_iter()
         .find(|Asset { name, .. }| *name == asset_name)
@@ -380,6 +438,82 @@ async fn find_gh_asset(
     })
 }
 
+/// Asset-name resolver meant for `find_gh_asset`: reads the spec table in the release notes and returns the matching asset name.
+///
+/// When several candidates match, picks the first one among those listing the fewest "devices".
+fn find_onnxruntime(
+    body: &str, // the release's "body" (i.e. the contents of the release notes)
+    os: Os,
+    cpu_arch: CpuArch,
+    devices: &BTreeSet<Device>,
+) -> anyhow::Result<String> {
+    macro_rules! selector { // each expansion parses its CSS selector lazily and keeps it in its own `static`
+        ($expr:expr $(,)?) => {{
+            static SELECTOR: Lazy<scraper::Selector> =
+                Lazy::new(|| scraper::Selector::parse($expr).expect("should be valid"));
+            &SELECTOR
+        }};
+    }
+
+    const TARGET: &str = "table\
+        [data-voicevox-onnxruntime-specs-format-version=\"1\"]\
+        [data-voicevox-onnxruntime-specs-type=\"dylibs\"]";
+
+    comrak::parse_document(&Default::default(), body, &Default::default()) // parse the release notes as Markdown
+        .descendants()
+        .flat_map(|node| match &node.data.borrow().value {
+            comrak::nodes::NodeValue::HtmlBlock(comrak::nodes::NodeHtmlBlock {
+                literal, ..
+            }) => Some(scraper::Html::parse_fragment(literal)), // only raw HTML blocks are inspected
+            _ => None,
+        })
+        .collect::<Vec<_>>() // NOTE(review): presumably collected so the parsed fragments outlive the `select` borrows below
+        .iter()
+        .flat_map(|html_block| html_block.select(selector!(TARGET)))
+        .exactly_one() // anything other than exactly one `TARGET` table is turned into an error below
+        .map_err(|err| match err.count() {
+            0 => anyhow!("リリースノートの中に`{TARGET}`が見つかりませんでした"),
+            _ => anyhow!("リリースノートの中に`{TARGET}`が複数ありました"),
+        })?
+        .select(selector!("tbody > tr"))
+        .map(|tr| {
+            tr.select(selector!("td"))
+                .map(|td| td.text().exactly_one().ok())
+                .collect::<Option<Vec<_>>>()
+                .and_then(|text| text.try_into().ok())
+                .with_context(|| format!("リリースノート中の`{TARGET}`をパースできませんでした"))
+        })
+        .collect::<Result<Vec<[_; 4]>, _>>()? // every row must be exactly 4 single-text cells: OS, CPU arch, devices, asset name
+        .into_iter()
+        .filter(|&[spec_os, spec_cpu_arch, spec_devices, _]| {
+            spec_os
+                == match os {
+                    Os::Windows => "Windows",
+                    Os::Linux => "Linux",
+                    Os::Osx => "macOS",
+                }
+                && spec_cpu_arch
+                    == match cpu_arch {
+                        CpuArch::X86 => "x86",
+                        CpuArch::X64 => "x86_64",
+                        CpuArch::Arm64 => "AArch64",
+                    }
+                && devices.iter().all(|device| { // every requested device must appear in the row's `/`-separated list
+                    spec_devices.split('/').any(|spec_device| {
+                        spec_device
+                            == match device {
+                                Device::Cpu => "CPU",
+                                Device::Cuda => "CUDA",
+                                Device::Directml => "DirectML",
+                            }
+                    })
+                })
+        })
+        .min_by_key(|&[.., spec_devices, _]| spec_devices.split('/').count()) // fewest devices wins; `min_by_key` keeps the first on ties
+        .map(|[.., name]| name.to_owned())
+        .with_context(|| "指定されたOS, アーキテクチャ, デバイスを含むものが見つかりませんでした")
+}
+
 fn download_and_extract_from_gh(
     GhAsset {
         octocrab,
diff --git a/crates/voicevox_core/Cargo.toml b/crates/voicevox_core/Cargo.toml
index 527fa7494..c9ed52725 100644
--- a/crates/voicevox_core/Cargo.toml
+++ b/crates/voicevox_core/Cargo.toml
@@ -8,17 +8,12 @@ publish.workspace = true
 features = ["load-onnxruntime", "link-onnxruntime"]
 rustdoc-args = ["--cfg", "docsrs"]
 
+# rustdocを参照
 [features]
 default = []
-
-# ONNX Runtimeのリンク方法を決めるフィーチャ（rustdocを参照）。
 load-onnxruntime = ["voicevox-ort/load-dynamic"]
 link-onnxruntime = []
 
-# GPUを利用可能にするフィーチャ（rustdocを参照）。
-cuda = ["voicevox-ort/cuda"]
-directml = ["voicevox-ort/directml"]
-
 [dependencies]
 anyhow.workspace = true
 async_zip = { workspace = true, features = ["deflate"] }
diff --git a/crates/voicevox_core/src/devices.rs b/crates/voicevox_core/src/devices.rs
index dfe8d7e64..f3027e741 100644
--- a/crates/voicevox_core/src/devices.rs
+++ b/crates/voicevox_core/src/devices.rs
@@ -1,10 +1,76 @@
+use std::{
+    collections::BTreeMap,
+    fmt::{self, Display},
+    ops::Index,
+};
+
+use derive_more::BitAnd;
 use serde::{Deserialize, Serialize};
 
-/// このライブラリで利用可能なデバイスの情報。
+pub(crate) fn test_gpus( // runs `test_gpu` on every item of `gpus` and gathers the outcomes per GPU
+    gpus: impl IntoIterator<Item = GpuSpec>,
+    inference_rt_name: &'static str,
+    devices_supported_by_inference_rt: SupportedDevices,
+    test: impl Fn(GpuSpec) -> anyhow::Result<()>,
+) -> DeviceAvailabilities {
+    DeviceAvailabilities(
+        gpus.into_iter()
+            .map(|gpu| {
+                let availability = test_gpu(
+                    gpu,
+                    inference_rt_name,
+                    devices_supported_by_inference_rt,
+                    &test, // passed by reference so the same closure serves every GPU
+                );
+                (gpu, availability)
+            })
+            .collect(), // into the wrapped `BTreeMap<GpuSpec, DeviceAvailability>`
+    )
+}
+
+fn test_gpu( // classifies one GPU; `test` is only invoked when both support checks pass
+    gpu: GpuSpec,
+    inference_rt_name: &'static str,
+    devices_supported_by_inference_rt: SupportedDevices,
+    test: impl Fn(GpuSpec) -> anyhow::Result<()>,
+) -> DeviceAvailability {
+    if !SupportedDevices::THIS[gpu] { // ruled out by this library's own build-time support table
+        DeviceAvailability::NotSupportedByThisLib
+    } else if !devices_supported_by_inference_rt[gpu] { // ruled out by what the caller reports for the inference runtime
+        DeviceAvailability::NotSupportedByCurrentLoadedInferenceRuntime(inference_rt_name)
+    } else {
+        match test(gpu) { // nominally supported: the outcome of `test` decides
+            Ok(()) => DeviceAvailability::Ok,
+            Err(err) => DeviceAvailability::Err(err),
+        }
+    }
+}
+
+/// 利用可能なデバイスの情報。
 ///
-/// あくまで本ライブラリが対応しているデバイスの情報であることに注意。GPUが使える環境ではなかったと
+/// あくまで本ライブラリもしくはONNX Runtimeが対応しているデバイスの情報であることに注意。GPUが使える環境ではなかったと
 /// しても`cuda`や`dml`は`true`を示しうる。
-#[derive(Debug, Serialize, Deserialize)]
+///
+/// ```
+/// # #[tokio::main]
+/// # async fn main() -> anyhow::Result<()> {
+/// use voicevox_core::{tokio::Onnxruntime, SupportedDevices};
+///
+/// # voicevox_core::blocking::Onnxruntime::load_once()
+/// #     .filename(if cfg!(windows) {
+/// #         // Windows\System32\onnxruntime.dllを回避
+/// #         test_util::ONNXRUNTIME_DYLIB_PATH
+/// #     } else {
+/// #         voicevox_core::blocking::Onnxruntime::LIB_VERSIONED_FILENAME
+/// #     })
+/// #     .exec()?;
+/// #
+/// let onnxruntime = Onnxruntime::get().unwrap();
+/// dbg!(SupportedDevices::THIS & onnxruntime.supported_devices()?);
+/// # Ok(())
+/// # }
+/// ```
+#[derive(Clone, Copy, PartialEq, Eq, Debug, BitAnd, Serialize, Deserialize)]
 pub struct SupportedDevices {
     /// CPUが利用可能。
     ///
@@ -27,7 +93,146 @@ pub struct SupportedDevices {
 }
 
 impl SupportedDevices {
-    pub fn to_json(&self) -> serde_json::Value {
+    /// このライブラリで利用可能なデバイスの情報。
+    ///
+    /// `load-onnxruntime`のフィーチャが有効化されているときはすべて`true`となる。
+    ///
+    #[cfg_attr(feature = "load-onnxruntime", doc = "```")]
+    #[cfg_attr(not(feature = "load-onnxruntime"), doc = "```no_run")]
+    /// # use voicevox_core::SupportedDevices;
+    /// assert!(SupportedDevices::THIS.cuda);
+    /// assert!(SupportedDevices::THIS.dml);
+    /// ```
+    ///
+    /// `link-onnxruntime`のフィーチャが有効化されているときは`cpu`を除き`false`となる。
+    ///
+    #[cfg_attr(feature = "link-onnxruntime", doc = "```")]
+    #[cfg_attr(not(feature = "link-onnxruntime"), doc = "```no_run")]
+    /// # use voicevox_core::SupportedDevices;
+    /// assert!(!SupportedDevices::THIS.cuda);
+    /// assert!(!SupportedDevices::THIS.dml);
+    /// ```
+    pub const THIS: Self = if cfg!(feature = "load-onnxruntime") {
+        Self {
+            cpu: true,
+            cuda: true,
+            dml: true,
+        }
+    } else if cfg!(feature = "link-onnxruntime") {
+        Self {
+            cpu: true,
+            cuda: false,
+            dml: false,
+        }
+    } else {
+        panic!("either `load-onnxruntime` or `link-onnxruntime` must be enabled");
+    };
+
+    pub fn to_json(self) -> serde_json::Value {
         serde_json::to_value(self).expect("should not fail")
     }
 }
+
+#[derive(Debug)]
+pub(crate) struct DeviceAvailabilities(BTreeMap<GpuSpec, DeviceAvailability>);
+
+impl DeviceAvailabilities {
+    pub(crate) fn oks(&self) -> Vec<GpuSpec> {
+        self.0
+            .iter()
+            .filter(|(_, result)| matches!(result, DeviceAvailability::Ok))
+            .map(|(&gpu, _)| gpu)
+            .collect()
+    }
+}
+
+impl Display for DeviceAvailabilities {
+    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
+        for (gpu, availability) in &self.0 {
+            match availability {
+                DeviceAvailability::Ok => writeln!(f, "* {gpu}: OK"),
+                DeviceAvailability::Err(err) => {
+                    writeln!(f, "* {gpu}: {err}", err = err.to_string().trim_end())
+                }
+                DeviceAvailability::NotSupportedByThisLib => {
+                    writeln!(
+                        f,
+                        "* {gpu}: この`{name}`のビルドでは利用できません",
+                        name = env!("CARGO_PKG_NAME"),
+                    )
+                }
+                DeviceAvailability::NotSupportedByCurrentLoadedInferenceRuntime(name) => {
+                    writeln!(f, "* {gpu}: {name}では利用できません")
+                }
+            }?;
+        }
+        Ok(())
+    }
+}
+
+#[derive(Debug)]
+enum DeviceAvailability {
+    Ok,
+    Err(anyhow::Error),
+    NotSupportedByThisLib,
+    NotSupportedByCurrentLoadedInferenceRuntime(&'static str),
+}
+
+#[derive(Clone, Copy, PartialEq, Debug, derive_more::Display)]
+pub(crate) enum DeviceSpec {
+    #[display(fmt = "CPU")]
+    Cpu,
+
+    #[display(fmt = "{_0}")]
+    Gpu(GpuSpec),
+}
+
+#[derive(Clone, Copy, PartialEq, Eq, PartialOrd, Ord, Debug, derive_more::Display)]
+pub(crate) enum GpuSpec {
+    #[display(fmt = "CUDA (device_id=0)")]
+    Cuda,
+
+    #[display(fmt = "DirectML (device_id=0)")]
+    Dml,
+}
+
+impl GpuSpec {
+    pub(crate) fn defaults() -> Vec<Self> {
+        vec![Self::Cuda, Self::Dml]
+    }
+}
+
+impl Index<GpuSpec> for SupportedDevices {
+    type Output = bool;
+
+    fn index(&self, gpu: GpuSpec) -> &Self::Output {
+        match gpu {
+            GpuSpec::Cuda => &self.cuda,
+            GpuSpec::Dml => &self.dml,
+        }
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use pretty_assertions::assert_eq;
+
+    use super::{GpuSpec, SupportedDevices};
+
+    #[test]
+    fn gpu_spec_defaults_is_exhaustive() {
+        static SUPPORTED_DEVICES: SupportedDevices = SupportedDevices::THIS; // whatever
+
+        assert_eq!(
+            {
+                #[forbid(unused_variables)]
+                let SupportedDevices { cpu: _, cuda, dml } = &SUPPORTED_DEVICES;
+                [cuda as *const _, dml as *const _]
+            },
+            *GpuSpec::defaults()
+                .into_iter()
+                .map(|gpu| &SUPPORTED_DEVICES[gpu] as *const _)
+                .collect::<Vec<_>>(),
+        );
+    }
+}
diff --git a/crates/voicevox_core/src/error.rs b/crates/voicevox_core/src/error.rs
index d0e7fced0..0125b1cc6 100644
--- a/crates/voicevox_core/src/error.rs
+++ b/crates/voicevox_core/src/error.rs
@@ -1,4 +1,5 @@
 use crate::{
+    devices::DeviceAvailabilities,
     engine::{FullContextLabelError, KanaParseError},
     user_dict::InvalidWordError,
     StyleId, StyleType, VoiceModelId,
@@ -33,7 +34,7 @@ impl Error {
     pub fn kind(&self) -> ErrorKind {
         match &self.0 {
             ErrorRepr::NotLoadedOpenjtalkDict => ErrorKind::NotLoadedOpenjtalkDict,
-            ErrorRepr::GpuSupport => ErrorKind::GpuSupport,
+            ErrorRepr::GpuSupport(_) => ErrorKind::GpuSupport,
             ErrorRepr::InitInferenceRuntime { .. } => ErrorKind::InitInferenceRuntime,
             ErrorRepr::LoadModel(LoadModelError { context, .. }) => match context {
                 LoadModelErrorKind::OpenZipFile => ErrorKind::OpenZipFile,
@@ -63,8 +64,8 @@ pub(crate) enum ErrorRepr {
     #[error("OpenJTalkの辞書が読み込まれていません")]
     NotLoadedOpenjtalkDict,
 
-    #[error("GPU機能をサポートすることができません")]
-    GpuSupport,
+    #[error("GPU機能をサポートすることができません:\n{_0}")]
+    GpuSupport(DeviceAvailabilities),
 
     #[error("{runtime_display_name}のロードまたは初期化ができませんでした")]
     InitInferenceRuntime {
diff --git a/crates/voicevox_core/src/infer.rs b/crates/voicevox_core/src/infer.rs
index cffd0d524..112ca6b53 100644
--- a/crates/voicevox_core/src/infer.rs
+++ b/crates/voicevox_core/src/infer.rs
@@ -11,16 +11,25 @@ use enum_map::{Enum, EnumMap};
 use ndarray::{Array, ArrayD, Dimension, ShapeError};
 use thiserror::Error;
 
-use crate::{StyleType, SupportedDevices};
+use crate::{
+    devices::{DeviceSpec, GpuSpec},
+    StyleType, SupportedDevices,
+};
 
 pub(crate) trait InferenceRuntime: 'static {
     // TODO: "session"とは何なのかを定め、ドキュメントを書く。`InferenceSessionSet`も同様。
     type Session: Sized + Send + 'static;
     type RunContext<'a>: From<&'a mut Self::Session> + PushInputTensor;
 
-    /// このライブラリで利用可能なデバイスの情報を取得する。
+    /// エラーメッセージなどに表示するための、このランタイムの名前。
+    const DISPLAY_NAME: &'static str;
+
+    /// このランタイムで利用可能なデバイスの情報を取得する。
     fn supported_devices(&self) -> crate::Result<SupportedDevices>;
 
+    /// GPUが実際に利用できそうかどうか判定する。
+    fn test_gpu(&self, gpu: GpuSpec) -> anyhow::Result<()>;
+
     #[allow(clippy::type_complexity)]
     fn new_session(
         &self,
@@ -187,7 +196,7 @@ impl<D: PartialEq> ParamInfo<D> {
 #[derive(new, Clone, Copy, PartialEq, Debug)]
 pub(crate) struct InferenceSessionOptions {
     pub(crate) cpu_num_threads: u16,
-    pub(crate) use_gpu: bool,
+    pub(crate) device: DeviceSpec,
 }
 
 #[derive(Error, Debug)]
diff --git a/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs b/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs
index 74dc8a601..15ba963eb 100644
--- a/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs
+++ b/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs
@@ -8,7 +8,10 @@ use ort::{
     GraphOptimizationLevel, IntoTensorElementType, TensorElementType, ValueType,
 };
 
-use crate::{devices::SupportedDevices, error::ErrorRepr};
+use crate::{
+    devices::{DeviceSpec, GpuSpec, SupportedDevices},
+    error::ErrorRepr,
+};
 
 use super::super::{
     DecryptModelError, InferenceRuntime, InferenceSessionOptions, InputScalarKind,
@@ -22,6 +25,14 @@ impl InferenceRuntime for self::blocking::Onnxruntime {
     type Session = ort::Session;
     type RunContext<'a> = OnnxruntimeRunContext<'a>;
 
+    const DISPLAY_NAME: &'static str = if cfg!(feature = "load-onnxruntime") {
+        "現在ロードされているONNX Runtime"
+    } else if cfg!(feature = "link-onnxruntime") {
+        "現在リンクされているONNX Runtime"
+    } else {
+        panic!("either `load-onnxruntime` or `link-onnxruntime` must be enabled");
+    };
+
     fn supported_devices(&self) -> crate::Result<SupportedDevices> {
         (|| {
             let cpu = CPUExecutionProvider::default().is_available()?;
@@ -40,6 +51,15 @@ impl InferenceRuntime for self::blocking::Onnxruntime {
         .map_err(Into::into)
     }
 
+    fn test_gpu(&self, gpu: GpuSpec) -> anyhow::Result<()> {
+        let sess_builder = &ort::SessionBuilder::new()?;
+        match gpu {
+            GpuSpec::Cuda => CUDAExecutionProvider::default().register(sess_builder),
+            GpuSpec::Dml => DirectMLExecutionProvider::default().register(sess_builder),
+        }
+        .map_err(Into::into)
+    }
+
     fn new_session(
         &self,
         model: impl FnOnce() -> std::result::Result<Vec<u8>, DecryptModelError>,
@@ -53,14 +73,18 @@ impl InferenceRuntime for self::blocking::Onnxruntime {
             .with_optimization_level(GraphOptimizationLevel::Level1)?
             .with_intra_threads(options.cpu_num_threads.into())?;
 
-        if options.use_gpu && cfg!(feature = "directml") {
-            builder = builder
-                .with_parallel_execution(false)?
-                .with_memory_pattern(false)?;
-            DirectMLExecutionProvider::default().register(&builder)?;
-        } else if options.use_gpu && cfg!(feature = "cuda") {
-            CUDAExecutionProvider::default().register(&builder)?;
-        }
+        match options.device {
+            DeviceSpec::Cpu => {}
+            DeviceSpec::Gpu(GpuSpec::Cuda) => {
+                CUDAExecutionProvider::default().register(&builder)?;
+            }
+            DeviceSpec::Gpu(GpuSpec::Dml) => {
+                builder = builder
+                    .with_parallel_execution(false)?
+                    .with_memory_pattern(false)?;
+                DirectMLExecutionProvider::default().register(&builder)?;
+            }
+        };
 
         let model = model()?;
         let sess = builder.commit_from_memory(&{ model })?;
@@ -365,7 +389,7 @@ pub(crate) mod blocking {
             }
         }
 
-        /// このライブラリで利用可能なデバイスの情報を取得する。
+        /// ONNX Runtimeとして利用可能なデバイスの情報を取得する。
         pub fn supported_devices(&self) -> crate::Result<SupportedDevices> {
             <Self as InferenceRuntime>::supported_devices(self)
         }
@@ -517,7 +541,7 @@ pub(crate) mod tokio {
                 .map(Self::from_blocking)
         }
 
-        /// このライブラリで利用可能なデバイスの情報を取得する。
+        /// ONNX Runtimeとして利用可能なデバイスの情報を取得する。
         pub fn supported_devices(&self) -> crate::Result<SupportedDevices> {
             self.0.supported_devices()
         }
diff --git a/crates/voicevox_core/src/lib.rs b/crates/voicevox_core/src/lib.rs
index 25ff64f9e..fedf538cf 100644
--- a/crates/voicevox_core/src/lib.rs
+++ b/crates/voicevox_core/src/lib.rs
@@ -2,39 +2,25 @@
 //!
 //! # Feature flags
 //!
-//! ## ONNX Runtimeのリンク方法を決めるフィーチャ
-//!
 //! このクレートの利用にあたっては以下の二つの[Cargoフィーチャ]のうちどちらかを有効にしなければなり
 //! ません。両方の有効化はコンパイルエラーとなります。[`Onnxruntime`]の初期化方法はこれらの
 //! フィーチャによって決まります。
 //!
-//! - **`load-onnxruntime`**: ONNX Runtimeを`dlopen`/`LoadLibraryExW`で開きます。
+//! - **`load-onnxruntime`**: ONNX Runtimeを`dlopen`/`LoadLibraryExW`で
+//!     開きます。[CUDA]と[DirectML]が利用できます。
 //! - **`link-onnxruntime`**: ONNX Runtimeをロード時動的リンクします。iOSのような`dlopen`の利用が
 //!     困難な環境でのみこちらを利用するべきです。_Note_:
 //!     [動的リンク対象のライブラリ名]は`onnxruntime`で固定です。変更
-//!     は`patchelf(1)`や`install_name_tool(1)`で行ってください。
-//!
-//! ## GPUを利用可能にするフィーチャ
-//!
-//! - **`cuda`**
-//! - **`directml`**
-// TODO: こんな感じ(↓)で書く
-////! - **`cuda`**: [CUDAを用いた機械学習推論]を可能にします。
-////!     - ❗ <code>[acceleration\_mode]={Gpu,Auto}</code>のときの挙動が変化します。`directml`と共に
-////!         有効化したときの挙動は未規定です。
-////! - **`directml`**: [DirectMLを用いた機械学習推論]を可能にします。
-////!     - ❗ 〃
-////!
-////! [CUDAを用いた機械学習推論]:
-////! https://onnxruntime.ai/docs/execution-providers/CUDA-ExecutionProvider.html
-////! [DirectMLを用いた機械学習推論]:
-////! https://onnxruntime.ai/docs/execution-providers/DirectML-ExecutionProvider.html
-////! [acceleration\_mode]: InitializeOptions::acceleration_mode
+//!     は`patchelf(1)`や`install_name_tool(1)`で行ってください。また、[ONNX RuntimeのGPU機能]を使う
+//!     ことはできません。
 //!
 //! [Cargoフィーチャ]: https://doc.rust-lang.org/stable/cargo/reference/features.html
+//! [CUDA]: https://onnxruntime.ai/docs/execution-providers/CUDA-ExecutionProvider.html
+//! [DirectML]: https://onnxruntime.ai/docs/execution-providers/DirectML-ExecutionProvider.html
 //! [動的リンク対象のライブラリ名]:
 //! https://doc.rust-lang.org/cargo/reference/build-scripts.html#rustc-link-lib
 //! [`Onnxruntime`]: blocking::Onnxruntime
+//! [ONNX RuntimeのGPU機能]: https://onnxruntime.ai/docs/execution-providers/
 
 #![cfg_attr(docsrs, feature(doc_cfg))]
 
diff --git a/crates/voicevox_core/src/status.rs b/crates/voicevox_core/src/status.rs
index 8c75d64d9..419be52f5 100644
--- a/crates/voicevox_core/src/status.rs
+++ b/crates/voicevox_core/src/status.rs
@@ -350,6 +350,7 @@ mod tests {
     use rstest::rstest;
 
     use crate::{
+        devices::{DeviceSpec, GpuSpec},
         infer::{
             domains::{InferenceDomainMap, TalkOperation},
             InferenceSessionOptions,
@@ -360,16 +361,16 @@ mod tests {
     use super::Status;
 
     #[rstest]
-    #[case(true, 0)]
-    #[case(true, 1)]
-    #[case(true, 8)]
-    #[case(false, 2)]
-    #[case(false, 4)]
-    #[case(false, 8)]
-    #[case(false, 0)]
-    fn status_new_works(#[case] use_gpu: bool, #[case] cpu_num_threads: u16) {
-        let light_session_options = InferenceSessionOptions::new(cpu_num_threads, false);
-        let heavy_session_options = InferenceSessionOptions::new(cpu_num_threads, use_gpu);
+    #[case(DeviceSpec::Gpu(GpuSpec::Cuda), 0)]
+    #[case(DeviceSpec::Gpu(GpuSpec::Cuda), 1)]
+    #[case(DeviceSpec::Gpu(GpuSpec::Cuda), 8)]
+    #[case(DeviceSpec::Cpu, 2)]
+    #[case(DeviceSpec::Cpu, 4)]
+    #[case(DeviceSpec::Cpu, 8)]
+    #[case(DeviceSpec::Cpu, 0)]
+    fn status_new_works(#[case] device_for_heavy: DeviceSpec, #[case] cpu_num_threads: u16) {
+        let light_session_options = InferenceSessionOptions::new(cpu_num_threads, DeviceSpec::Cpu);
+        let heavy_session_options = InferenceSessionOptions::new(cpu_num_threads, device_for_heavy);
         let session_options = InferenceDomainMap {
             talk: enum_map! {
                 TalkOperation::PredictDuration
@@ -404,7 +405,7 @@ mod tests {
         let status = Status::new(
             crate::blocking::Onnxruntime::from_test_util_data().unwrap(),
             InferenceDomainMap {
-                talk: enum_map!(_ => InferenceSessionOptions::new(0, false)),
+                talk: enum_map!(_ => InferenceSessionOptions::new(0, DeviceSpec::Cpu)),
             },
         );
         let model = &crate::tokio::VoiceModel::sample().await.unwrap();
@@ -420,7 +421,7 @@ mod tests {
         let status = Status::new(
             crate::blocking::Onnxruntime::from_test_util_data().unwrap(),
             InferenceDomainMap {
-                talk: enum_map!(_ => InferenceSessionOptions::new(0, false)),
+                talk: enum_map!(_ => InferenceSessionOptions::new(0, DeviceSpec::Cpu)),
             },
         );
         let vvm = &crate::tokio::VoiceModel::sample().await.unwrap();
diff --git a/crates/voicevox_core/src/synthesizer.rs b/crates/voicevox_core/src/synthesizer.rs
index a11af2d5b..adae7c4b5 100644
--- a/crates/voicevox_core/src/synthesizer.rs
+++ b/crates/voicevox_core/src/synthesizer.rs
@@ -45,7 +45,7 @@ impl Default for TtsOptions {
 }
 
 /// ハードウェアアクセラレーションモードを設定する設定値。
-#[derive(Default, Debug, PartialEq, Eq)]
+#[derive(Default, Clone, Copy, Debug, PartialEq, Eq)]
 pub enum AccelerationMode {
     /// 実行環境に合った適切なハードウェアアクセラレーションモードを選択する。
     #[default]
@@ -74,8 +74,10 @@ pub(crate) mod blocking {
     use std::io::{Cursor, Write as _};
 
     use enum_map::enum_map;
+    use tracing::info;
 
     use crate::{
+        devices::{DeviceSpec, GpuSpec},
         engine::{create_kana, mora_to_text, Mora, OjtPhoneme},
         error::ErrorRepr,
         infer::{
@@ -84,7 +86,7 @@ pub(crate) mod blocking {
                 PredictDurationOutput, PredictIntonationInput, PredictIntonationOutput, TalkDomain,
                 TalkOperation,
             },
-            InferenceSessionOptions,
+            InferenceRuntime as _, InferenceSessionOptions,
         },
         status::Status,
         text_analyzer::{KanaAnalyzer, OpenJTalkAnalyzer, TextAnalyzer},
@@ -150,31 +152,44 @@ pub(crate) mod blocking {
             #[cfg(windows)]
             list_windows_video_cards();
 
-            let use_gpu = match options.acceleration_mode {
-                AccelerationMode::Auto => {
-                    let supported_devices = onnxruntime.supported_devices()?;
+            let test_gpus = || {
+                info!("GPUをテストします:");
+                let availabilities = crate::devices::test_gpus(
+                    GpuSpec::defaults(),
+                    crate::blocking::Onnxruntime::DISPLAY_NAME,
+                    onnxruntime.supported_devices()?,
+                    |gpu| onnxruntime.test_gpu(gpu),
+                );
+                for line in availabilities.to_string().lines() {
+                    info!("  {line}");
+                }
+                crate::Result::Ok(availabilities)
+            };
 
-                    if cfg!(feature = "directml") {
-                        supported_devices.dml
-                    } else {
-                        supported_devices.cuda
+            let device_for_heavy = match options.acceleration_mode {
+                AccelerationMode::Auto => match *test_gpus()?.oks() {
+                    [] => DeviceSpec::Cpu,
+                    [gpu, ..] => DeviceSpec::Gpu(gpu),
+                },
+                AccelerationMode::Cpu => DeviceSpec::Cpu,
+                AccelerationMode::Gpu => {
+                    let availabilities = test_gpus()?;
+                    match *availabilities.oks() {
+                        [] => return Err(ErrorRepr::GpuSupport(availabilities).into()),
+                        [gpu, ..] => DeviceSpec::Gpu(gpu),
                     }
                 }
-                AccelerationMode::Cpu => false,
-                AccelerationMode::Gpu => true,
             };
 
-            if use_gpu && !can_support_gpu_feature(onnxruntime)? {
-                return Err(ErrorRepr::GpuSupport.into());
-            }
+            info!("{device_for_heavy}を利用します");
 
             // 軽いモデルはこちらを使う
             let light_session_options =
-                InferenceSessionOptions::new(options.cpu_num_threads, false);
+                InferenceSessionOptions::new(options.cpu_num_threads, DeviceSpec::Cpu);
 
             // 重いモデルはこちらを使う
             let heavy_session_options =
-                InferenceSessionOptions::new(options.cpu_num_threads, use_gpu);
+                InferenceSessionOptions::new(options.cpu_num_threads, device_for_heavy);
 
             let status = Status::new(
                 onnxruntime,
@@ -187,22 +202,14 @@ pub(crate) mod blocking {
                 },
             );
 
-            return Ok(Self {
+            let use_gpu = matches!(device_for_heavy, DeviceSpec::Gpu(_));
+
+            Ok(Self {
                 status,
                 open_jtalk_analyzer: OpenJTalkAnalyzer::new(open_jtalk),
                 kana_analyzer: KanaAnalyzer,
                 use_gpu,
-            });
-
-            fn can_support_gpu_feature(onnxruntime: &crate::blocking::Onnxruntime) -> Result<bool> {
-                let supported_devices = onnxruntime.supported_devices()?;
-
-                if cfg!(feature = "directml") {
-                    Ok(supported_devices.dml)
-                } else {
-                    Ok(supported_devices.cuda)
-                }
-            }
+            })
         }
 
         pub fn onnxruntime(&self) -> &'static crate::blocking::Onnxruntime {
@@ -993,13 +1000,13 @@ pub(crate) mod blocking {
             CreateDXGIFactory, IDXGIFactory, DXGI_ADAPTER_DESC, DXGI_ERROR_NOT_FOUND,
         };
 
-        info!("検出されたGPU (DirectMLには1番目のGPUが使われます):");
+        info!("検出されたGPU (DirectMLにはGPU 0が使われます):");
         match list_windows_video_cards() {
             Ok(descs) => {
-                for desc in descs {
+                for (device_id, desc) in descs.into_iter().enumerate() {
                     let description = OsString::from_wide(trim_nul(&desc.Description));
                     let vram = humansize::format_size(desc.DedicatedVideoMemory, BINARY);
-                    info!("  - {description:?} ({vram})");
+                    info!("  GPU {device_id}: {description:?} ({vram})");
                 }
             }
             Err(err) => error!("{err}"),
diff --git a/crates/voicevox_core_c_api/Cargo.toml b/crates/voicevox_core_c_api/Cargo.toml
index 29b66e55a..1b86521d1 100644
--- a/crates/voicevox_core_c_api/Cargo.toml
+++ b/crates/voicevox_core_c_api/Cargo.toml
@@ -15,8 +15,6 @@ name = "e2e"
 [features]
 load-onnxruntime = ["voicevox_core/load-onnxruntime"]
 link-onnxruntime = ["voicevox_core/link-onnxruntime"]
-cuda = ["voicevox_core/cuda"]
-directml = ["voicevox_core/directml"]
 
 [dependencies]
 anstream = { workspace = true, default-features = false, features = ["auto"] }
diff --git a/crates/voicevox_core_c_api/include/voicevox_core.h b/crates/voicevox_core_c_api/include/voicevox_core.h
index fe19a4c2e..fe514dfa9 100644
--- a/crates/voicevox_core_c_api/include/voicevox_core.h
+++ b/crates/voicevox_core_c_api/include/voicevox_core.h
@@ -806,11 +806,11 @@ __declspec(dllimport)
 char *voicevox_synthesizer_create_metas_json(const struct VoicevoxSynthesizer *synthesizer);
 
 /**
- * このライブラリで利用可能なデバイスの情報を、JSONで取得する。
+ * ONNX Runtimeとして利用可能なデバイスの情報を、JSONで取得する。
  *
  * JSONの解放は ::voicevox_json_free で行う。
  *
- * あくまで本ライブラリが対応しているデバイスの情報であることに注意。GPUが使える環境ではなかったとしても`cuda`や`dml`は`true`を示しうる。
+ * あくまでONNX Runtimeが対応しているデバイスの情報であることに注意。GPUが使える環境ではなかったとしても`cuda`や`dml`は`true`を示しうる。
  *
  * @param [in] onnxruntime
  * @param [out] output_supported_devices_json サポートデバイス情報のJSON文字列
diff --git a/crates/voicevox_core_c_api/src/lib.rs b/crates/voicevox_core_c_api/src/lib.rs
index a634e6ae8..6f157bf6b 100644
--- a/crates/voicevox_core_c_api/src/lib.rs
+++ b/crates/voicevox_core_c_api/src/lib.rs
@@ -650,11 +650,11 @@ pub extern "C" fn voicevox_synthesizer_create_metas_json(
     C_STRING_DROP_CHECKER.whitelist(metas).into_raw()
 }
 
-/// このライブラリで利用可能なデバイスの情報を、JSONで取得する。
+/// ONNX Runtimeとして利用可能なデバイスの情報を、JSONで取得する。
 ///
 /// JSONの解放は ::voicevox_json_free で行う。
 ///
-/// あくまで本ライブラリが対応しているデバイスの情報であることに注意。GPUが使える環境ではなかったとしても`cuda`や`dml`は`true`を示しうる。
+/// あくまでONNX Runtimeが対応しているデバイスの情報であることに注意。GPUが使える環境ではなかったとしても`cuda`や`dml`は`true`を示しうる。
 ///
 /// @param [in] onnxruntime
 /// @param [out] output_supported_devices_json サポートデバイス情報のJSON文字列
diff --git a/crates/voicevox_core_c_api/tests/e2e/log_mask.rs b/crates/voicevox_core_c_api/tests/e2e/log_mask.rs
index 9b08c9af7..93114976e 100644
--- a/crates/voicevox_core_c_api/tests/e2e/log_mask.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/log_mask.rs
@@ -30,7 +30,7 @@ impl Utf8Output {
     pub(crate) fn mask_windows_video_cards(self) -> Self {
         self.mask_stderr(
             static_regex!(
-                r#"(?m)^\{timestamp\}  INFO voicevox_core::synthesizer::blocking: 検出されたGPU \(DirectMLには1番目のGPUが使われます\):(\n\{timestamp\}  INFO voicevox_core::synthesizer::blocking:   - "[^"]+" \([0-9.]+ [a-zA-Z]+\))+"#,
+                r#"(?m)^\{timestamp\}  INFO voicevox_core::synthesizer::blocking: 検出されたGPU \(DirectMLにはGPU 0が使われます\):(\n\{timestamp\}  INFO voicevox_core::synthesizer::blocking:   GPU [0-9]+: "[^"]+" \([0-9.]+ [a-zA-Z]+\))+"#,
             ),
             "{windows-video-cards}",
         )
diff --git a/crates/voicevox_core_c_api/tests/e2e/snapshots.toml b/crates/voicevox_core_c_api/tests/e2e/snapshots.toml
index b623119dd..17ccd61f8 100644
--- a/crates/voicevox_core_c_api/tests/e2e/snapshots.toml
+++ b/crates/voicevox_core_c_api/tests/e2e/snapshots.toml
@@ -53,9 +53,11 @@ metas = '''
 stderr.windows = '''
 {timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
 {windows-video-cards}
+{timestamp}  INFO voicevox_core::synthesizer::blocking: CPUを利用します
 '''
 stderr.unix = '''
 {timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
+{timestamp}  INFO voicevox_core::synthesizer::blocking: CPUを利用します
 '''
 
 [compatible_engine_load_model_before_initialize]
@@ -97,9 +99,11 @@ output."こんにちは、音声合成の世界へようこそ".wav_length = 176
 stderr.windows = '''
 {timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
 {windows-video-cards}
+{timestamp}  INFO voicevox_core::synthesizer::blocking: CPUを利用します
 '''
 stderr.unix = '''
 {timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
+{timestamp}  INFO voicevox_core::synthesizer::blocking: CPUを利用します
 '''
 
 [synthesizer_new_output_json]
@@ -157,9 +161,11 @@ metas = '''
 stderr.windows = '''
 {timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
 {windows-video-cards}
+{timestamp}  INFO voicevox_core::synthesizer::blocking: CPUを利用します
 '''
 stderr.unix = '''
 {timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
+{timestamp}  INFO voicevox_core::synthesizer::blocking: CPUを利用します
 '''
 
 [tts_via_audio_query]
@@ -167,9 +173,11 @@ output."こんにちは、音声合成の世界へようこそ".wav_length = 176
 stderr.windows = '''
 {timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
 {windows-video-cards}
+{timestamp}  INFO voicevox_core::synthesizer::blocking: CPUを利用します
 '''
 stderr.unix = '''
 {timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
+{timestamp}  INFO voicevox_core::synthesizer::blocking: CPUを利用します
 '''
 
 # FIXME: "user_dict_load"のはず
@@ -177,9 +185,11 @@ stderr.unix = '''
 stderr.windows = '''
 {timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
 {windows-video-cards}
+{timestamp}  INFO voicevox_core::synthesizer::blocking: CPUを利用します
 '''
 stderr.unix = '''
 {timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
+{timestamp}  INFO voicevox_core::synthesizer::blocking: CPUを利用します
 '''
 
 [user_dict_manipulate]
diff --git a/crates/voicevox_core_java_api/Cargo.toml b/crates/voicevox_core_java_api/Cargo.toml
index e9cced8b2..ec4e2d616 100644
--- a/crates/voicevox_core_java_api/Cargo.toml
+++ b/crates/voicevox_core_java_api/Cargo.toml
@@ -7,10 +7,6 @@ publish.workspace = true
 [lib]
 crate-type = ["cdylib"]
 
-[features]
-cuda = ["voicevox_core/cuda"]
-directml = ["voicevox_core/directml"]
-
 [dependencies]
 android_logger.workspace = true
 chrono = { workspace = true, default-features = false, features = ["clock"] }
diff --git a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/GlobalInfo.java b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/GlobalInfo.java
index 010e69073..496c2ccc4 100644
--- a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/GlobalInfo.java
+++ b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/GlobalInfo.java
@@ -24,10 +24,10 @@ public static String getVersion() {
 
   // FIXME: `Onnxruntime`に移すか、独立させる
   /**
-   * このライブラリで利用可能なデバイスの情報。
+   * ONNX Runtimeとして利用可能なデバイスの情報。
    *
-   * <p>あくまで本ライブラリが対応しているデバイスの情報であることに注意。GPUが使える環境ではなかったとしても {@link #cuda} や {@link #dml} は {@code
-   * true} を示しうる。
+   * <p>あくまでONNX Runtimeが対応しているデバイスの情報であることに注意。GPUが使える環境ではなかったとしても {@link #cuda} や {@link #dml} は
+   * {@code true} を示しうる。
    */
   public static class SupportedDevices {
     /**
diff --git a/crates/voicevox_core_python_api/Cargo.toml b/crates/voicevox_core_python_api/Cargo.toml
index 48c92dfb4..e0877b623 100644
--- a/crates/voicevox_core_python_api/Cargo.toml
+++ b/crates/voicevox_core_python_api/Cargo.toml
@@ -7,10 +7,6 @@ publish.workspace = true
 [lib]
 crate-type = ["cdylib"]
 
-[features]
-cuda = ["voicevox_core/cuda"]
-directml = ["voicevox_core/directml"]
-
 [dependencies]
 camino.workspace = true
 easy-ext.workspace = true
diff --git a/crates/voicevox_core_python_api/python/voicevox_core/_models.py b/crates/voicevox_core_python_api/python/voicevox_core/_models.py
index f7929fae2..941ed84fc 100644
--- a/crates/voicevox_core_python_api/python/voicevox_core/_models.py
+++ b/crates/voicevox_core_python_api/python/voicevox_core/_models.py
@@ -90,9 +90,9 @@ class SpeakerMeta:
 @pydantic.dataclasses.dataclass
 class SupportedDevices:
     """
-    このライブラリで利用可能なデバイスの情報。
+    ONNX Runtimeとして利用可能なデバイスの情報。
 
-    あくまで本ライブラリが対応しているデバイスの情報であることに注意。GPUが使える環境ではなかったとしても
+    あくまでONNX Runtimeが対応しているデバイスの情報であることに注意。GPUが使える環境ではなかったとしても
     ``cuda`` や ``dml`` は ``True`` を示しうる。
     """
 
diff --git a/docs/downloader.md b/docs/downloader.md
index aeff5b4a8..76148197f 100644
--- a/docs/downloader.md
+++ b/docs/downloader.md
@@ -49,7 +49,7 @@ download
 または
 
 ```
-download --device cpu
+download --devices cpu
 ```
 
 <a id="directml"></a>
@@ -57,7 +57,7 @@ download --device cpu
 ## DirectML 版をダウンロードする場合
 
 ```
-download --device directml
+download --devices directml
 ```
 
 <a id="cuda"></a>
@@ -65,7 +65,7 @@ download --device directml
 ## CUDA 版をダウンロードする場合
 
 ```
-download --device cuda
+download --devices cuda
 ```
 
 <a id="help"></a>
diff --git a/docs/usage.md b/docs/usage.md
index e828ae220..067250126 100644
--- a/docs/usage.md
+++ b/docs/usage.md
@@ -31,10 +31,10 @@ chmod +x download
 ./download
 
 # DirectML版を利用する場合
-./download --device directml
+./download --devices directml
 
 # CUDA版を利用する場合
-./download --device cuda
+./download --devices cuda
 ```
 
 `voicevox_core`ディレクトリにファイル一式がダウンロードされています。以降の説明ではこのディレクトリで作業を行います。
diff --git a/example/cpp/windows/README.md b/example/cpp/windows/README.md
index 660d4190c..4012acdf9 100644
--- a/example/cpp/windows/README.md
+++ b/example/cpp/windows/README.md
@@ -14,7 +14,7 @@ Visual Studio Installerを使用しインストールしてください。
 
 出力フォルダを作成するために、一度ビルドします。「windows_example.sln」をVisual Studioで開き、メニューの「ビルド」→「ソリューションのビルド」を押します。
 この段階では、ビルドは失敗します。「bin」フォルダと「lib」フォルダが生成されていればOKです。  
-[Releases](https://github.com/VOICEVOX/voicevox_core/releases/latest)から「voicevox_core-windows-x64-cpu-{バージョン名}.zip」をダウンロードし、展開します。[ダウンローダー](https://github.com/VOICEVOX/voicevox_core/blob/main/docs/downloader.md)を使うと便利です。  
+[Releases](https://github.com/VOICEVOX/voicevox_core/releases/latest)から「voicevox_core-windows-x64-{バージョン名}.zip」をダウンロードし、展開します。[ダウンローダー](https://github.com/VOICEVOX/voicevox_core/blob/main/docs/downloader.md)を使うと便利です。  
 展開してできたファイル・フォルダをそれぞれ下記のフォルダへ配置します。
 
 - simple_tts に配置
diff --git a/example/python/README.md b/example/python/README.md
index 97303eb81..48678edb2 100644
--- a/example/python/README.md
+++ b/example/python/README.md
@@ -18,6 +18,8 @@ https://github.com/VOICEVOX/voicevox_core/releases/latest
 
 2. ダウンローダーを使って環境構築します。
 
+FIXME: 今は`--exclude core`がある
+
 linux/mac の場合
 
 download-linux-x64 のところはアーキテクチャや OS によって適宜読み替えてください。

From 1e75e4e5ca7ec7fb447844b701f9d2ec5dcff2c2 Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Mon, 12 Aug 2024 02:35:08 +0900
Subject: [PATCH 18/36] =?UTF-8?q?chore:=20Rust=201.79=E3=81=A81.80?=
 =?UTF-8?q?=E3=81=A7=E8=BF=BD=E5=8A=A0=E3=81=95=E3=82=8C=E3=81=9F=E6=A9=9F?=
 =?UTF-8?q?=E8=83=BD=E3=82=92=E5=88=A9=E7=94=A8=E3=81=99=E3=82=8B=20(#816)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* `once_cell::sync::Lazy` → `std::sync::LazyLock`

* `NonNull`に直接生えたメソッドを使う

* `<[[T; N]]>::as_flattened`

* `if`と`match`でのライフタイム延長

* `associated_type_bounds`
---
 Cargo.lock                                    |  5 ----
 crates/downloader/Cargo.toml                  |  1 -
 crates/downloader/src/main.rs                 | 19 +++++++-------
 crates/test_util/Cargo.toml                   |  1 -
 crates/test_util/src/lib.rs                   |  4 +--
 crates/voicevox_core/Cargo.toml               |  1 -
 .../src/engine/acoustic_feature_extractor.rs  | 10 ++++----
 .../voicevox_core/src/engine/kana_parser.rs   | 11 +++++---
 .../voicevox_core/src/infer/domains/talk.rs   |  6 ++---
 crates/voicevox_core/src/infer/session_set.rs |  7 +++---
 crates/voicevox_core/src/metas.rs             |  7 +++---
 crates/voicevox_core/src/synthesizer.rs       | 15 +++++------
 .../src/user_dict/part_of_speech_data.rs      |  6 ++---
 crates/voicevox_core/src/user_dict/word.rs    | 16 ++++++------
 crates/voicevox_core/src/voice_model.rs       |  5 ++--
 crates/voicevox_core_c_api/Cargo.toml         |  1 -
 .../src/compatible_engine.rs                  | 15 ++++++-----
 crates/voicevox_core_c_api/src/drop_check.rs  |  2 +-
 crates/voicevox_core_c_api/src/lib.rs         | 25 ++++++-------------
 crates/voicevox_core_c_api/src/slice_owner.rs |  4 +--
 .../voicevox_core_c_api/tests/e2e/log_mask.rs |  5 ++--
 .../tests/e2e/snapshots.rs                    |  2 +-
 .../tests/e2e/testcases/compatible_engine.rs  |  4 +--
 ...ble_engine_load_model_before_initialize.rs |  5 ++--
 .../tests/e2e/testcases/global_info.rs        |  5 ++--
 .../tests/e2e/testcases/simple_tts.rs         |  5 ++--
 .../testcases/synthesizer_new_output_json.rs  |  4 +--
 .../e2e/testcases/tts_via_audio_query.rs      |  5 ++--
 .../tests/e2e/testcases/user_dict_load.rs     |  8 +++---
 .../e2e/testcases/user_dict_manipulate.rs     |  7 +++---
 crates/voicevox_core_java_api/Cargo.toml      |  1 -
 31 files changed, 96 insertions(+), 116 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index 9fdf8f695..3da1581da 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -1062,7 +1062,6 @@ dependencies = [
  "indicatif",
  "itertools 0.10.5",
  "octocrab",
- "once_cell",
  "parse-display",
  "rayon",
  "reqwest",
@@ -3782,7 +3781,6 @@ dependencies = [
  "fs-err",
  "indoc",
  "libloading 0.7.3",
- "once_cell",
  "reqwest",
  "serde",
  "serde_json",
@@ -4250,7 +4248,6 @@ dependencies = [
  "itertools 0.10.5",
  "jlabel",
  "ndarray",
- "once_cell",
  "open_jtalk",
  "ouroboros",
  "pretty_assertions",
@@ -4301,7 +4298,6 @@ dependencies = [
  "libtest-mimic",
  "ndarray",
  "ndarray-stats",
- "once_cell",
  "process_path",
  "ref-cast",
  "regex",
@@ -4330,7 +4326,6 @@ dependencies = [
  "duplicate",
  "easy-ext",
  "jni",
- "once_cell",
  "pretty_assertions",
  "rstest",
  "serde_json",
diff --git a/crates/downloader/Cargo.toml b/crates/downloader/Cargo.toml
index c60afd3b6..427a1854d 100644
--- a/crates/downloader/Cargo.toml
+++ b/crates/downloader/Cargo.toml
@@ -19,7 +19,6 @@ futures-util.workspace = true
 indicatif.workspace = true
 itertools.workspace = true
 octocrab = { workspace = true, default-features = false, features = ["rustls-tls", "stream"] }
-once_cell.workspace = true
 parse-display.workspace = true
 rayon.workspace = true
 reqwest = { workspace = true, default-features = false, features = ["rustls-tls", "stream"] }
diff --git a/crates/downloader/src/main.rs b/crates/downloader/src/main.rs
index 0432ea0a9..6ece6d054 100644
--- a/crates/downloader/src/main.rs
+++ b/crates/downloader/src/main.rs
@@ -5,7 +5,7 @@ use std::{
     future::Future,
     io::{self, Cursor, Read},
     path::{Path, PathBuf},
-    sync::Arc,
+    sync::{Arc, LazyLock},
     time::Duration,
 };
 
@@ -24,7 +24,6 @@ use octocrab::{
     },
     Octocrab,
 };
-use once_cell::sync::Lazy;
 use rayon::iter::{IntoParallelIterator as _, ParallelIterator as _};
 use strum::{Display, IntoStaticStr};
 use tokio::task::{JoinError, JoinSet};
@@ -43,7 +42,7 @@ const DEFAULT_CORE_REPO: &str = "VOICEVOX/voicevox_core";
 const DEFAULT_ONNXRUNTIME_BUILDER_REPO: &str = "VOICEVOX/onnxruntime-builder";
 const DEFAULT_ADDITIONAL_LIBRARIES_REPO: &str = "VOICEVOX/voicevox_additional_libraries";
 
-static OPEN_JTALK_DIC_URL: Lazy<Url> = Lazy::new(|| {
+static OPEN_JTALK_DIC_URL: LazyLock<Url> = LazyLock::new(|| {
     "https://jaist.dl.sourceforge.net/project/open-jtalk/Dictionary/open_jtalk_dic-1.11/open_jtalk_dic_utf_8-1.11.tar.gz"
         .parse()
         .unwrap()
@@ -449,8 +448,8 @@ fn find_onnxruntime(
 ) -> anyhow::Result<String> {
     macro_rules! selector {
         ($expr:expr $(,)?) => {{
-            static SELECTOR: Lazy<scraper::Selector> =
-                Lazy::new(|| scraper::Selector::parse($expr).expect("should be valid"));
+            static SELECTOR: LazyLock<scraper::Selector> =
+                LazyLock::new(|| scraper::Selector::parse($expr).expect("should be valid"));
             &SELECTOR
         }};
     }
@@ -595,8 +594,8 @@ fn add_progress_bar(
 
     const INTERVAL: Duration = Duration::from_millis(100);
 
-    static PROGRESS_STYLE: Lazy<ProgressStyle> =
-        Lazy::new(|| ProgressStyle::with_template("{prefix}").unwrap());
+    static PROGRESS_STYLE: LazyLock<ProgressStyle> =
+        LazyLock::new(|| ProgressStyle::with_template("{prefix}").unwrap());
 }
 
 async fn download_and_extract(
@@ -614,15 +613,15 @@ async fn download_and_extract(
     let files = &read_archive(archive, archive_kind, pb.clone()).await?;
     return extract(files, stripping, output, pb).await;
 
-    static PROGRESS_STYLE1: Lazy<ProgressStyle> = Lazy::new(|| {
+    static PROGRESS_STYLE1: LazyLock<ProgressStyle> = LazyLock::new(|| {
         ProgressStyle::with_template(
             "{prefix:55} {bytes:>11} {bytes_per_sec:>13} {elapsed_precise} {bar} {percent:>3}%",
         )
         .unwrap()
     });
 
-    static PROGRESS_STYLE2: Lazy<ProgressStyle> =
-        Lazy::new(|| ProgressStyle::with_template("{prefix:55} {spinner} {msg}").unwrap());
+    static PROGRESS_STYLE2: LazyLock<ProgressStyle> =
+        LazyLock::new(|| ProgressStyle::with_template("{prefix:55} {spinner} {msg}").unwrap());
 
     async fn with_style(
         pb: ProgressBar,
diff --git a/crates/test_util/Cargo.toml b/crates/test_util/Cargo.toml
index fe0c2f6dd..329d5f603 100644
--- a/crates/test_util/Cargo.toml
+++ b/crates/test_util/Cargo.toml
@@ -4,7 +4,6 @@ edition.workspace = true
 
 [dependencies]
 libloading.workspace = true
-once_cell.workspace = true
 serde = { workspace = true, features = ["derive"] }
 serde_json.workspace = true
 
diff --git a/crates/test_util/src/lib.rs b/crates/test_util/src/lib.rs
index 6473e438e..740cfb415 100644
--- a/crates/test_util/src/lib.rs
+++ b/crates/test_util/src/lib.rs
@@ -17,7 +17,7 @@ pub mod c_api {
     pub const VV_MODELS_ROOT_DIR: &str = super::VV_MODELS_ROOT_DIR;
 }
 
-use once_cell::sync::Lazy;
+use std::sync::LazyLock;
 
 pub use self::typing::{
     DecodeExampleData, DurationExampleData, ExampleData, IntonationExampleData,
@@ -36,6 +36,6 @@ const EXAMPLE_DATA_JSON: &str = include_str!(concat!(
     "/data/example_data.json"
 ));
 
-pub static EXAMPLE_DATA: Lazy<ExampleData> = Lazy::new(|| {
+pub static EXAMPLE_DATA: LazyLock<ExampleData> = LazyLock::new(|| {
     serde_json::from_str(EXAMPLE_DATA_JSON).expect("failed to parse example_data.json")
 });
diff --git a/crates/voicevox_core/Cargo.toml b/crates/voicevox_core/Cargo.toml
index c9ed52725..8cb2b1cfc 100644
--- a/crates/voicevox_core/Cargo.toml
+++ b/crates/voicevox_core/Cargo.toml
@@ -32,7 +32,6 @@ indexmap = { workspace = true, features = ["serde"] }
 itertools.workspace = true
 jlabel.workspace = true
 ndarray.workspace = true
-once_cell.workspace = true
 open_jtalk.workspace = true
 ouroboros.workspace = true
 rayon.workspace = true
diff --git a/crates/voicevox_core/src/engine/acoustic_feature_extractor.rs b/crates/voicevox_core/src/engine/acoustic_feature_extractor.rs
index 5ee7ea540..a75770dd9 100644
--- a/crates/voicevox_core/src/engine/acoustic_feature_extractor.rs
+++ b/crates/voicevox_core/src/engine/acoustic_feature_extractor.rs
@@ -1,7 +1,7 @@
+use std::{collections::HashMap, sync::LazyLock};
+
 use derive_getters::Getters;
 use derive_new::new;
-use once_cell::sync::Lazy;
-use std::collections::HashMap;
 
 #[rustfmt::skip]
 const PHONEME_LIST: &[&str] = &[
@@ -52,7 +52,7 @@ const PHONEME_LIST: &[&str] = &[
     "z",
 ];
 
-static PHONEME_MAP: Lazy<HashMap<&str, i64>> = Lazy::new(|| {
+static PHONEME_MAP: LazyLock<HashMap<&str, i64>> = LazyLock::new(|| {
     let mut m = HashMap::new();
     for (i, s) in PHONEME_LIST.iter().enumerate() {
         m.insert(*s, i as i64);
@@ -70,8 +70,8 @@ pub(crate) struct OjtPhoneme {
 }
 
 impl OjtPhoneme {
-    pub(crate) fn num_phoneme() -> usize {
-        PHONEME_MAP.len()
+    pub(crate) const fn num_phoneme() -> usize {
+        PHONEME_LIST.len() // == PHONEME_MAP.len()
     }
 
     fn space_phoneme() -> String {
diff --git a/crates/voicevox_core/src/engine/kana_parser.rs b/crates/voicevox_core/src/engine/kana_parser.rs
index 9397376f6..67aa276cb 100644
--- a/crates/voicevox_core/src/engine/kana_parser.rs
+++ b/crates/voicevox_core/src/engine/kana_parser.rs
@@ -1,7 +1,10 @@
-use crate::engine::model::{AccentPhrase, Mora};
-use crate::engine::mora_list::MORA_LIST_MINIMUM;
-use once_cell::sync::Lazy;
 use std::collections::HashMap;
+use std::sync::LazyLock;
+
+use crate::engine::{
+    model::{AccentPhrase, Mora},
+    mora_list::MORA_LIST_MINIMUM,
+};
 
 const UNVOICE_SYMBOL: char = '_';
 const ACCENT_SYMBOL: char = '\'';
@@ -16,7 +19,7 @@ pub(crate) struct KanaParseError(String);
 
 type KanaParseResult<T> = std::result::Result<T, KanaParseError>;
 
-static TEXT2MORA_WITH_UNVOICE: Lazy<HashMap<String, Mora>> = Lazy::new(|| {
+static TEXT2MORA_WITH_UNVOICE: LazyLock<HashMap<String, Mora>> = LazyLock::new(|| {
     let mut text2mora_with_unvoice = HashMap::new();
     for [text, consonant, vowel] in MORA_LIST_MINIMUM {
         let consonant = if !consonant.is_empty() {
diff --git a/crates/voicevox_core/src/infer/domains/talk.rs b/crates/voicevox_core/src/infer/domains/talk.rs
index e0716fa50..b2470c124 100644
--- a/crates/voicevox_core/src/infer/domains/talk.rs
+++ b/crates/voicevox_core/src/infer/domains/talk.rs
@@ -1,9 +1,8 @@
-use std::collections::BTreeSet;
+use std::{collections::BTreeSet, sync::LazyLock};
 
 use enum_map::Enum;
 use macros::{InferenceInputSignature, InferenceOperation, InferenceOutputSignature};
 use ndarray::{Array0, Array1, Array2};
-use once_cell::sync::Lazy;
 
 use crate::StyleType;
 
@@ -17,7 +16,8 @@ impl InferenceDomain for TalkDomain {
     type Operation = TalkOperation;
 
     fn style_types() -> &'static BTreeSet<StyleType> {
-        static STYLE_TYPES: Lazy<BTreeSet<StyleType>> = Lazy::new(|| [StyleType::Talk].into());
+        static STYLE_TYPES: LazyLock<BTreeSet<StyleType>> =
+            LazyLock::new(|| [StyleType::Talk].into());
         &STYLE_TYPES
     }
 }
diff --git a/crates/voicevox_core/src/infer/session_set.rs b/crates/voicevox_core/src/infer/session_set.rs
index 95f081bac..ad85e93ac 100644
--- a/crates/voicevox_core/src/infer/session_set.rs
+++ b/crates/voicevox_core/src/infer/session_set.rs
@@ -61,8 +61,8 @@ impl<R: InferenceRuntime, D: InferenceDomain> InferenceSessionSet<R, D> {
                 .iter()
                 .map(|ParamInfo { name, dt, ndim }| {
                     let brackets = match *ndim {
-                        Some(ndim) => "[]".repeat(ndim),
-                        None => "[]...".to_owned(),
+                        Some(ndim) => &"[]".repeat(ndim),
+                        None => "[]...",
                     };
                     format!("{name}: {dt}{brackets}")
                 })
@@ -74,8 +74,7 @@ impl<R: InferenceRuntime, D: InferenceDomain> InferenceSessionSet<R, D> {
 impl<R: InferenceRuntime, D: InferenceDomain> InferenceSessionSet<R, D> {
     pub(crate) fn get<I>(&self) -> InferenceSessionCell<R, I>
     where
-        I: InferenceInputSignature,
-        I::Signature: InferenceSignature<Domain = D>,
+        I: InferenceInputSignature<Signature: InferenceSignature<Domain = D>>,
     {
         InferenceSessionCell {
             inner: self.0[I::Signature::OPERATION].clone(),
diff --git a/crates/voicevox_core/src/metas.rs b/crates/voicevox_core/src/metas.rs
index 1fb4a7f9d..97c3922c7 100644
--- a/crates/voicevox_core/src/metas.rs
+++ b/crates/voicevox_core/src/metas.rs
@@ -209,12 +209,13 @@ pub enum StyleType {
 
 #[cfg(test)]
 mod tests {
-    use once_cell::sync::Lazy;
+    use std::sync::LazyLock;
+
     use serde_json::json;
 
     #[test]
     fn merge_works() -> anyhow::Result<()> {
-        static INPUT: Lazy<serde_json::Value> = Lazy::new(|| {
+        static INPUT: LazyLock<serde_json::Value> = LazyLock::new(|| {
             json!([
                 {
                     "name": "B",
@@ -267,7 +268,7 @@ mod tests {
             ])
         });
 
-        static EXPECTED: Lazy<serde_json::Value> = Lazy::new(|| {
+        static EXPECTED: LazyLock<serde_json::Value> = LazyLock::new(|| {
             json!([
                 {
                     "name": "A",
diff --git a/crates/voicevox_core/src/synthesizer.rs b/crates/voicevox_core/src/synthesizer.rs
index adae7c4b5..8dcbf848a 100644
--- a/crates/voicevox_core/src/synthesizer.rs
+++ b/crates/voicevox_core/src/synthesizer.rs
@@ -265,12 +265,12 @@ pub(crate) mod blocking {
             } = audio_query;
 
             let accent_phrases = if options.enable_interrogative_upspeak {
-                adjust_interrogative_accent_phrases(accent_phrases)
+                &adjust_interrogative_accent_phrases(accent_phrases)
             } else {
-                accent_phrases.clone()
+                accent_phrases
             };
 
-            let (flatten_moras, phoneme_data_list) = initial_process(&accent_phrases);
+            let (flatten_moras, phoneme_data_list) = initial_process(accent_phrases);
 
             let mut phoneme_length_list = vec![*pre_phoneme_length];
             let mut f0_list = vec![0.];
@@ -318,7 +318,7 @@ pub(crate) mod blocking {
 
             let (_, _, vowel_indexes) = split_mora(&phoneme_data_list);
 
-            let mut phoneme: Vec<Vec<f32>> = Vec::new();
+            let mut phoneme = Vec::new();
             let mut f0: Vec<f32> = Vec::new();
             {
                 const RATE: f32 = 24000. / 256.;
@@ -335,7 +335,7 @@ pub(crate) mod blocking {
                     let phoneme_id = phoneme_data_list[i].phoneme_id();
 
                     for _ in 0..phoneme_length {
-                        let mut phonemes_vec = vec![0.; OjtPhoneme::num_phoneme()];
+                        let mut phonemes_vec = [0.; OjtPhoneme::num_phoneme()];
                         phonemes_vec[phoneme_id as usize] = 1.;
                         phoneme.push(phonemes_vec)
                     }
@@ -352,14 +352,11 @@ pub(crate) mod blocking {
                 }
             }
 
-            // 2次元のvectorを1次元に変換し、アドレスを連続させる
-            let flatten_phoneme = phoneme.into_iter().flatten().collect::<Vec<_>>();
-
             let wave = &self.decode(
                 f0.len(),
                 OjtPhoneme::num_phoneme(),
                 &f0,
-                &flatten_phoneme,
+                phoneme.as_flattened(),
                 style_id,
             )?;
             return Ok(to_wav(wave, audio_query));
diff --git a/crates/voicevox_core/src/user_dict/part_of_speech_data.rs b/crates/voicevox_core/src/user_dict/part_of_speech_data.rs
index b7bc95440..908885c65 100644
--- a/crates/voicevox_core/src/user_dict/part_of_speech_data.rs
+++ b/crates/voicevox_core/src/user_dict/part_of_speech_data.rs
@@ -1,5 +1,5 @@
-use once_cell::sync::Lazy;
 use std::collections::HashMap;
+use std::sync::LazyLock;
 
 use crate::UserDictWordType;
 
@@ -30,8 +30,8 @@ pub(super) struct PartOfSpeechDetail {
 }
 
 // 元データ： https://github.com/VOICEVOX/voicevox_engine/blob/master/voicevox_engine/part_of_speech_data.py
-pub(super) static PART_OF_SPEECH_DETAIL: Lazy<HashMap<UserDictWordType, PartOfSpeechDetail>> =
-    Lazy::new(|| {
+pub(super) static PART_OF_SPEECH_DETAIL: LazyLock<HashMap<UserDictWordType, PartOfSpeechDetail>> =
+    LazyLock::new(|| {
         HashMap::from_iter([
             (
                 UserDictWordType::ProperNoun,
diff --git a/crates/voicevox_core/src/user_dict/word.rs b/crates/voicevox_core/src/user_dict/word.rs
index f6bbc182f..0a42f1da5 100644
--- a/crates/voicevox_core/src/user_dict/word.rs
+++ b/crates/voicevox_core/src/user_dict/word.rs
@@ -1,3 +1,8 @@
+use std::{ops::RangeToInclusive, sync::LazyLock};
+
+use regex::Regex;
+use serde::{de::Error as _, Deserialize, Serialize};
+
 use crate::{
     error::ErrorRepr,
     result::Result,
@@ -5,10 +10,6 @@ use crate::{
         priority2cost, MAX_PRIORITY, MIN_PRIORITY, PART_OF_SPEECH_DETAIL,
     },
 };
-use once_cell::sync::Lazy;
-use regex::Regex;
-use serde::{de::Error as _, Deserialize, Serialize};
-use std::ops::RangeToInclusive;
 
 /// ユーザー辞書の単語。
 #[derive(Clone, Debug, Serialize)]
@@ -77,8 +78,9 @@ impl InvalidWordError {
 
 type InvalidWordResult<T> = std::result::Result<T, InvalidWordError>;
 
-static PRONUNCIATION_REGEX: Lazy<Regex> = Lazy::new(|| Regex::new(r"^[ァ-ヴー]+$").unwrap());
-static MORA_REGEX: Lazy<Regex> = Lazy::new(|| {
+static PRONUNCIATION_REGEX: LazyLock<Regex> =
+    LazyLock::new(|| Regex::new(r"^[ァ-ヴー]+$").unwrap());
+static MORA_REGEX: LazyLock<Regex> = LazyLock::new(|| {
     Regex::new(concat!(
         "(?:",
         "[イ][ェ]|[ヴ][ャュョ]|[トド][ゥ]|[テデ][ィャュョ]|[デ][ェ]|[クグ][ヮ]|", // rule_others
@@ -89,7 +91,7 @@ static MORA_REGEX: Lazy<Regex> = Lazy::new(|| {
     ))
     .unwrap()
 });
-static SPACE_REGEX: Lazy<Regex> = Lazy::new(|| Regex::new(r"\p{Z}").unwrap());
+static SPACE_REGEX: LazyLock<Regex> = LazyLock::new(|| Regex::new(r"\p{Z}").unwrap());
 
 impl Default for UserDictWord {
     fn default() -> Self {
diff --git a/crates/voicevox_core/src/voice_model.rs b/crates/voicevox_core/src/voice_model.rs
index 027747ab7..48477256c 100644
--- a/crates/voicevox_core/src/voice_model.rs
+++ b/crates/voicevox_core/src/voice_model.rs
@@ -454,7 +454,8 @@ pub(crate) mod tokio {
 
 #[cfg(test)]
 mod tests {
-    use once_cell::sync::Lazy;
+    use std::sync::LazyLock;
+
     use rstest::{fixture, rstest};
     use serde_json::json;
 
@@ -501,7 +502,7 @@ mod tests {
         assert_eq!(expected, actual);
     }
 
-    static TALK_MANIFEST: Lazy<TalkManifest> = Lazy::new(|| TalkManifest {
+    static TALK_MANIFEST: LazyLock<TalkManifest> = LazyLock::new(|| TalkManifest {
         predict_duration_filename: "".to_owned(),
         predict_intonation_filename: "".to_owned(),
         decode_filename: "".to_owned(),
diff --git a/crates/voicevox_core_c_api/Cargo.toml b/crates/voicevox_core_c_api/Cargo.toml
index 1b86521d1..996367a5f 100644
--- a/crates/voicevox_core_c_api/Cargo.toml
+++ b/crates/voicevox_core_c_api/Cargo.toml
@@ -29,7 +29,6 @@ easy-ext.workspace = true
 futures.workspace = true
 itertools.workspace = true
 libc.workspace = true
-once_cell.workspace = true
 process_path.workspace = true
 ref-cast.workspace = true
 serde_json = { workspace = true, features = ["preserve_order"] }
diff --git a/crates/voicevox_core_c_api/src/compatible_engine.rs b/crates/voicevox_core_c_api/src/compatible_engine.rs
index 70fa83710..68b836f2f 100644
--- a/crates/voicevox_core_c_api/src/compatible_engine.rs
+++ b/crates/voicevox_core_c_api/src/compatible_engine.rs
@@ -2,12 +2,11 @@ use std::{
     collections::BTreeMap,
     env,
     ffi::{c_char, CString},
-    sync::{Mutex, MutexGuard},
+    sync::{LazyLock, Mutex, MutexGuard},
 };
 
 use libc::c_int;
 
-use once_cell::sync::Lazy;
 use voicevox_core::{StyleId, VoiceModelId, __internal::interop::PerformInference as _};
 
 use crate::{helpers::display_error, init_logger_once};
@@ -24,9 +23,9 @@ macro_rules! ensure_initialized {
     };
 }
 
-static ERROR_MESSAGE: Lazy<Mutex<String>> = Lazy::new(|| Mutex::new(String::new()));
+static ERROR_MESSAGE: LazyLock<Mutex<String>> = LazyLock::new(|| Mutex::new(String::new()));
 
-static ONNXRUNTIME: Lazy<&'static voicevox_core::blocking::Onnxruntime> = Lazy::new(|| {
+static ONNXRUNTIME: LazyLock<&'static voicevox_core::blocking::Onnxruntime> = LazyLock::new(|| {
     voicevox_core::blocking::Onnxruntime::load_once()
         .exec()
         .unwrap_or_else(|err| {
@@ -42,7 +41,7 @@ struct VoiceModelSet {
     model_map: BTreeMap<VoiceModelId, voicevox_core::blocking::VoiceModel>,
 }
 
-static VOICE_MODEL_SET: Lazy<VoiceModelSet> = Lazy::new(|| {
+static VOICE_MODEL_SET: LazyLock<VoiceModelSet> = LazyLock::new(|| {
     let all_vvms = get_all_models();
     let model_map: BTreeMap<_, _> = all_vvms.iter().map(|vvm| (vvm.id(), vvm.clone())).collect();
     let metas = voicevox_core::__internal::interop::merge_metas(
@@ -99,8 +98,8 @@ fn voice_model_set() -> &'static VoiceModelSet {
     &VOICE_MODEL_SET
 }
 
-static SYNTHESIZER: Lazy<Mutex<Option<voicevox_core::blocking::Synthesizer<()>>>> =
-    Lazy::new(|| Mutex::new(None));
+static SYNTHESIZER: LazyLock<Mutex<Option<voicevox_core::blocking::Synthesizer<()>>>> =
+    LazyLock::new(|| Mutex::new(None));
 
 fn lock_synthesizer() -> MutexGuard<'static, Option<voicevox_core::blocking::Synthesizer<()>>> {
     SYNTHESIZER.lock().unwrap()
@@ -203,7 +202,7 @@ pub extern "C" fn supported_devices() -> *const c_char {
     init_logger_once();
     return SUPPORTED_DEVICES.as_ptr();
 
-    static SUPPORTED_DEVICES: Lazy<CString> = Lazy::new(|| {
+    static SUPPORTED_DEVICES: LazyLock<CString> = LazyLock::new(|| {
         CString::new(
             ONNXRUNTIME
                 .supported_devices()
diff --git a/crates/voicevox_core_c_api/src/drop_check.rs b/crates/voicevox_core_c_api/src/drop_check.rs
index 36acec570..09b94c284 100644
--- a/crates/voicevox_core_c_api/src/drop_check.rs
+++ b/crates/voicevox_core_c_api/src/drop_check.rs
@@ -13,7 +13,7 @@ use std::{
 /// `CString`は`Box<impl Sized>`と同様Cの世界でもポインタ一つで実体を表すことができるため、こちら側
 /// で管理すべきものは本来無い。しかしながら本クレートが提供するAPIには「解放不要」な文字列を返すも
 /// のが含まれている。ユーザーが誤ってそのような文字列を解放するのは未定義動作 (undefined behavior)
-/// であるため、綺麗にSEGVするとも限らない。`once_cell::sync::Lazy`由来の文字列の場合、最悪解放が成
+/// であるため、綺麗にSEGVするとも限らない。`std::sync::LazyLock`由来の文字列の場合、最悪解放が成
 /// 功してしまう。
 ///
 /// この構造体はCの世界から帰ってきた`*mut c_char`を`CString`としてdropする際、それが本当にこちら側
diff --git a/crates/voicevox_core_c_api/src/lib.rs b/crates/voicevox_core_c_api/src/lib.rs
index 6f157bf6b..f35179807 100644
--- a/crates/voicevox_core_c_api/src/lib.rs
+++ b/crates/voicevox_core_c_api/src/lib.rs
@@ -218,7 +218,7 @@ pub unsafe extern "C" fn voicevox_onnxruntime_load_once(
         let instance = VoicevoxOnnxruntime::load_once(filename)?;
         unsafe {
             // SAFETY: ユーザーに要求している条件で十分
-            out_onnxruntime.as_ptr().write_unaligned(instance);
+            out_onnxruntime.write_unaligned(instance);
         }
         Ok(())
     })())
@@ -249,7 +249,7 @@ pub unsafe extern "C" fn voicevox_onnxruntime_init_once(
         let instance = VoicevoxOnnxruntime::init_once()?;
         unsafe {
             // SAFETY: ユーザーに要求している条件で十分
-            out_onnxruntime.as_ptr().write_unaligned(instance);
+            out_onnxruntime.write_unaligned(instance);
         }
         Ok(())
     })())
@@ -303,7 +303,7 @@ pub unsafe extern "C" fn voicevox_open_jtalk_rc_new(
     into_result_code_with_error((|| {
         let open_jtalk_dic_dir = ensure_utf8(CStr::from_ptr(open_jtalk_dic_dir))?;
         let open_jtalk = OpenJtalkRc::new(open_jtalk_dic_dir)?.into();
-        out_open_jtalk.as_ptr().write_unaligned(open_jtalk);
+        out_open_jtalk.write_unaligned(open_jtalk);
         Ok(())
     })())
 }
@@ -434,7 +434,7 @@ pub unsafe extern "C" fn voicevox_voice_model_new_from_path(
     into_result_code_with_error((|| {
         let path = ensure_utf8(CStr::from_ptr(path))?;
         let model = VoicevoxVoiceModel::from_path(path)?.into();
-        out_model.as_ptr().write_unaligned(model);
+        out_model.write_unaligned(model);
         Ok(())
     })())
 }
@@ -518,7 +518,7 @@ pub unsafe extern "C" fn voicevox_synthesizer_new(
         let options = options.into();
 
         let synthesizer = VoicevoxSynthesizer::new(onnxruntime, open_jtalk, &options)?.into();
-        out_synthesizer.as_ptr().write_unaligned(synthesizer);
+        out_synthesizer.write_unaligned(synthesizer);
         Ok(())
     })())
 }
@@ -681,7 +681,7 @@ pub unsafe extern "C" fn voicevox_onnxruntime_create_supported_devices_json(
     into_result_code_with_error((|| {
         let supported_devices =
             CString::new(onnxruntime.0.supported_devices()?.to_json().to_string()).unwrap();
-        output_supported_devices_json.as_ptr().write_unaligned(
+        output_supported_devices_json.write_unaligned(
             C_STRING_DROP_CHECKER
                 .whitelist(supported_devices)
                 .into_raw(),
@@ -733,7 +733,6 @@ pub unsafe extern "C" fn voicevox_synthesizer_create_audio_query_from_kana(
         let audio_query = CString::new(audio_query_model_to_json(&audio_query))
             .expect("should not contain '\\0'");
         output_audio_query_json
-            .as_ptr()
             .write_unaligned(C_STRING_DROP_CHECKER.whitelist(audio_query).into_raw());
         Ok(())
     })())
@@ -782,7 +781,6 @@ pub unsafe extern "C" fn voicevox_synthesizer_create_audio_query(
         let audio_query = CString::new(audio_query_model_to_json(&audio_query))
             .expect("should not contain '\\0'");
         output_audio_query_json
-            .as_ptr()
             .write_unaligned(C_STRING_DROP_CHECKER.whitelist(audio_query).into_raw());
         Ok(())
     })())
@@ -830,7 +828,6 @@ pub unsafe extern "C" fn voicevox_synthesizer_create_accent_phrases_from_kana(
         let accent_phrases = CString::new(accent_phrases_to_json(&accent_phrases))
             .expect("should not contain '\\0'");
         output_accent_phrases_json
-            .as_ptr()
             .write_unaligned(C_STRING_DROP_CHECKER.whitelist(accent_phrases).into_raw());
         Ok(())
     })())
@@ -877,7 +874,6 @@ pub unsafe extern "C" fn voicevox_synthesizer_create_accent_phrases(
         let accent_phrases = CString::new(accent_phrases_to_json(&accent_phrases))
             .expect("should not contain '\\0'");
         output_accent_phrases_json
-            .as_ptr()
             .write_unaligned(C_STRING_DROP_CHECKER.whitelist(accent_phrases).into_raw());
         Ok(())
     })())
@@ -917,7 +913,6 @@ pub unsafe extern "C" fn voicevox_synthesizer_replace_mora_data(
         let accent_phrases = CString::new(accent_phrases_to_json(&accent_phrases))
             .expect("should not contain '\\0'");
         output_accent_phrases_json
-            .as_ptr()
             .write_unaligned(C_STRING_DROP_CHECKER.whitelist(accent_phrases).into_raw());
         Ok(())
     })())
@@ -957,7 +952,6 @@ pub unsafe extern "C" fn voicevox_synthesizer_replace_phoneme_length(
         let accent_phrases = CString::new(accent_phrases_to_json(&accent_phrases))
             .expect("should not contain '\\0'");
         output_accent_phrases_json
-            .as_ptr()
             .write_unaligned(C_STRING_DROP_CHECKER.whitelist(accent_phrases).into_raw());
         Ok(())
     })())
@@ -997,7 +991,6 @@ pub unsafe extern "C" fn voicevox_synthesizer_replace_mora_pitch(
         let accent_phrases = CString::new(accent_phrases_to_json(&accent_phrases))
             .expect("should not contain '\\0'");
         output_accent_phrases_json
-            .as_ptr()
             .write_unaligned(C_STRING_DROP_CHECKER.whitelist(accent_phrases).into_raw());
         Ok(())
     })())
@@ -1347,7 +1340,7 @@ pub unsafe extern "C" fn voicevox_user_dict_add_word(
     into_result_code_with_error((|| {
         let word = word.read_unaligned().try_into_word()?;
         let uuid = user_dict.dict.add_word(word)?;
-        output_word_uuid.as_ptr().write_unaligned(uuid.into_bytes());
+        output_word_uuid.write_unaligned(uuid.into_bytes());
 
         Ok(())
     })())
@@ -1425,9 +1418,7 @@ pub unsafe extern "C" fn voicevox_user_dict_to_json(
     init_logger_once();
     let json = user_dict.dict.to_json();
     let json = CString::new(json).expect("\\0を含まない文字列であることが保証されている");
-    output_json
-        .as_ptr()
-        .write_unaligned(C_STRING_DROP_CHECKER.whitelist(json).into_raw());
+    output_json.write_unaligned(C_STRING_DROP_CHECKER.whitelist(json).into_raw());
     VoicevoxResultCode::VOICEVOX_RESULT_OK
 }
 
diff --git a/crates/voicevox_core_c_api/src/slice_owner.rs b/crates/voicevox_core_c_api/src/slice_owner.rs
index fa75add52..239847cb7 100644
--- a/crates/voicevox_core_c_api/src/slice_owner.rs
+++ b/crates/voicevox_core_c_api/src/slice_owner.rs
@@ -55,8 +55,8 @@ impl<T> SliceOwner<T> {
             );
         }
 
-        out_ptr.as_ptr().write_unaligned(ptr);
-        out_len.as_ptr().write_unaligned(len);
+        out_ptr.write_unaligned(ptr);
+        out_len.write_unaligned(len);
     }
 
     /// `own_and_lend`でC API利用者に貸し出したポインタに対応する`Box<[u8]>`をデストラクトする。
diff --git a/crates/voicevox_core_c_api/tests/e2e/log_mask.rs b/crates/voicevox_core_c_api/tests/e2e/log_mask.rs
index 93114976e..4e6d26482 100644
--- a/crates/voicevox_core_c_api/tests/e2e/log_mask.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/log_mask.rs
@@ -1,11 +1,12 @@
-use once_cell::sync::Lazy;
+use std::sync::LazyLock;
+
 use regex::{Regex, Replacer};
 
 use crate::assert_cdylib::Utf8Output;
 
 macro_rules! static_regex {
     ($regex:expr $(,)?) => {{
-        static REGEX: Lazy<Regex> = Lazy::new(|| $regex.parse().unwrap());
+        static REGEX: LazyLock<Regex> = LazyLock::new(|| $regex.parse().unwrap());
         &REGEX
     }};
 }
diff --git a/crates/voicevox_core_c_api/tests/e2e/snapshots.rs b/crates/voicevox_core_c_api/tests/e2e/snapshots.rs
index 249bc5f09..c4c181603 100644
--- a/crates/voicevox_core_c_api/tests/e2e/snapshots.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/snapshots.rs
@@ -10,7 +10,7 @@ macro_rules! section {
             $section_name: T,
         }
 
-        ::once_cell::sync::Lazy::new(|| {
+        ::std::sync::LazyLock::new(|| {
             let Snapshots { $section_name } =
                 ::toml::from_str(crate::snapshots::SNAPSHOTS_TOML).unwrap();
             $section_name
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/compatible_engine.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/compatible_engine.rs
index 79b1d5dc8..e69ad68fd 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/compatible_engine.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/compatible_engine.rs
@@ -1,10 +1,10 @@
 // エンジンを起動してyukarin_s・yukarin_sa・decodeの推論を行う
 
 use std::ffi::CStr;
+use std::sync::LazyLock;
 
 use assert_cmd::assert::AssertResult;
 use libloading::Library;
-use once_cell::sync::Lazy;
 use serde::{Deserialize, Serialize};
 use voicevox_core::SupportedDevices;
 
@@ -106,7 +106,7 @@ impl assert_cdylib::TestCase for TestCase {
     }
 }
 
-static SNAPSHOTS: Lazy<Snapshots> = snapshots::section!(compatible_engine);
+static SNAPSHOTS: LazyLock<Snapshots> = snapshots::section!(compatible_engine);
 
 #[derive(Deserialize)]
 struct Snapshots {
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/compatible_engine_load_model_before_initialize.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/compatible_engine_load_model_before_initialize.rs
index 18482f0de..7b709a83d 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/compatible_engine_load_model_before_initialize.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/compatible_engine_load_model_before_initialize.rs
@@ -1,10 +1,9 @@
 // initialize前にモデルを読み込むとエラーになるテスト
 
-use std::ffi::CStr;
+use std::{ffi::CStr, sync::LazyLock};
 
 use assert_cmd::assert::AssertResult;
 use libloading::Library;
-use once_cell::sync::Lazy;
 use serde::{Deserialize, Serialize};
 use test_util::c_api::CApi;
 
@@ -43,7 +42,7 @@ impl assert_cdylib::TestCase for TestCase {
     }
 }
 
-static SNAPSHOTS: Lazy<Snapshots> =
+static SNAPSHOTS: LazyLock<Snapshots> =
     snapshots::section!(compatible_engine_load_model_before_initialize);
 
 #[derive(Deserialize)]
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/global_info.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/global_info.rs
index d2a8fc7e7..e3303db4f 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/global_info.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/global_info.rs
@@ -1,8 +1,7 @@
-use std::{collections::HashMap, ffi::CStr, mem::MaybeUninit, str};
+use std::{collections::HashMap, ffi::CStr, mem::MaybeUninit, str, sync::LazyLock};
 
 use assert_cmd::assert::AssertResult;
 use libloading::Library;
-use once_cell::sync::Lazy;
 use serde::{Deserialize, Serialize};
 use serde_with::{serde_as, DisplayFromStr};
 use test_util::c_api::{self, CApi, VoicevoxResultCode};
@@ -99,7 +98,7 @@ impl assert_cdylib::TestCase for TestCase {
     }
 }
 
-static SNAPSHOTS: Lazy<Snapshots> = snapshots::section!(global_info);
+static SNAPSHOTS: LazyLock<Snapshots> = snapshots::section!(global_info);
 
 #[serde_as]
 #[derive(Deserialize)]
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/simple_tts.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/simple_tts.rs
index 4635b0271..a4381f74d 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/simple_tts.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/simple_tts.rs
@@ -1,8 +1,7 @@
-use std::{collections::HashMap, ffi::CString, mem::MaybeUninit};
+use std::{collections::HashMap, ffi::CString, mem::MaybeUninit, sync::LazyLock};
 
 use assert_cmd::assert::AssertResult;
 use libloading::Library;
-use once_cell::sync::Lazy;
 use serde::{Deserialize, Serialize};
 use test_util::{
     c_api::{self, CApi, VoicevoxInitializeOptions, VoicevoxResultCode},
@@ -115,7 +114,7 @@ impl assert_cdylib::TestCase for TestCase {
     }
 }
 
-static SNAPSHOTS: Lazy<Snapshots> = snapshots::section!(simple_tts);
+static SNAPSHOTS: LazyLock<Snapshots> = snapshots::section!(simple_tts);
 
 #[derive(Deserialize)]
 struct Snapshots {
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/synthesizer_new_output_json.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/synthesizer_new_output_json.rs
index 8a2fd1951..9ac8f4b35 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/synthesizer_new_output_json.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/synthesizer_new_output_json.rs
@@ -1,11 +1,11 @@
 use std::{
     ffi::{CStr, CString},
     mem::MaybeUninit,
+    sync::LazyLock,
 };
 
 use assert_cmd::assert::AssertResult;
 use libloading::Library;
-use once_cell::sync::Lazy;
 use serde::{Deserialize, Serialize};
 
 use test_util::{
@@ -104,7 +104,7 @@ impl assert_cdylib::TestCase for TestCase {
     }
 }
 
-static SNAPSHOTS: Lazy<Snapshots> = snapshots::section!(synthesizer_new_output_json);
+static SNAPSHOTS: LazyLock<Snapshots> = snapshots::section!(synthesizer_new_output_json);
 
 #[derive(Deserialize)]
 struct Snapshots {
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/tts_via_audio_query.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/tts_via_audio_query.rs
index 728f21339..0f2ff5fc8 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/tts_via_audio_query.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/tts_via_audio_query.rs
@@ -1,8 +1,7 @@
-use std::{collections::HashMap, ffi::CString, mem::MaybeUninit};
+use std::{collections::HashMap, ffi::CString, mem::MaybeUninit, sync::LazyLock};
 
 use assert_cmd::assert::AssertResult;
 use libloading::Library;
-use once_cell::sync::Lazy;
 use serde::{Deserialize, Serialize};
 use test_util::{
     c_api::{self, CApi, VoicevoxInitializeOptions, VoicevoxResultCode},
@@ -127,7 +126,7 @@ impl assert_cdylib::TestCase for TestCase {
     }
 }
 
-static SNAPSHOTS: Lazy<Snapshots> = snapshots::section!(tts_via_audio_query);
+static SNAPSHOTS: LazyLock<Snapshots> = snapshots::section!(tts_via_audio_query);
 
 #[derive(Deserialize)]
 struct Snapshots {
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_load.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_load.rs
index 646c5647b..64e062251 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_load.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_load.rs
@@ -1,16 +1,16 @@
 // ユーザー辞書の登録によって読みが変化することを確認するテスト。
 // 辞書ロード前後でAudioQueryのkanaが変化するかどうかで確認する。
 
-use assert_cmd::assert::AssertResult;
-use once_cell::sync::Lazy;
 use std::ffi::{CStr, CString};
 use std::mem::MaybeUninit;
-use test_util::OPEN_JTALK_DIC_DIR;
+use std::sync::LazyLock;
 
+use assert_cmd::assert::AssertResult;
 use cstr::cstr;
 use libloading::Library;
 use serde::{Deserialize, Serialize};
 use test_util::c_api::{self, CApi, VoicevoxInitializeOptions, VoicevoxResultCode};
+use test_util::OPEN_JTALK_DIC_DIR;
 
 use crate::{
     assert_cdylib::{self, case, Utf8Output},
@@ -144,7 +144,7 @@ impl assert_cdylib::TestCase for TestCase {
     }
 }
 
-static SNAPSHOTS: Lazy<Snapshots> = snapshots::section!(user_dict);
+static SNAPSHOTS: LazyLock<Snapshots> = snapshots::section!(user_dict);
 
 #[derive(Deserialize)]
 struct Snapshots {
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_manipulate.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_manipulate.rs
index bec0d61b5..d3c37f127 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_manipulate.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_manipulate.rs
@@ -1,11 +1,12 @@
 // ユーザー辞書の操作をテストする。
 
-use assert_cmd::assert::AssertResult;
-use once_cell::sync::Lazy;
 use std::{
     ffi::{CStr, CString},
     mem::MaybeUninit,
+    sync::LazyLock,
 };
+
+use assert_cmd::assert::AssertResult;
 use tempfile::NamedTempFile;
 use uuid::Uuid;
 
@@ -149,7 +150,7 @@ impl assert_cdylib::TestCase for TestCase {
     }
 }
 
-static SNAPSHOTS: Lazy<Snapshots> = snapshots::section!(user_dict_manipulate);
+static SNAPSHOTS: LazyLock<Snapshots> = snapshots::section!(user_dict_manipulate);
 
 #[derive(Deserialize)]
 struct Snapshots {
diff --git a/crates/voicevox_core_java_api/Cargo.toml b/crates/voicevox_core_java_api/Cargo.toml
index ec4e2d616..aed67c058 100644
--- a/crates/voicevox_core_java_api/Cargo.toml
+++ b/crates/voicevox_core_java_api/Cargo.toml
@@ -14,7 +14,6 @@ derive_more.workspace = true
 duplicate.workspace = true
 easy-ext.workspace = true
 jni.workspace = true
-once_cell.workspace = true
 pretty_assertions = "1.3.0"
 rstest.workspace = true
 serde_json = { workspace = true, features = ["preserve_order"] }

From a98b98e55f78fa867dfe13fcee3e91e93ca820d9 Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Mon, 12 Aug 2024 23:28:36 +0900
Subject: [PATCH 19/36] =?UTF-8?q?ci:=20Renovate=20v38=E3=81=AB=E9=81=A9?=
 =?UTF-8?q?=E5=BF=9C=E3=81=99=E3=82=8B=20(#817)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 renovate.json | 11 +++++++++--
 1 file changed, 9 insertions(+), 2 deletions(-)

diff --git a/renovate.json b/renovate.json
index 5704cd5f4..19e437554 100644
--- a/renovate.json
+++ b/renovate.json
@@ -8,12 +8,19 @@
     {
       "groupSlug": "rust",
       "groupName": "Rust",
-      "matchDepPatterns": "^Rust$"
+      "matchPackagePatterns": [
+        "^rust-lang/rust$"
+      ]
     },
     {
       "groupSlug": "others",
       "groupName": "Others",
-      "excludeDepPatterns": "^Rust$",
+      "matchPackagePatterns": [
+        "*"
+      ],
+      "excludePackagePatterns": [
+        "^rust-lang/rust$"
+      ],
       "dependencyDashboardApproval": true
     }
   ],

From 983f2e11730d9718f69b2e413b4ab6c320265181 Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Tue, 13 Aug 2024 22:55:56 +0900
Subject: [PATCH 20/36] =?UTF-8?q?ci:=20Renovate=E3=81=AEdatasource?=
 =?UTF-8?q?=E3=82=92`github-tags`=E3=81=AB=E3=81=99=E3=82=8B=20(#819)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 renovate.json | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/renovate.json b/renovate.json
index 19e437554..f56767ea0 100644
--- a/renovate.json
+++ b/renovate.json
@@ -35,7 +35,7 @@
       ],
       "depNameTemplate": "Rust",
       "packageNameTemplate": "rust-lang/rust",
-      "datasourceTemplate": "github-releases"
+      "datasourceTemplate": "github-tags"
     }
   ]
 }

From d6765462fd246d22306a7badd438d34745345231 Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Wed, 14 Aug 2024 00:00:48 +0900
Subject: [PATCH 21/36] chore(deps): update dependency rust to v1.80.1 (#820)

Co-authored-by: renovate[bot] <29139614+renovate[bot]@users.noreply.github.com>
---
 rust-toolchain | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/rust-toolchain b/rust-toolchain
index aaceec04e..97e98527c 100644
--- a/rust-toolchain
+++ b/rust-toolchain
@@ -1 +1 @@
-1.80.0
+1.80.1

From a15753f4b4c9196c870b09de39ee75e37a19a4ed Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Sun, 18 Aug 2024 04:18:04 +0900
Subject: [PATCH 22/36] =?UTF-8?q?update:=20ort=E3=82=92=E6=9B=B4=E6=96=B0?=
 =?UTF-8?q?=20(#822)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 Cargo.lock                                    | 25 ++++++++++++++-----
 Cargo.toml                                    |  2 +-
 .../src/infer/runtimes/onnxruntime.rs         |  4 +--
 3 files changed, 22 insertions(+), 9 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index 3da1581da..7d70c15b8 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -2649,9 +2649,9 @@ checksum = "8b870d8c151b6f2fb93e84a13146138f05d02ed11c7e7c54f8826aaaf7c9f184"
 
 [[package]]
 name = "pkg-config"
-version = "0.3.25"
+version = "0.3.30"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "1df8c4ec4b0627e53bdf214615ad287367e482558cf84b109250b37464dc03ae"
+checksum = "d231b230927b5e4ad203db57bbcbee2802f6bce620b1e4a9024a07d94e2907ec"
 
 [[package]]
 name = "plist"
@@ -3550,6 +3550,17 @@ dependencies = [
  "winapi",
 ]
 
+[[package]]
+name = "socks"
+version = "0.3.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f0c3dbbd9ae980613c6dd8e28a9407b50509d3803b57624d5dfe8315218cd58b"
+dependencies = [
+ "byteorder",
+ "libc",
+ "winapi",
+]
+
 [[package]]
 name = "spin"
 version = "0.5.2"
@@ -4147,6 +4158,7 @@ dependencies = [
  "once_cell",
  "rustls 0.21.7",
  "rustls-webpki",
+ "socks",
  "url",
  "webpki-roots 0.25.4",
 ]
@@ -4199,8 +4211,8 @@ checksum = "49874b5167b65d7193b8aba1567f5c7d93d001cafc34600cee003eda787e483f"
 
 [[package]]
 name = "voicevox-ort"
-version = "2.0.0-rc.2"
-source = "git+https://github.com/VOICEVOX/ort.git?rev=07c047c449b959d8f76593046e139bae520d59c3#07c047c449b959d8f76593046e139bae520d59c3"
+version = "2.0.0-rc.4"
+source = "git+https://github.com/VOICEVOX/ort.git?rev=8627833456a69e7841ae2a29fd184752df8de8d9#8627833456a69e7841ae2a29fd184752df8de8d9"
 dependencies = [
  "anyhow",
  "half",
@@ -4216,10 +4228,11 @@ dependencies = [
 
 [[package]]
 name = "voicevox-ort-sys"
-version = "2.0.0-rc.2"
-source = "git+https://github.com/VOICEVOX/ort.git?rev=07c047c449b959d8f76593046e139bae520d59c3#07c047c449b959d8f76593046e139bae520d59c3"
+version = "2.0.0-rc.4"
+source = "git+https://github.com/VOICEVOX/ort.git?rev=8627833456a69e7841ae2a29fd184752df8de8d9#8627833456a69e7841ae2a29fd184752df8de8d9"
 dependencies = [
  "flate2",
+ "pkg-config",
  "sha2",
  "tar",
  "ureq",
diff --git a/Cargo.toml b/Cargo.toml
index 2ada5cbb5..d72625c5f 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -92,7 +92,7 @@ zip = "0.6.3"
 
 [workspace.dependencies.voicevox-ort]
 git = "https://github.com/VOICEVOX/ort.git"
-rev = "07c047c449b959d8f76593046e139bae520d59c3"
+rev = "8627833456a69e7841ae2a29fd184752df8de8d9"
 
 [workspace.dependencies.open_jtalk]
 git = "https://github.com/VOICEVOX/open_jtalk-rs.git"
diff --git a/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs b/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs
index 15ba963eb..7d975f7f7 100644
--- a/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs
+++ b/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs
@@ -5,7 +5,7 @@ use duplicate::duplicate_item;
 use ndarray::{Array, Dimension};
 use ort::{
     CPUExecutionProvider, CUDAExecutionProvider, DirectMLExecutionProvider, ExecutionProvider as _,
-    GraphOptimizationLevel, IntoTensorElementType, TensorElementType, ValueType,
+    GraphOptimizationLevel, PrimitiveTensorElementType, TensorElementType, ValueType,
 };
 
 use crate::{
@@ -209,7 +209,7 @@ impl OnnxruntimeRunContext<'_> {
     fn push_input(
         &mut self,
         input: Array<
-            impl IntoTensorElementType + Debug + Clone + 'static,
+            impl PrimitiveTensorElementType + Debug + Clone + 'static,
             impl Dimension + 'static,
         >,
     ) -> anyhow::Result<()> {

From 317b433e985c5612510dec53c347a098f35361f0 Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Tue, 20 Aug 2024 02:29:07 +0900
Subject: [PATCH 23/36] =?UTF-8?q?change:=20`InferenceFailed`=20=E2=86=92?=
 =?UTF-8?q?=20`RunModel`=20(#823)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 crates/voicevox_core/src/error.rs             |  6 +-
 crates/voicevox_core/src/infer/session_set.rs |  2 +-
 .../include/voicevox_core.h                   |  2 +-
 crates/voicevox_core_c_api/src/helpers.rs     |  2 +-
 crates/voicevox_core_c_api/src/result_code.rs |  4 +-
 .../tests/e2e/testcases/global_info.rs        |  2 +-
 .../hiroshiba/voicevoxcore/Synthesizer.java   | 67 +++++++++----------
 .../exceptions/InferenceFailedException.java  | 14 ----
 .../exceptions/RunModelException.java         | 14 ++++
 .../voicevoxcore/SynthesizerTest.java         |  8 +--
 .../hiroshiba/voicevoxcore/UserDictTest.java  |  5 +-
 crates/voicevox_core_java_api/src/common.rs   |  2 +-
 .../python/voicevox_core/__init__.py          |  4 +-
 .../python/voicevox_core/_rust/__init__.pyi   |  2 +-
 .../voicevox_core_python_api/src/convert.rs   |  6 +-
 crates/voicevox_core_python_api/src/lib.rs    |  2 +-
 16 files changed, 68 insertions(+), 74 deletions(-)
 delete mode 100644 crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/exceptions/InferenceFailedException.java
 create mode 100644 crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/exceptions/RunModelException.java

diff --git a/crates/voicevox_core/src/error.rs b/crates/voicevox_core/src/error.rs
index 0125b1cc6..33775bda0 100644
--- a/crates/voicevox_core/src/error.rs
+++ b/crates/voicevox_core/src/error.rs
@@ -47,7 +47,7 @@ impl Error {
             ErrorRepr::GetSupportedDevices(_) => ErrorKind::GetSupportedDevices,
             ErrorRepr::StyleNotFound { .. } => ErrorKind::StyleNotFound,
             ErrorRepr::ModelNotFound { .. } => ErrorKind::ModelNotFound,
-            ErrorRepr::InferenceFailed { .. } => ErrorKind::InferenceFailed,
+            ErrorRepr::RunModel { .. } => ErrorKind::RunModel,
             ErrorRepr::ExtractFullContextLabel(_) => ErrorKind::ExtractFullContextLabel,
             ErrorRepr::ParseKana(_) => ErrorKind::ParseKana,
             ErrorRepr::LoadUserDict(_) => ErrorKind::LoadUserDict,
@@ -97,7 +97,7 @@ pub(crate) enum ErrorRepr {
     ModelNotFound { model_id: VoiceModelId },
 
     #[error("推論に失敗しました")]
-    InferenceFailed(#[source] anyhow::Error),
+    RunModel(#[source] anyhow::Error),
 
     #[error(transparent)]
     ExtractFullContextLabel(#[from] FullContextLabelError),
@@ -149,7 +149,7 @@ pub enum ErrorKind {
     /// 音声モデルIDに対する音声モデルが見つからなかった。
     ModelNotFound,
     /// 推論に失敗した。
-    InferenceFailed,
+    RunModel,
     /// コンテキストラベル出力に失敗した。
     ExtractFullContextLabel,
     /// AquesTalk風記法のテキストの解析に失敗した。
diff --git a/crates/voicevox_core/src/infer/session_set.rs b/crates/voicevox_core/src/infer/session_set.rs
index ad85e93ac..e94fff962 100644
--- a/crates/voicevox_core/src/infer/session_set.rs
+++ b/crates/voicevox_core/src/infer/session_set.rs
@@ -95,7 +95,7 @@ impl<R: InferenceRuntime, I: InferenceInputSignature> InferenceSessionCell<R, I>
     ) -> crate::Result<<I::Signature as InferenceSignature>::Output> {
         let inner = &mut self.inner.lock().unwrap();
         (|| R::run(input.make_run_context::<R>(inner)?)?.try_into())()
-            .map_err(ErrorRepr::InferenceFailed)
+            .map_err(ErrorRepr::RunModel)
             .map_err(Into::into)
     }
 }
diff --git a/crates/voicevox_core_c_api/include/voicevox_core.h b/crates/voicevox_core_c_api/include/voicevox_core.h
index fe514dfa9..422f32978 100644
--- a/crates/voicevox_core_c_api/include/voicevox_core.h
+++ b/crates/voicevox_core_c_api/include/voicevox_core.h
@@ -141,7 +141,7 @@ enum VoicevoxResultCode
   /**
    * 推論に失敗した
    */
-  VOICEVOX_RESULT_INFERENCE_ERROR = 8,
+  VOICEVOX_RESULT_RUN_MODEL_ERROR = 8,
   /**
    * コンテキストラベル出力に失敗した
    */
diff --git a/crates/voicevox_core_c_api/src/helpers.rs b/crates/voicevox_core_c_api/src/helpers.rs
index af4057d09..26a60d033 100644
--- a/crates/voicevox_core_c_api/src/helpers.rs
+++ b/crates/voicevox_core_c_api/src/helpers.rs
@@ -39,7 +39,7 @@ pub(crate) fn into_result_code_with_error(result: CApiResult<()>) -> VoicevoxRes
                 GetSupportedDevices => VOICEVOX_RESULT_GET_SUPPORTED_DEVICES_ERROR,
                 StyleNotFound => VOICEVOX_RESULT_STYLE_NOT_FOUND_ERROR,
                 ModelNotFound => VOICEVOX_RESULT_MODEL_NOT_FOUND_ERROR,
-                InferenceFailed => VOICEVOX_RESULT_INFERENCE_ERROR,
+                RunModel => VOICEVOX_RESULT_RUN_MODEL_ERROR,
                 ExtractFullContextLabel => VOICEVOX_RESULT_EXTRACT_FULL_CONTEXT_LABEL_ERROR,
                 ParseKana => VOICEVOX_RESULT_PARSE_KANA_ERROR,
                 LoadUserDict => VOICEVOX_RESULT_LOAD_USER_DICT_ERROR,
diff --git a/crates/voicevox_core_c_api/src/result_code.rs b/crates/voicevox_core_c_api/src/result_code.rs
index 085f2b8c6..bfdbc8444 100644
--- a/crates/voicevox_core_c_api/src/result_code.rs
+++ b/crates/voicevox_core_c_api/src/result_code.rs
@@ -24,7 +24,7 @@ pub enum VoicevoxResultCode {
     /// 音声モデルIDに対する音声モデルが見つからなかった
     VOICEVOX_RESULT_MODEL_NOT_FOUND_ERROR = 7,
     /// 推論に失敗した
-    VOICEVOX_RESULT_INFERENCE_ERROR = 8,
+    VOICEVOX_RESULT_RUN_MODEL_ERROR = 8,
     /// コンテキストラベル出力に失敗した
     VOICEVOX_RESULT_EXTRACT_FULL_CONTEXT_LABEL_ERROR = 11,
     /// 無効なutf8文字列が入力された
@@ -83,7 +83,7 @@ pub(crate) const fn error_result_to_message(result_code: VoicevoxResultCode) ->
             "指定されたIDに対する音声モデルが見つかりませんでした。読み込まれていないか、読み込み\
              が既に解除されています"
         ),
-        VOICEVOX_RESULT_INFERENCE_ERROR => cstr!("推論に失敗しました"),
+        VOICEVOX_RESULT_RUN_MODEL_ERROR => cstr!("推論に失敗しました"),
         VOICEVOX_RESULT_EXTRACT_FULL_CONTEXT_LABEL_ERROR => {
             cstr!("入力テキストからのフルコンテキストラベル抽出に失敗しました")
         }
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/global_info.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/global_info.rs
index e3303db4f..a36a7d9bd 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/global_info.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/global_info.rs
@@ -54,7 +54,7 @@ impl assert_cdylib::TestCase for TestCase {
             c_api::VoicevoxResultCode_VOICEVOX_RESULT_GPU_SUPPORT_ERROR,
             c_api::VoicevoxResultCode_VOICEVOX_RESULT_STYLE_NOT_FOUND_ERROR,
             c_api::VoicevoxResultCode_VOICEVOX_RESULT_MODEL_NOT_FOUND_ERROR,
-            c_api::VoicevoxResultCode_VOICEVOX_RESULT_INFERENCE_ERROR,
+            c_api::VoicevoxResultCode_VOICEVOX_RESULT_RUN_MODEL_ERROR,
             c_api::VoicevoxResultCode_VOICEVOX_RESULT_EXTRACT_FULL_CONTEXT_LABEL_ERROR,
             c_api::VoicevoxResultCode_VOICEVOX_RESULT_INVALID_UTF8_INPUT_ERROR,
             c_api::VoicevoxResultCode_VOICEVOX_RESULT_PARSE_KANA_ERROR,
diff --git a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/Synthesizer.java b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/Synthesizer.java
index 8d5694267..2fac70741 100644
--- a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/Synthesizer.java
+++ b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/Synthesizer.java
@@ -7,8 +7,8 @@
 import java.util.List;
 import java.util.Optional;
 import java.util.UUID;
-import jp.hiroshiba.voicevoxcore.exceptions.InferenceFailedException;
 import jp.hiroshiba.voicevoxcore.exceptions.InvalidModelDataException;
+import jp.hiroshiba.voicevoxcore.exceptions.RunModelException;
 
 /**
  * 音声シンセサイザ。
@@ -99,11 +99,10 @@ public boolean isLoadedVoiceModel(UUID voiceModelId) {
    * @param kana AquesTalk風記法。
    * @param styleId スタイルID。
    * @return {@link AudioQuery}。
-   * @throws InferenceFailedException 推論に失敗した場合。
+   * @throws RunModelException 推論に失敗した場合。
    */
   @Nonnull
-  public AudioQuery createAudioQueryFromKana(String kana, int styleId)
-      throws InferenceFailedException {
+  public AudioQuery createAudioQueryFromKana(String kana, int styleId) throws RunModelException {
     if (!Utils.isU32(styleId)) {
       throw new IllegalArgumentException("styleId");
     }
@@ -123,10 +122,10 @@ public AudioQuery createAudioQueryFromKana(String kana, int styleId)
    * @param text 日本語のテキスト。
    * @param styleId スタイルID。
    * @return {@link AudioQuery}。
-   * @throws InferenceFailedException 推論に失敗した場合。
+   * @throws RunModelException 推論に失敗した場合。
    */
   @Nonnull
-  public AudioQuery createAudioQuery(String text, int styleId) throws InferenceFailedException {
+  public AudioQuery createAudioQuery(String text, int styleId) throws RunModelException {
     if (!Utils.isU32(styleId)) {
       throw new IllegalArgumentException("styleId");
     }
@@ -146,11 +145,11 @@ public AudioQuery createAudioQuery(String text, int styleId) throws InferenceFai
    * @param kana AquesTalk風記法。
    * @param styleId スタイルID。
    * @return {@link AccentPhrase} のリスト。
-   * @throws InferenceFailedException 推論に失敗した場合。
+   * @throws RunModelException 推論に失敗した場合。
    */
   @Nonnull
   public List<AccentPhrase> createAccentPhrasesFromKana(String kana, int styleId)
-      throws InferenceFailedException {
+      throws RunModelException {
     String accentPhrasesJson = rsAccentPhrasesFromKana(kana, styleId);
     Gson gson = new Gson();
     AccentPhrase[] rawAccentPhrases = gson.fromJson(accentPhrasesJson, AccentPhrase[].class);
@@ -166,11 +165,10 @@ public List<AccentPhrase> createAccentPhrasesFromKana(String kana, int styleId)
    * @param text 日本語のテキスト。
    * @param styleId スタイルID。
    * @return {@link AccentPhrase} のリスト。
-   * @throws InferenceFailedException 推論に失敗した場合。
+   * @throws RunModelException 推論に失敗した場合。
    */
   @Nonnull
-  public List<AccentPhrase> createAccentPhrases(String text, int styleId)
-      throws InferenceFailedException {
+  public List<AccentPhrase> createAccentPhrases(String text, int styleId) throws RunModelException {
     String accentPhrasesJson = rsAccentPhrases(text, styleId);
     Gson gson = new Gson();
     AccentPhrase[] rawAccentPhrases = gson.fromJson(accentPhrasesJson, AccentPhrase[].class);
@@ -186,11 +184,11 @@ public List<AccentPhrase> createAccentPhrases(String text, int styleId)
    * @param accentPhrases 変更元のアクセント句の配列。
    * @param styleId スタイルID。
    * @return 変更後のアクセント句の配列。
-   * @throws InferenceFailedException 推論に失敗した場合。
+   * @throws RunModelException 推論に失敗した場合。
    */
   @Nonnull
   public List<AccentPhrase> replaceMoraData(List<AccentPhrase> accentPhrases, int styleId)
-      throws InferenceFailedException {
+      throws RunModelException {
     if (!Utils.isU32(styleId)) {
       throw new IllegalArgumentException("styleId");
     }
@@ -206,11 +204,11 @@ public List<AccentPhrase> replaceMoraData(List<AccentPhrase> accentPhrases, int
    * @param accentPhrases 変更元のアクセント句の配列。
    * @param styleId スタイルID。
    * @return 変更後のアクセント句の配列。
-   * @throws InferenceFailedException 推論に失敗した場合。
+   * @throws RunModelException 推論に失敗した場合。
    */
   @Nonnull
   public List<AccentPhrase> replacePhonemeLength(List<AccentPhrase> accentPhrases, int styleId)
-      throws InferenceFailedException {
+      throws RunModelException {
     if (!Utils.isU32(styleId)) {
       throw new IllegalArgumentException("styleId");
     }
@@ -226,11 +224,11 @@ public List<AccentPhrase> replacePhonemeLength(List<AccentPhrase> accentPhrases,
    * @param accentPhrases 変更元のアクセント句の配列。
    * @param styleId スタイルID。
    * @return 変更後のアクセント句の配列。
-   * @throws InferenceFailedException 推論に失敗した場合。
+   * @throws RunModelException 推論に失敗した場合。
    */
   @Nonnull
   public List<AccentPhrase> replaceMoraPitch(List<AccentPhrase> accentPhrases, int styleId)
-      throws InferenceFailedException {
+      throws RunModelException {
     if (!Utils.isU32(styleId)) {
       throw new IllegalArgumentException("styleId");
     }
@@ -293,43 +291,40 @@ public TtsConfigurator tts(String text, int styleId) {
   private native boolean rsIsLoadedVoiceModel(UUID voiceModelId);
 
   @Nonnull
-  private native String rsAudioQueryFromKana(String kana, int styleId)
-      throws InferenceFailedException;
+  private native String rsAudioQueryFromKana(String kana, int styleId) throws RunModelException;
 
   @Nonnull
-  private native String rsAudioQuery(String text, int styleId) throws InferenceFailedException;
+  private native String rsAudioQuery(String text, int styleId) throws RunModelException;
 
   @Nonnull
-  private native String rsAccentPhrasesFromKana(String kana, int styleId)
-      throws InferenceFailedException;
+  private native String rsAccentPhrasesFromKana(String kana, int styleId) throws RunModelException;
 
   @Nonnull
-  private native String rsAccentPhrases(String text, int styleId) throws InferenceFailedException;
+  private native String rsAccentPhrases(String text, int styleId) throws RunModelException;
 
   @Nonnull
   private native String rsReplaceMoraData(String accentPhrasesJson, int styleId, boolean kana)
-      throws InferenceFailedException;
+      throws RunModelException;
 
   @Nonnull
   private native String rsReplacePhonemeLength(String accentPhrasesJson, int styleId, boolean kana)
-      throws InferenceFailedException;
+      throws RunModelException;
 
   @Nonnull
   private native String rsReplaceMoraPitch(String accentPhrasesJson, int styleId, boolean kana)
-      throws InferenceFailedException;
+      throws RunModelException;
 
   @Nonnull
   private native byte[] rsSynthesis(
-      String queryJson, int styleId, boolean enableInterrogativeUpspeak)
-      throws InferenceFailedException;
+      String queryJson, int styleId, boolean enableInterrogativeUpspeak) throws RunModelException;
 
   @Nonnull
   private native byte[] rsTtsFromKana(String kana, int styleId, boolean enableInterrogativeUpspeak)
-      throws InferenceFailedException;
+      throws RunModelException;
 
   @Nonnull
   private native byte[] rsTts(String text, int styleId, boolean enableInterrogativeUpspeak)
-      throws InferenceFailedException;
+      throws RunModelException;
 
   private native void rsDrop();
 
@@ -436,10 +431,10 @@ public SynthesisConfigurator interrogativeUpspeak(boolean interrogativeUpspeak)
      * {@link AudioQuery} から音声合成する。
      *
      * @return 音声データ。
-     * @throws InferenceFailedException 推論に失敗した場合。
+     * @throws RunModelException 推論に失敗した場合。
      */
     @Nonnull
-    public byte[] execute() throws InferenceFailedException {
+    public byte[] execute() throws RunModelException {
       if (!Utils.isU32(styleId)) {
         throw new IllegalArgumentException("styleId");
       }
@@ -481,10 +476,10 @@ public TtsFromKanaConfigurator interrogativeUpspeak(boolean interrogativeUpspeak
      * {@link AudioQuery} から音声合成する。
      *
      * @return 音声データ。
-     * @throws InferenceFailedException 推論に失敗した場合。
+     * @throws RunModelException 推論に失敗した場合。
      */
     @Nonnull
-    public byte[] execute() throws InferenceFailedException {
+    public byte[] execute() throws RunModelException {
       if (!Utils.isU32(styleId)) {
         throw new IllegalArgumentException("styleId");
       }
@@ -524,10 +519,10 @@ public TtsConfigurator interrogativeUpspeak(boolean interrogativeUpspeak) {
      * {@link AudioQuery} から音声合成する。
      *
      * @return 音声データ。
-     * @throws InferenceFailedException 推論に失敗した場合。
+     * @throws RunModelException 推論に失敗した場合。
      */
     @Nonnull
-    public byte[] execute() throws InferenceFailedException {
+    public byte[] execute() throws RunModelException {
       if (!Utils.isU32(styleId)) {
         throw new IllegalArgumentException("styleId");
       }
diff --git a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/exceptions/InferenceFailedException.java b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/exceptions/InferenceFailedException.java
deleted file mode 100644
index 499a530df..000000000
--- a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/exceptions/InferenceFailedException.java
+++ /dev/null
@@ -1,14 +0,0 @@
-package jp.hiroshiba.voicevoxcore.exceptions;
-
-import java.io.IOException;
-
-/** 推論に失敗した。 */
-public class InferenceFailedException extends IOException {
-  public InferenceFailedException(String message) {
-    super(message);
-  }
-
-  public InferenceFailedException(String message, Throwable cause) {
-    super(message, cause);
-  }
-}
diff --git a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/exceptions/RunModelException.java b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/exceptions/RunModelException.java
new file mode 100644
index 000000000..67d7f061f
--- /dev/null
+++ b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/exceptions/RunModelException.java
@@ -0,0 +1,14 @@
+package jp.hiroshiba.voicevoxcore.exceptions;
+
+import java.io.IOException;
+
+/** 推論に失敗した。 */
+public class RunModelException extends IOException {
+  public RunModelException(String message) {
+    super(message);
+  }
+
+  public RunModelException(String message, Throwable cause) {
+    super(message, cause);
+  }
+}
diff --git a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/SynthesizerTest.java b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/SynthesizerTest.java
index 4de2f617b..0dfa17ea3 100644
--- a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/SynthesizerTest.java
+++ b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/SynthesizerTest.java
@@ -8,8 +8,8 @@
 import static org.junit.jupiter.api.Assertions.assertTrue;
 
 import java.util.List;
-import jp.hiroshiba.voicevoxcore.exceptions.InferenceFailedException;
 import jp.hiroshiba.voicevoxcore.exceptions.InvalidModelDataException;
+import jp.hiroshiba.voicevoxcore.exceptions.RunModelException;
 import org.junit.jupiter.api.Test;
 
 class SynthesizerTest extends TestUtils {
@@ -67,7 +67,7 @@ void checkModel() throws InvalidModelDataException {
   }
 
   @Test
-  void checkAudioQuery() throws InferenceFailedException, InvalidModelDataException {
+  void checkAudioQuery() throws RunModelException, InvalidModelDataException {
     VoiceModel model = loadModel();
     Onnxruntime onnxruntime = loadOnnxruntime();
     OpenJtalk openJtalk = loadOpenJtalk();
@@ -79,7 +79,7 @@ void checkAudioQuery() throws InferenceFailedException, InvalidModelDataExceptio
   }
 
   @Test
-  void checkAccentPhrases() throws InferenceFailedException, InvalidModelDataException {
+  void checkAccentPhrases() throws RunModelException, InvalidModelDataException {
     VoiceModel model = loadModel();
     OpenJtalk openJtalk = loadOpenJtalk();
     Onnxruntime onnxruntime = loadOnnxruntime();
@@ -110,7 +110,7 @@ void checkAccentPhrases() throws InferenceFailedException, InvalidModelDataExcep
   }
 
   @Test
-  void checkTts() throws InferenceFailedException, InvalidModelDataException {
+  void checkTts() throws RunModelException, InvalidModelDataException {
     VoiceModel model = loadModel();
     Onnxruntime onnxruntime = loadOnnxruntime();
     OpenJtalk openJtalk = loadOpenJtalk();
diff --git a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/UserDictTest.java b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/UserDictTest.java
index 5300b81f3..2fcfc06ab 100644
--- a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/UserDictTest.java
+++ b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/UserDictTest.java
@@ -4,9 +4,9 @@
 
 import java.nio.file.Files;
 import java.nio.file.Path;
-import jp.hiroshiba.voicevoxcore.exceptions.InferenceFailedException;
 import jp.hiroshiba.voicevoxcore.exceptions.InvalidModelDataException;
 import jp.hiroshiba.voicevoxcore.exceptions.LoadUserDictException;
+import jp.hiroshiba.voicevoxcore.exceptions.RunModelException;
 import org.junit.jupiter.api.Test;
 
 class UserDictTest extends TestUtils {
@@ -14,8 +14,7 @@ class UserDictTest extends TestUtils {
   // 辞書ロードのテスト。
   // 辞書ロード前後でkanaが異なることを確認する
   @Test
-  void checkLoad()
-      throws InferenceFailedException, InvalidModelDataException, LoadUserDictException {
+  void checkLoad() throws RunModelException, InvalidModelDataException, LoadUserDictException {
     VoiceModel model = loadModel();
     Onnxruntime onnxruntime = loadOnnxruntime();
     OpenJtalk openJtalk = loadOpenJtalk();
diff --git a/crates/voicevox_core_java_api/src/common.rs b/crates/voicevox_core_java_api/src/common.rs
index c55ce8106..1b45dd44d 100644
--- a/crates/voicevox_core_java_api/src/common.rs
+++ b/crates/voicevox_core_java_api/src/common.rs
@@ -82,7 +82,7 @@ where
                             GetSupportedDevices,
                             StyleNotFound,
                             ModelNotFound,
-                            InferenceFailed,
+                            RunModel,
                             ExtractFullContextLabel,
                             ParseKana,
                             LoadUserDict,
diff --git a/crates/voicevox_core_python_api/python/voicevox_core/__init__.py b/crates/voicevox_core_python_api/python/voicevox_core/__init__.py
index e9a0a03c0..ea1f246b9 100644
--- a/crates/voicevox_core_python_api/python/voicevox_core/__init__.py
+++ b/crates/voicevox_core_python_api/python/voicevox_core/__init__.py
@@ -18,7 +18,6 @@
     ExtractFullContextLabelError,
     GetSupportedDevicesError,
     GpuSupportError,
-    InferenceFailedError,
     InitInferenceRuntimeError,
     InvalidModelDataError,
     InvalidWordError,
@@ -29,6 +28,7 @@
     OpenZipFileError,
     ParseKanaError,
     ReadZipEntryError,
+    RunModelError,
     SaveUserDictError,
     StyleAlreadyLoadedError,
     StyleNotFoundError,
@@ -49,7 +49,6 @@
     "ExtractFullContextLabelError",
     "GetSupportedDevicesError",
     "GpuSupportError",
-    "InferenceFailedError",
     "InitInferenceRuntimeError",
     "InvalidModelDataError",
     "InvalidWordError",
@@ -61,6 +60,7 @@
     "OpenZipFileError",
     "ParseKanaError",
     "ReadZipEntryError",
+    "RunModelError",
     "SaveUserDictError",
     "SpeakerMeta",
     "StyleAlreadyLoadedError",
diff --git a/crates/voicevox_core_python_api/python/voicevox_core/_rust/__init__.pyi b/crates/voicevox_core_python_api/python/voicevox_core/_rust/__init__.pyi
index 81168843f..a456b1162 100644
--- a/crates/voicevox_core_python_api/python/voicevox_core/_rust/__init__.pyi
+++ b/crates/voicevox_core_python_api/python/voicevox_core/_rust/__init__.pyi
@@ -60,7 +60,7 @@ class ModelNotFoundError(KeyError):
 
     ...
 
-class InferenceFailedError(Exception):
+class RunModelError(Exception):
     """推論に失敗した。"""
 
     ...
diff --git a/crates/voicevox_core_python_api/src/convert.rs b/crates/voicevox_core_python_api/src/convert.rs
index b625f70b5..e57f2fb13 100644
--- a/crates/voicevox_core_python_api/src/convert.rs
+++ b/crates/voicevox_core_python_api/src/convert.rs
@@ -13,10 +13,10 @@ use uuid::Uuid;
 use voicevox_core::{AccelerationMode, AccentPhrase, StyleId, UserDictWordType, VoiceModelMeta};
 
 use crate::{
-    ExtractFullContextLabelError, GetSupportedDevicesError, GpuSupportError, InferenceFailedError,
+    ExtractFullContextLabelError, GetSupportedDevicesError, GpuSupportError,
     InitInferenceRuntimeError, InvalidModelDataError, InvalidModelFormatError, InvalidWordError,
     LoadUserDictError, ModelAlreadyLoadedError, ModelNotFoundError, NotLoadedOpenjtalkDictError,
-    OpenZipFileError, ParseKanaError, ReadZipEntryError, SaveUserDictError,
+    OpenZipFileError, ParseKanaError, ReadZipEntryError, RunModelError, SaveUserDictError,
     StyleAlreadyLoadedError, StyleNotFoundError, UseUserDictError, WordNotFoundError,
 };
 
@@ -196,7 +196,7 @@ pub(crate) impl<T> voicevox_core::Result<T> {
                 ErrorKind::GetSupportedDevices => GetSupportedDevicesError::new_err(msg),
                 ErrorKind::StyleNotFound => StyleNotFoundError::new_err(msg),
                 ErrorKind::ModelNotFound => ModelNotFoundError::new_err(msg),
-                ErrorKind::InferenceFailed => InferenceFailedError::new_err(msg),
+                ErrorKind::RunModel => RunModelError::new_err(msg),
                 ErrorKind::ExtractFullContextLabel => ExtractFullContextLabelError::new_err(msg),
                 ErrorKind::ParseKana => ParseKanaError::new_err(msg),
                 ErrorKind::LoadUserDict => LoadUserDictError::new_err(msg),
diff --git a/crates/voicevox_core_python_api/src/lib.rs b/crates/voicevox_core_python_api/src/lib.rs
index 001df0713..d3d790075 100644
--- a/crates/voicevox_core_python_api/src/lib.rs
+++ b/crates/voicevox_core_python_api/src/lib.rs
@@ -78,7 +78,7 @@ exceptions! {
     GetSupportedDevicesError: PyException;
     StyleNotFoundError: PyKeyError;
     ModelNotFoundError: PyKeyError;
-    InferenceFailedError: PyException;
+    RunModelError: PyException;
     ExtractFullContextLabelError: PyException;
     ParseKanaError: PyValueError;
     LoadUserDictError: PyException;

From 62bfd713557bbac412186c73a0f91ccf725080b4 Mon Sep 17 00:00:00 2001
From: cm-ayf <cm.ayf2734@gmail.com>
Date: Fri, 30 Aug 2024 00:01:29 +0900
Subject: [PATCH 24/36] Update jump-to version on README (#824)

---
 README.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/README.md b/README.md
index ae60f587b..4812c1297 100644
--- a/README.md
+++ b/README.md
@@ -1,6 +1,6 @@
 # VOICEVOX CORE
 
-## **現在の main ブランチは工事中なので正しく動かないことがあります。[バージョン 0.14.4](https://github.com/VOICEVOX/voicevox_core/tree/0.14.4)をご利用ください。**
+## **現在の main ブランチは工事中なので正しく動かないことがあります。[バージョン 0.15.4](https://github.com/VOICEVOX/voicevox_core/tree/0.15.4)をご利用ください。**
 
 [![releases](https://img.shields.io/github/v/release/VOICEVOX/voicevox_core?label=release)](https://github.com/VOICEVOX/voicevox_core/releases)
 [![test](https://github.com/VOICEVOX/voicevox_core/actions/workflows/test.yml/badge.svg)](https://github.com/VOICEVOX/voicevox_core/actions/workflows/test.yml)

From 2ab02bd37adbf7330c4459e9921af1bc19dcf1b3 Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Fri, 6 Sep 2024 02:13:46 +0900
Subject: [PATCH 25/36] chore(deps): update dependency rust to v1.81.0 (#826)

Co-authored-by: renovate[bot] <29139614+renovate[bot]@users.noreply.github.com>
---
 rust-toolchain | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/rust-toolchain b/rust-toolchain
index 97e98527c..dbd41264a 100644
--- a/rust-toolchain
+++ b/rust-toolchain
@@ -1 +1 @@
-1.80.1
+1.81.0

From 088ef7ee59e178ebbf952780fa394880ec645121 Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Fri, 6 Sep 2024 15:10:51 +0900
Subject: [PATCH 26/36] =?UTF-8?q?chore:=20Rust=201.81=E3=81=A7=E8=BF=BD?=
 =?UTF-8?q?=E5=8A=A0=E3=81=95=E3=82=8C=E3=81=9F=E6=A9=9F=E8=83=BD=E3=82=92?=
 =?UTF-8?q?=E5=88=A9=E7=94=A8=E3=81=99=E3=82=8B=20(#827)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 crates/test_util/src/lib.rs                        |  4 +++-
 crates/voicevox_core/src/devices.rs                |  5 ++++-
 .../src/engine/acoustic_feature_extractor.rs       |  3 +--
 crates/voicevox_core/src/infer.rs                  | 12 ++++++++++--
 crates/voicevox_core/src/lib.rs                    |  6 ++++--
 crates/voicevox_core/src/manifest.rs               |  4 ++--
 crates/voicevox_core/src/synthesizer.rs            |  6 +++++-
 crates/voicevox_core/src/user_dict/word.rs         |  2 +-
 crates/voicevox_core_c_api/src/lib.rs              | 10 ++++++++--
 crates/voicevox_core_c_api/src/result_code.rs      |  7 ++++---
 crates/voicevox_core_python_api/src/lib.rs         | 14 +++++++-------
 11 files changed, 49 insertions(+), 24 deletions(-)

diff --git a/crates/test_util/src/lib.rs b/crates/test_util/src/lib.rs
index 740cfb415..92e8e941a 100644
--- a/crates/test_util/src/lib.rs
+++ b/crates/test_util/src/lib.rs
@@ -8,7 +8,9 @@ include!(concat!(env!("OUT_DIR"), "/sample_voice_model_file.rs"));
     non_upper_case_globals,
     unused_extern_crates,
     clippy::missing_safety_doc,
-    clippy::too_many_arguments
+    clippy::too_many_arguments,
+    reason = "bindgenが生成するコードのため。`#[expect]`ではなく`#[allow]`なのは、bindgenが生成\
+              するコードがOSにより変わるため"
 )]
 pub mod c_api {
     include!(concat!(env!("OUT_DIR"), "/c_api.rs"));
diff --git a/crates/voicevox_core/src/devices.rs b/crates/voicevox_core/src/devices.rs
index f3027e741..6c0e87d06 100644
--- a/crates/voicevox_core/src/devices.rs
+++ b/crates/voicevox_core/src/devices.rs
@@ -225,7 +225,10 @@ mod tests {
 
         assert_eq!(
             {
-                #[forbid(unused_variables)]
+                #[forbid(
+                    unused_variables,
+                    reason = "比較対象としてここは網羅されてなければなりません"
+                )]
                 let SupportedDevices { cpu: _, cuda, dml } = &SUPPORTED_DEVICES;
                 [cuda as *const _, dml as *const _]
             },
diff --git a/crates/voicevox_core/src/engine/acoustic_feature_extractor.rs b/crates/voicevox_core/src/engine/acoustic_feature_extractor.rs
index a75770dd9..ca2da4697 100644
--- a/crates/voicevox_core/src/engine/acoustic_feature_extractor.rs
+++ b/crates/voicevox_core/src/engine/acoustic_feature_extractor.rs
@@ -63,9 +63,8 @@ static PHONEME_MAP: LazyLock<HashMap<&str, i64>> = LazyLock::new(|| {
 #[derive(Debug, Clone, PartialEq, new, Default, Getters)]
 pub(crate) struct OjtPhoneme {
     phoneme: String,
-    #[allow(dead_code)]
+    // FIXME: derive-getters (probably) masks the warning, but the two fields below should be unused
     start: f32,
-    #[allow(dead_code)]
     end: f32,
 }
 
diff --git a/crates/voicevox_core/src/infer.rs b/crates/voicevox_core/src/infer.rs
index 112ca6b53..0dc322049 100644
--- a/crates/voicevox_core/src/infer.rs
+++ b/crates/voicevox_core/src/infer.rs
@@ -30,7 +30,11 @@ pub(crate) trait InferenceRuntime: 'static {
     /// GPUが実際に利用できそうかどうか判定する。
     fn test_gpu(&self, gpu: GpuSpec) -> anyhow::Result<()>;
 
-    #[allow(clippy::type_complexity)]
+    #[expect(
+        clippy::type_complexity,
+        reason = "ここを呼び出すのは現状一箇所なので、可読性が著しく落ちてはいないことを考えると\
+                  別にこのままでいいはず"
+    )]
     fn new_session(
         &self,
         model: impl FnOnce() -> std::result::Result<Vec<u8>, DecryptModelError>,
@@ -64,7 +68,11 @@ pub(crate) trait InferenceDomain: Sized {
 /// `::macros::InferenceOperation`により導出される。
 pub(crate) trait InferenceOperation: Copy + Enum {
     /// `{InferenceInputSignature,InferenceOutputSignature}::PARAM_INFOS`を集めたもの。
-    #[allow(clippy::type_complexity)]
+    #[expect(
+        clippy::type_complexity,
+        reason = "ここを参照するのは現状一箇所なので、可読性が著しく落ちてはいないことを考えると\
+                  別にこのままでいいはず"
+    )]
     const PARAM_INFOS: EnumMap<
         Self,
         (
diff --git a/crates/voicevox_core/src/lib.rs b/crates/voicevox_core/src/lib.rs
index fedf538cf..94ccc0d5a 100644
--- a/crates/voicevox_core/src/lib.rs
+++ b/crates/voicevox_core/src/lib.rs
@@ -72,8 +72,10 @@ pub mod tokio;
 #[cfg(test)]
 mod test_util;
 
-// https://crates.io/crates/rstest_reuse#use-rstest_resuse-at-the-top-of-your-crate
-#[allow(clippy::single_component_path_imports)]
+#[expect(
+    clippy::single_component_path_imports,
+    reason = "https://crates.io/crates/rstest_reuse/0.6.0#use-rstest_resuse-at-the-top-of-your-crate"
+)]
 #[cfg(test)]
 use rstest_reuse;
 
diff --git a/crates/voicevox_core/src/manifest.rs b/crates/voicevox_core/src/manifest.rs
index 0808a6414..4460f10bf 100644
--- a/crates/voicevox_core/src/manifest.rs
+++ b/crates/voicevox_core/src/manifest.rs
@@ -67,7 +67,7 @@ impl Display for InnerVoiceId {
 
 #[derive(Deserialize, Getters, Clone)]
 pub struct Manifest {
-    #[allow(dead_code)]
+    #[expect(dead_code, reason = "現状はバリデーションのためだけに存在")]
     vvm_format_version: FormatVersionV1,
     pub(crate) id: VoiceModelId,
     metas_filename: String,
@@ -125,7 +125,7 @@ mod tests {
 
         #[derive(Deserialize)]
         struct ManifestPart {
-            #[allow(dead_code)]
+            #[expect(dead_code, reason = "バリデーションのためだけに存在")]
             vvm_format_version: FormatVersionV1,
         }
     }
diff --git a/crates/voicevox_core/src/synthesizer.rs b/crates/voicevox_core/src/synthesizer.rs
index 8dcbf848a..3b9642c8a 100644
--- a/crates/voicevox_core/src/synthesizer.rs
+++ b/crates/voicevox_core/src/synthesizer.rs
@@ -808,7 +808,11 @@ pub(crate) mod blocking {
         /// # Performance
         ///
         /// CPU-boundな操作であるため、非同期ランタイム上では直接実行されるべきではない。
-        #[allow(clippy::too_many_arguments)]
+        #[expect(
+            clippy::too_many_arguments,
+            reason = "compatible_engineでの`predict_intonation`の形を考えると、ここの引数を構造体に\
+                      まとめたりしても可読性に寄与しない"
+        )]
         fn predict_intonation(
             &self,
             length: usize,
diff --git a/crates/voicevox_core/src/user_dict/word.rs b/crates/voicevox_core/src/user_dict/word.rs
index 0a42f1da5..afc023669 100644
--- a/crates/voicevox_core/src/user_dict/word.rs
+++ b/crates/voicevox_core/src/user_dict/word.rs
@@ -55,7 +55,7 @@ impl<'de> Deserialize<'de> for UserDictWord {
     }
 }
 
-#[allow(clippy::enum_variant_names)] // FIXME
+#[expect(clippy::enum_variant_names, reason = "特に理由はないので正されるべき")] // FIXME
 #[derive(thiserror::Error, Debug, PartialEq)]
 pub(crate) enum InvalidWordError {
     #[error("{}: 無効な発音です({_1}): {_0:?}", Self::BASE_MSG)]
diff --git a/crates/voicevox_core_c_api/src/lib.rs b/crates/voicevox_core_c_api/src/lib.rs
index f35179807..161af38e9 100644
--- a/crates/voicevox_core_c_api/src/lib.rs
+++ b/crates/voicevox_core_c_api/src/lib.rs
@@ -354,7 +354,10 @@ pub extern "C" fn voicevox_open_jtalk_rc_delete(open_jtalk: Box<OpenJtalkRc>) {
 /// ハードウェアアクセラレーションモードを設定する設定値。
 #[repr(i32)]
 #[derive(Debug, PartialEq, Eq)]
-#[allow(non_camel_case_types)]
+#[allow(
+    non_camel_case_types,
+    reason = "実際に公開するC APIとの差異をできるだけ少なくするため"
+)]
 pub enum VoicevoxAccelerationMode {
     /// 実行環境に合った適切なハードウェアアクセラレーションモードを選択する
     VOICEVOX_ACCELERATION_MODE_AUTO = 0,
@@ -1247,7 +1250,10 @@ pub struct VoicevoxUserDictWord {
 
 /// ユーザー辞書の単語の種類。
 #[repr(i32)]
-#[allow(non_camel_case_types)]
+#[allow(
+    non_camel_case_types,
+    reason = "実際に公開するC APIとの差異をできるだけ少なくするため"
+)]
 #[derive(Copy, Clone)]
 pub enum VoicevoxUserDictWordType {
     /// 固有名詞。
diff --git a/crates/voicevox_core_c_api/src/result_code.rs b/crates/voicevox_core_c_api/src/result_code.rs
index bfdbc8444..c3515ce0e 100644
--- a/crates/voicevox_core_c_api/src/result_code.rs
+++ b/crates/voicevox_core_c_api/src/result_code.rs
@@ -5,10 +5,11 @@ use cstr::cstr;
 /// 処理結果を示す結果コード。
 #[repr(i32)]
 #[derive(Debug, PartialEq, Eq, Clone, Copy)]
-#[allow(non_camel_case_types)]
+#[allow(
+    non_camel_case_types,
+    reason = "実際に公開するC APIとの差異をできるだけ少なくするため"
+)]
 pub enum VoicevoxResultCode {
-    // C でのenum定義に合わせて大文字で定義している
-    // 出力フォーマットを変更すればRustでよく使われているUpperCamelにできるが、実際に出力されるコードとの差異をできるだけ少なくするため
     /// 成功
     VOICEVOX_RESULT_OK = 0,
     /// open_jtalk辞書ファイルが読み込まれていない
diff --git a/crates/voicevox_core_python_api/src/lib.rs b/crates/voicevox_core_python_api/src/lib.rs
index d3d790075..9eabae6a3 100644
--- a/crates/voicevox_core_python_api/src/lib.rs
+++ b/crates/voicevox_core_python_api/src/lib.rs
@@ -322,9 +322,9 @@ mod blocking {
 
         fn __exit__(
             &mut self,
-            #[allow(unused_variables)] exc_type: &PyAny,
-            #[allow(unused_variables)] exc_value: &PyAny,
-            #[allow(unused_variables)] traceback: &PyAny,
+            #[expect(unused_variables, reason = "`__exit__`としては必要")] exc_type: &PyAny,
+            #[expect(unused_variables, reason = "`__exit__`としては必要")] exc_value: &PyAny,
+            #[expect(unused_variables, reason = "`__exit__`としては必要")] traceback: &PyAny,
         ) {
             self.close();
         }
@@ -759,7 +759,7 @@ mod asyncio {
 
     #[pymethods]
     impl OpenJtalk {
-        #[allow(clippy::new_ret_no_self)]
+        #[expect(clippy::new_ret_no_self, reason = "これはPython API")]
         #[staticmethod]
         fn new(
             #[pyo3(from_py_with = "crate::convert::from_utf8_path")]
@@ -829,9 +829,9 @@ mod asyncio {
 
         fn __exit__(
             &mut self,
-            #[allow(unused_variables)] exc_type: &PyAny,
-            #[allow(unused_variables)] exc_value: &PyAny,
-            #[allow(unused_variables)] traceback: &PyAny,
+            #[expect(unused_variables, reason = "`__exit__`としては必要")] exc_type: &PyAny,
+            #[expect(unused_variables, reason = "`__exit__`としては必要")] exc_value: &PyAny,
+            #[expect(unused_variables, reason = "`__exit__`としては必要")] traceback: &PyAny,
         ) {
             self.close();
         }

From e07c795846c44837e969a91b9ebf3aaa7937ee81 Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Thu, 12 Sep 2024 19:03:34 +0900
Subject: [PATCH 27/36] improve: rework `VoiceModel` (#830)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* improve: rework `VoiceModel`

* diffを抑える工夫

* Minor refactor

* `.ref_map(…)` → `.each_ref().map(…)`

* `collect_results` → `collect`, `collect_future_results` → `join`

* `join`から`Result`の`collect`を分離

* fixup! diffを抑える工夫

* `blocking`版はblockingクレートに依存しない

* async_zip v0.0.17に備える

* `SmolBlocking` → `BlockingThreadPool`

* Minor refactor

* `futures_lite::future::block_on`を`.block_on()`として使えるようにする

* `join` → `join_all`

https://github.com/VOICEVOX/voicevox_core/pull/830#discussion_r1751120123

* `find_index` → `find_entry_index`

https://github.com/VOICEVOX/voicevox_core/pull/830#discussion_r1751135133

* "join"しない

* Minor refactor

* `crate::asyncs`にdoc

https://github.com/VOICEVOX/voicevox_core/pull/830#discussion_r1751106595

* `Unstoppable` → `SingleTasked`

https://github.com/VOICEVOX/voicevox_core/pull/830#discussion_r1754333231
https://chatgpt.com/share/cdae540e-5751-43a5-a1fb-ac1f17d6a1b8
---
 Cargo.lock                                    | 112 +++-
 Cargo.toml                                    |   3 +-
 crates/voicevox_core/Cargo.toml               |   7 +-
 crates/voicevox_core/src/asyncs.rs            |  82 +++
 crates/voicevox_core/src/future.rs            |  16 +
 crates/voicevox_core/src/infer/domains.rs     |  47 ++
 crates/voicevox_core/src/lib.rs               |   2 +
 crates/voicevox_core/src/manifest.rs          |  31 +-
 crates/voicevox_core/src/voice_model.rs       | 571 +++++++++---------
 crates/voicevox_core_c_api/Cargo.toml         |   1 -
 .../src/compatible_engine.rs                  |  10 +-
 crates/voicevox_core_macros/src/extract.rs    |  31 +
 .../src/inference_domain.rs                   |  40 +-
 crates/voicevox_core_macros/src/lib.rs        |  31 +
 crates/voicevox_core_macros/src/manifest.rs   |  72 +++
 crates/voicevox_core_python_api/src/lib.rs    |  10 +-
 16 files changed, 726 insertions(+), 340 deletions(-)
 create mode 100644 crates/voicevox_core/src/asyncs.rs
 create mode 100644 crates/voicevox_core/src/future.rs
 create mode 100644 crates/voicevox_core_macros/src/extract.rs
 create mode 100644 crates/voicevox_core_macros/src/manifest.rs

diff --git a/Cargo.lock b/Cargo.lock
index 7d70c15b8..53117ce5c 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -166,6 +166,18 @@ dependencies = [
  "yansi",
 ]
 
+[[package]]
+name = "async-channel"
+version = "2.3.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "89b47800b0be77592da0afd425cc03468052844aff33b84e33cc696f64e77b6a"
+dependencies = [
+ "concurrent-queue",
+ "event-listener-strategy",
+ "futures-core",
+ "pin-project-lite",
+]
+
 [[package]]
 name = "async-compression"
 version = "0.4.6"
@@ -179,6 +191,34 @@ dependencies = [
  "pin-project-lite",
 ]
 
+[[package]]
+name = "async-fs"
+version = "2.1.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ebcd09b382f40fcd159c2d695175b2ae620ffa5f3bd6f664131efff4e8b9e04a"
+dependencies = [
+ "async-lock",
+ "blocking",
+ "futures-lite",
+]
+
+[[package]]
+name = "async-lock"
+version = "3.4.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ff6e472cdea888a4bd64f342f09b3f50e1886d32afe8df3d663c01140b811b18"
+dependencies = [
+ "event-listener",
+ "event-listener-strategy",
+ "pin-project-lite",
+]
+
+[[package]]
+name = "async-task"
+version = "4.7.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8b75356056920673b02621b35afd0f7dda9306d03c79a30f5c56c44cf256e3de"
+
 [[package]]
 name = "async-trait"
 version = "0.1.57"
@@ -203,6 +243,12 @@ dependencies = [
  "thiserror",
 ]
 
+[[package]]
+name = "atomic-waker"
+version = "1.1.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1505bd5d3d116872e7271a6d4e16d81d0c8570876c8de68093a09ac269d8aac0"
+
 [[package]]
 name = "atty"
 version = "0.2.14"
@@ -354,6 +400,19 @@ dependencies = [
  "generic-array",
 ]
 
+[[package]]
+name = "blocking"
+version = "1.6.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "703f41c54fc768e63e091340b424302bb1c29ef4aa0c7f10fe849dfb114d29ea"
+dependencies = [
+ "async-channel",
+ "async-task",
+ "futures-io",
+ "futures-lite",
+ "piper",
+]
+
 [[package]]
 name = "bstr"
 version = "1.2.0"
@@ -695,6 +754,15 @@ version = "0.1.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "82a90734b3d5dcf656e7624cca6bce9c3a90ee11f900e80141a7427ccfb3d317"
 
+[[package]]
+name = "concurrent-queue"
+version = "2.5.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "4ca0197aee26d1ae37445ee532fefce43251d24cc7c166799f4d46817f1d3973"
+dependencies = [
+ "crossbeam-utils",
+]
+
 [[package]]
 name = "console"
 version = "0.15.4"
@@ -1253,6 +1321,27 @@ dependencies = [
  "libc",
 ]
 
+[[package]]
+name = "event-listener"
+version = "5.3.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "6032be9bd27023a771701cc49f9f053c751055f71efb2e0ae5c15809093675ba"
+dependencies = [
+ "concurrent-queue",
+ "parking",
+ "pin-project-lite",
+]
+
+[[package]]
+name = "event-listener-strategy"
+version = "0.5.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0f214dc438f977e6d4e3500aaa277f5ad94ca83fbbd9b1a15713ce2344ccc5a1"
+dependencies = [
+ "event-listener",
+ "pin-project-lite",
+]
+
 [[package]]
 name = "eyre"
 version = "0.6.8"
@@ -2637,9 +2726,9 @@ dependencies = [
 
 [[package]]
 name = "pin-project-lite"
-version = "0.2.9"
+version = "0.2.14"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "e0a7ae3ac2f1173085d398531c705756c94a4c56843785df85a60c1a0afac116"
+checksum = "bda66fc9667c18cb2758a2ac84d1167245054bcf85d5d1aaa6923f45801bdd02"
 
 [[package]]
 name = "pin-utils"
@@ -2647,6 +2736,17 @@ version = "0.1.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "8b870d8c151b6f2fb93e84a13146138f05d02ed11c7e7c54f8826aaaf7c9f184"
 
+[[package]]
+name = "piper"
+version = "0.2.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "96c8c490f422ef9a4efd2cb5b42b76c8613d7e7dfc1caf667b8a3350a5acc066"
+dependencies = [
+ "atomic-waker",
+ "fastrand 2.0.1",
+ "futures-io",
+]
+
 [[package]]
 name = "pkg-config"
 version = "0.3.30"
@@ -4243,6 +4343,7 @@ name = "voicevox_core"
 version = "0.0.0"
 dependencies = [
  "anyhow",
+ "async-fs",
  "async_zip",
  "camino",
  "const_format",
@@ -4254,7 +4355,9 @@ dependencies = [
  "educe",
  "enum-map",
  "fs-err",
- "futures",
+ "futures-io",
+ "futures-lite",
+ "futures-util",
  "heck",
  "humansize",
  "indexmap 2.0.0",
@@ -4264,7 +4367,6 @@ dependencies = [
  "open_jtalk",
  "ouroboros",
  "pretty_assertions",
- "rayon",
  "ref-cast",
  "regex",
  "rstest",
@@ -4283,7 +4385,6 @@ dependencies = [
  "voicevox-ort",
  "voicevox_core_macros",
  "windows",
- "zip",
 ]
 
 [[package]]
@@ -4303,7 +4404,6 @@ dependencies = [
  "derive-getters",
  "duct",
  "easy-ext",
- "futures",
  "inventory",
  "itertools 0.10.5",
  "libc",
diff --git a/Cargo.toml b/Cargo.toml
index d72625c5f..3a2fffb01 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -8,6 +8,7 @@ anstream = { version = "0.5.0", default-features = false }
 anstyle-query = "1.0.0"
 anyhow = "1.0.65"
 assert_cmd = "2.0.8"
+async-fs = "2.1.2"
 async_zip = "=0.0.16"
 bindgen = "0.69.4"
 binstall-tar = "0.4.39"
@@ -33,10 +34,10 @@ enum-map = "3.0.0-beta.1"
 eyre = "0.6.8"
 flate2 = "1.0.25"
 fs-err = "2.11.0"
-futures = "0.3.26"
 futures-core = "0.3.25"
 futures-util = "0.3.25"
 futures-lite = "2.2.0"
+futures-io = "0.3.28"
 heck = "0.4.1"
 humansize = "2.1.2"
 indexmap = "2.0.0"
diff --git a/crates/voicevox_core/Cargo.toml b/crates/voicevox_core/Cargo.toml
index 8cb2b1cfc..74feebb4b 100644
--- a/crates/voicevox_core/Cargo.toml
+++ b/crates/voicevox_core/Cargo.toml
@@ -16,6 +16,7 @@ link-onnxruntime = []
 
 [dependencies]
 anyhow.workspace = true
+async-fs.workspace = true
 async_zip = { workspace = true, features = ["deflate"] }
 camino.workspace = true
 const_format.workspace = true
@@ -27,14 +28,15 @@ easy-ext.workspace = true
 educe.workspace = true
 enum-map.workspace = true
 fs-err = { workspace = true, features = ["tokio"] }
-futures.workspace = true
+futures-io.workspace = true
+futures-lite.workspace = true
+futures-util = { workspace = true, features = ["io"] }
 indexmap = { workspace = true, features = ["serde"] }
 itertools.workspace = true
 jlabel.workspace = true
 ndarray.workspace = true
 open_jtalk.workspace = true
 ouroboros.workspace = true
-rayon.workspace = true
 ref-cast.workspace = true
 regex.workspace = true
 serde = { workspace = true, features = ["derive", "rc"] }
@@ -49,7 +51,6 @@ tracing.workspace = true
 uuid = { workspace = true, features = ["v4", "serde"] }
 voicevox-ort = { workspace = true, features = ["download-binaries", "__init-for-voicevox"] }
 voicevox_core_macros = { path = "../voicevox_core_macros" }
-zip.workspace = true
 
 [dev-dependencies]
 heck.workspace = true
diff --git a/crates/voicevox_core/src/asyncs.rs b/crates/voicevox_core/src/asyncs.rs
new file mode 100644
index 000000000..7bbabbb06
--- /dev/null
+++ b/crates/voicevox_core/src/asyncs.rs
@@ -0,0 +1,82 @@
+//! Switches between implementations of asynchronous operations.
+//!
+//! The differences between the "[blocking API]" and the "[asynchronous API]" are planned to be
+//! consolidated here. Currently it is used only by [`crate::voice_model`].
+//!
+//! # Motivation
+//!
+//! Asynchronous processing driven by the [blocking] crate works without a runtime, so the blocking
+//! API could be built on top of the asynchronous API. However, in a future WASM build threads
+//! cannot be handled properly and that approach would stop working. [`SingleTasked`] is therefore
+//! provided for a blocking API that anticipates the move to WASM.
+//!
+//! [blocking API]: crate::blocking
+//! [asynchronous API]: crate::tokio
+//! [blocking]: https://docs.rs/crate/blocking
+
+use std::{
+    io::{self, Read as _, Seek as _, SeekFrom},
+    path::Path,
+    pin::Pin,
+    task::{self, Poll},
+};
+
+use futures_io::{AsyncRead, AsyncSeek};
+
+pub(crate) trait Async: 'static {
+    async fn open_file(path: impl AsRef<Path>) -> io::Result<impl AsyncRead + AsyncSeek + Unpin>;
+}
+
+/// An [`Async`] implementation that assumes the executor does not run tasks concurrently.
+///
+/// For the [blocking API].
+///
+/// # Performance
+///
+/// Performs blocking operations directly inside `async`. It therefore should not run on an ordinary
+/// asynchronous runtime such as Tokio or async-std.
+///
+/// [blocking API]: crate::blocking
+pub(crate) enum SingleTasked {}
+
+impl Async for SingleTasked {
+    async fn open_file(path: impl AsRef<Path>) -> io::Result<impl AsyncRead + AsyncSeek + Unpin> {
+        return std::fs::File::open(path).map(BlockingFile);
+
+        struct BlockingFile(std::fs::File);
+
+        impl AsyncRead for BlockingFile {
+            fn poll_read(
+                mut self: Pin<&mut Self>,
+                _: &mut task::Context<'_>,
+                buf: &mut [u8],
+            ) -> Poll<io::Result<usize>> {
+                Poll::Ready(self.0.read(buf))
+            }
+        }
+
+        impl AsyncSeek for BlockingFile {
+            fn poll_seek(
+                mut self: Pin<&mut Self>,
+                _: &mut task::Context<'_>,
+                pos: SeekFrom,
+            ) -> Poll<io::Result<u64>> {
+                Poll::Ready(self.0.seek(pos))
+            }
+        }
+    }
+}
+
+/// An [`Async`] implementation driven by the [blocking] crate.
+///
+/// For the [asynchronous API].
+///
+/// [blocking]: https://docs.rs/crate/blocking
+/// [asynchronous API]: crate::tokio
+pub(crate) enum BlockingThreadPool {}
+
+impl Async for BlockingThreadPool {
+    async fn open_file(path: impl AsRef<Path>) -> io::Result<impl AsyncRead + AsyncSeek + Unpin> {
+        async_fs::File::open(path).await
+    }
+}
diff --git a/crates/voicevox_core/src/future.rs b/crates/voicevox_core/src/future.rs
new file mode 100644
index 000000000..4ddbf3303
--- /dev/null
+++ b/crates/voicevox_core/src/future.rs
@@ -0,0 +1,16 @@
+use std::future::Future;
+
+use easy_ext::ext;
+
+/// Makes `futures_lite::future::block_on` usable in the `.block_on()` form, like [pollster].
+///
+/// [pollster]: https://docs.rs/crate/pollster
+#[ext(FutureExt)]
+impl<F: Future> F {
+    pub(crate) fn block_on(self) -> Self::Output
+    where
+        Self: Sized,
+    {
+        futures_lite::future::block_on(self)
+    }
+}
diff --git a/crates/voicevox_core/src/infer/domains.rs b/crates/voicevox_core/src/infer/domains.rs
index 687550399..5225f2ec3 100644
--- a/crates/voicevox_core/src/infer/domains.rs
+++ b/crates/voicevox_core/src/infer/domains.rs
@@ -1,14 +1,61 @@
 mod talk;
 
+use educe::Educe;
+use serde::{Deserialize, Deserializer};
+
 pub(crate) use self::talk::{
     DecodeInput, DecodeOutput, PredictDurationInput, PredictDurationOutput, PredictIntonationInput,
     PredictIntonationOutput, TalkDomain, TalkOperation,
 };
 
+#[derive(Educe)]
+// TODO: adding `V: ?Sized` to `bounds` as well is rejected for an unclear reason. Does the latest
+// educe behave the same? And if it still fails there, what is the reason for the rejection?
+#[educe(Clone(bound = "V: InferenceDomainMapValues, V::Talk: Clone"))]
 pub(crate) struct InferenceDomainMap<V: InferenceDomainMapValues + ?Sized> {
     pub(crate) talk: V::Talk,
 }
 
+impl<T> InferenceDomainMap<(T,)> {
+    pub(crate) fn each_ref(&self) -> InferenceDomainMap<(&T,)> {
+        let talk = &self.talk;
+        InferenceDomainMap { talk }
+    }
+
+    pub(crate) fn map<T2, Ft: FnOnce(T) -> T2>(
+        self,
+        fs: InferenceDomainMap<(Ft,)>,
+    ) -> InferenceDomainMap<(T2,)> {
+        let talk = (fs.talk)(self.talk);
+        InferenceDomainMap { talk }
+    }
+}
+
+impl<T, E> InferenceDomainMap<(Result<T, E>,)> {
+    pub(crate) fn collect(self) -> Result<InferenceDomainMap<(T,)>, E> {
+        let talk = self.talk?;
+        Ok(InferenceDomainMap { talk })
+    }
+}
+
+impl<'de, V: InferenceDomainMapValues + ?Sized> Deserialize<'de> for InferenceDomainMap<V>
+where
+    V::Talk: Deserialize<'de>,
+{
+    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
+    where
+        D: Deserializer<'de>,
+    {
+        let Repr { talk } = Repr::deserialize(deserializer)?;
+        return Ok(Self { talk });
+
+        #[derive(Deserialize)]
+        struct Repr<T> {
+            talk: T,
+        }
+    }
+}
+
 pub(crate) trait InferenceDomainMapValues {
     type Talk;
 }
diff --git a/crates/voicevox_core/src/lib.rs b/crates/voicevox_core/src/lib.rs
index 94ccc0d5a..dad702cc6 100644
--- a/crates/voicevox_core/src/lib.rs
+++ b/crates/voicevox_core/src/lib.rs
@@ -48,10 +48,12 @@ const _: () = {
     );
 };
 
+mod asyncs;
 mod devices;
 /// cbindgen:ignore
 mod engine;
 mod error;
+mod future;
 mod infer;
 mod macros;
 mod manifest;
diff --git a/crates/voicevox_core/src/manifest.rs b/crates/voicevox_core/src/manifest.rs
index 4460f10bf..203fc76a9 100644
--- a/crates/voicevox_core/src/manifest.rs
+++ b/crates/voicevox_core/src/manifest.rs
@@ -7,10 +7,14 @@ use std::{
 use derive_getters::Getters;
 use derive_more::Deref;
 use derive_new::new;
+use macros::IndexForFields;
 use serde::{de, Deserialize, Deserializer, Serialize};
 use serde_with::{serde_as, DisplayFromStr};
 
-use crate::{StyleId, VoiceModelId};
+use crate::{
+    infer::domains::{InferenceDomainMap, TalkOperation},
+    StyleId, VoiceModelId,
+};
 
 #[derive(Clone)]
 struct FormatVersionV1;
@@ -65,26 +69,31 @@ impl Display for InnerVoiceId {
     }
 }
 
-#[derive(Deserialize, Getters, Clone)]
+#[derive(Deserialize, Getters)]
 pub struct Manifest {
     #[expect(dead_code, reason = "現状はバリデーションのためだけに存在")]
     vvm_format_version: FormatVersionV1,
     pub(crate) id: VoiceModelId,
     metas_filename: String,
     #[serde(flatten)]
-    domains: ManifestDomains,
+    domains: InferenceDomainMap<ManifestDomains>,
 }
 
-#[derive(Deserialize, Clone)]
-pub(crate) struct ManifestDomains {
-    pub(crate) talk: Option<TalkManifest>,
-}
+pub(crate) type ManifestDomains = (Option<TalkManifest>,);
 
-#[derive(Deserialize, Clone)]
+#[derive(Deserialize, IndexForFields)]
+#[cfg_attr(test, derive(Default))]
+#[index_for_fields(TalkOperation)]
 pub(crate) struct TalkManifest {
-    pub(crate) predict_duration_filename: String,
-    pub(crate) predict_intonation_filename: String,
-    pub(crate) decode_filename: String,
+    #[index_for_fields(TalkOperation::PredictDuration)]
+    pub(crate) predict_duration_filename: Arc<str>,
+
+    #[index_for_fields(TalkOperation::PredictIntonation)]
+    pub(crate) predict_intonation_filename: Arc<str>,
+
+    #[index_for_fields(TalkOperation::Decode)]
+    pub(crate) decode_filename: Arc<str>,
+
     #[serde(default)]
     pub(crate) style_id_to_inner_voice_id: StyleIdToInnerVoiceId,
 }
diff --git a/crates/voicevox_core/src/voice_model.rs b/crates/voicevox_core/src/voice_model.rs
index 48477256c..ac49d2cdb 100644
--- a/crates/voicevox_core/src/voice_model.rs
+++ b/crates/voicevox_core/src/voice_model.rs
@@ -2,24 +2,33 @@
 //!
 //! VVM ファイルの定義と形式は[ドキュメント](../../../docs/vvm.md)を参照。
 
-use anyhow::anyhow;
+use std::{
+    marker::PhantomData,
+    path::{Path, PathBuf},
+    sync::Arc,
+};
+
+use anyhow::{anyhow, Context as _};
 use derive_more::From;
 use easy_ext::ext;
-use enum_map::EnumMap;
+use enum_map::{enum_map, EnumMap};
+use futures_io::{AsyncBufRead, AsyncSeek};
+use futures_util::future::{OptionFuture, TryFutureExt as _};
 use itertools::Itertools as _;
+use ouroboros::self_referencing;
 use serde::Deserialize;
 use uuid::Uuid;
 
 use crate::{
+    asyncs::Async,
     error::{LoadModelError, LoadModelErrorKind, LoadModelResult},
     infer::{
-        domains::{TalkDomain, TalkOperation},
+        domains::{InferenceDomainMap, TalkDomain, TalkOperation},
         InferenceDomain,
     },
-    manifest::{Manifest, ManifestDomains, StyleIdToInnerVoiceId},
+    manifest::{Manifest, ManifestDomains, StyleIdToInnerVoiceId, TalkManifest},
     SpeakerMeta, StyleMeta, StyleType, VoiceModelMeta,
 };
-use std::path::{Path, PathBuf};
 
 /// [`VoiceModelId`]の実体。
 ///
@@ -51,11 +60,238 @@ impl VoiceModelId {
     }
 }
 
+/// Core of both `VoiceModel`s: the header plus per-domain model entries that borrow from it.
+#[self_referencing]
+struct Inner<A> {
+    header: VoiceModelHeader,
+
+    #[borrows(header)]
+    #[not_covariant]
+    inference_model_entries: InferenceDomainMap<InferenceModelEntries<'this>>,
+
+    // Not `_marker`: the generated `borrow__marker` would trip the `non_snake_case` lint.
+    marker: PhantomData<fn(A) -> A>,
+}
+
+impl<A: Async> Inner<A> {
+    async fn from_path(path: impl AsRef<Path>) -> crate::Result<Self> {
+        const MANIFEST_FILENAME: &str = "manifest.json";
+
+        let path = path.as_ref();
+
+        let error = |context, source| LoadModelError {
+            path: path.to_owned(),
+            context,
+            source: Some(source),
+        };
+
+        let mut zip = A::open_zip(path)
+            .await
+            .map_err(|source| error(LoadModelErrorKind::OpenZipFile, source))?;
+
+        let manifest = &async {
+            let idx = zip.find_entry_index(MANIFEST_FILENAME)?;
+            zip.read_file(idx).await
+        }
+        .await
+        .map_err(|source| {
+            error(
+                LoadModelErrorKind::ReadZipEntry {
+                    filename: MANIFEST_FILENAME.to_owned(),
+                },
+                source,
+            )
+        })?;
+        let manifest = serde_json::from_slice::<Manifest>(manifest)
+            .map_err(|source| error(LoadModelErrorKind::InvalidModelFormat, source.into()))?;
+
+        let metas = &async {
+            let idx = zip.find_entry_index(manifest.metas_filename())?;
+            zip.read_file(idx).await
+        }
+        .await
+        .map_err(|source| {
+            error(
+                LoadModelErrorKind::ReadZipEntry {
+                    filename: manifest.metas_filename().clone(),
+                },
+                source,
+            )
+        })?;
+
+        let header = VoiceModelHeader::new(manifest, metas, path)?;
+
+        InnerTryBuilder {
+            header,
+            inference_model_entries_builder: |VoiceModelHeader { manifest, .. }| {
+                manifest
+                    .domains()
+                    .each_ref()
+                    .map(InferenceDomainMap {
+                        talk: |talk| {
+                            talk.as_ref()
+                                .map(|manifest| {
+                                    let indices = enum_map! {
+                                        TalkOperation::PredictDuration => {
+                                            zip.find_entry_index(&manifest.predict_duration_filename)?
+                                        }
+                                        TalkOperation::PredictIntonation => zip.find_entry_index(
+                                            &manifest.predict_intonation_filename,
+                                        )?,
+                                        TalkOperation::Decode => {
+                                            zip.find_entry_index(&manifest.decode_filename)?
+                                        }
+                                    };
+
+                                    Ok(InferenceModelEntry { indices, manifest })
+                                })
+                                .transpose()
+                                .map_err(move |source| {
+                                    error(
+                                        LoadModelErrorKind::ReadZipEntry {
+                                            filename: MANIFEST_FILENAME.to_owned(),
+                                        },
+                                        source,
+                                    )
+                                })
+                        },
+                    })
+                    .collect()
+                    .map_err(crate::Error::from)
+            },
+            marker: PhantomData,
+        }
+        .try_build()
+    }
+
+    fn id(&self) -> VoiceModelId {
+        self.borrow_header().manifest.id
+    }
+
+    fn metas(&self) -> &VoiceModelMeta {
+        &self.borrow_header().metas
+    }
+
+    fn header(&self) -> &VoiceModelHeader {
+        self.borrow_header()
+    }
+
+    async fn read_inference_models(
+        &self,
+    ) -> LoadModelResult<InferenceDomainMap<ModelBytesWithInnerVoiceIdsByDomain>> {
+        let path = &self.borrow_header().path;
+
+        let error = |context, source| LoadModelError {
+            path: path.to_owned(),
+            context,
+            source: Some(source),
+        };
+
+        let mut zip = A::open_zip(path)
+            .await
+            .map_err(|source| error(LoadModelErrorKind::OpenZipFile, source))?;
+
+        macro_rules! read_file {
+            ($entry:expr $(,)?) => {{
+                let (index, filename): (usize, Arc<str>) = $entry;
+                zip.read_file(index)
+                    .map_err(move |source| {
+                        error(
+                            LoadModelErrorKind::ReadZipEntry {
+                                filename: (*filename).to_owned(),
+                            },
+                            source,
+                        )
+                    })
+                    .await?
+            }};
+        }
+
+        let InferenceDomainMap { talk } =
+            self.with_inference_model_entries(|inference_model_entries| {
+                inference_model_entries.each_ref().map(InferenceDomainMap {
+                    talk: |talk| {
+                        talk.as_ref()
+                            .map(|InferenceModelEntry { indices, manifest }| {
+                                (
+                                    indices.map(|op, i| (i, manifest[op].clone())),
+                                    manifest.style_id_to_inner_voice_id.clone(),
+                                )
+                            })
+                    },
+                })
+            });
+
+        let talk = OptionFuture::from(talk.map(
+            |(entries, style_id_to_inner_voice_id)| async move {
+                let [predict_duration, predict_intonation, decode] = entries.into_array();
+
+                let predict_duration = read_file!(predict_duration);
+                let predict_intonation = read_file!(predict_intonation);
+                let decode = read_file!(decode);
+
+                let model_bytes =
+                    EnumMap::from_array([predict_duration, predict_intonation, decode]);
+
+                Ok((style_id_to_inner_voice_id, model_bytes))
+            },
+        ))
+        .await
+        .transpose()?;
+
+        Ok(InferenceDomainMap { talk })
+    }
+}
+
+type InferenceModelEntries<'manifest> =
+    (Option<InferenceModelEntry<TalkDomain, &'manifest TalkManifest>>,);
+
+struct InferenceModelEntry<D: InferenceDomain, M> {
+    indices: EnumMap<D::Operation, usize>,
+    manifest: M,
+}
+
+#[ext]
+impl<A: Async> A {
+    async fn open_zip(
+        path: &Path,
+    ) -> anyhow::Result<async_zip::base::read::seek::ZipFileReader<impl AsyncBufRead + AsyncSeek>>
+    {
+        let zip = Self::open_file(path).await.with_context(|| {
+            // Use the same message as fs-err does
+            format!("failed to open file `{}`", path.display())
+        })?;
+        let zip = futures_util::io::BufReader::new(zip); // not needed with async_zip v0.0.16, required with v0.0.17
+        let zip = async_zip::base::read::seek::ZipFileReader::new(zip).await?;
+        Ok(zip)
+    }
+}
+
+#[ext]
+impl<R: AsyncBufRead + AsyncSeek + Unpin> async_zip::base::read::seek::ZipFileReader<R> {
+    /// Returns the index of the first entry named `filename`, or an error naming it if absent.
+    fn find_entry_index(&self, filename: &str) -> anyhow::Result<usize> {
+        // `format!` is required: a plain literal would print `{filename}` verbatim.
+        self.file()
+            .entries()
+            .iter()
+            .position(|e| e.filename().as_str().ok() == Some(filename))
+            .with_context(|| format!("could not find `{filename}`"))
+    }
+
+    /// Reads the entire entry at `index` into a newly allocated buffer.
+    async fn read_file(&mut self, index: usize) -> anyhow::Result<Vec<u8>> {
+        let mut rdr = self.reader_with_entry(index).await?;
+        let mut buf = Vec::with_capacity(rdr.entry().uncompressed_size() as usize);
+        rdr.read_to_end_checked(&mut buf).await?;
+        Ok(buf)
+    }
+}
+
 // FIXME: "header"といいつつ、VVMのファイルパスを持っている状態になっている。
 /// 音声モデルが持つ、各モデルファイルの実体を除く情報。
 ///
 /// モデルの`[u8]`と分けて`Status`に渡す。
-#[derive(Clone)]
 pub(crate) struct VoiceModelHeader {
     pub(crate) manifest: Manifest,
     /// メタ情報。
@@ -67,27 +303,32 @@ pub(crate) struct VoiceModelHeader {
 
 impl VoiceModelHeader {
     fn new(manifest: Manifest, metas: &[u8], path: &Path) -> LoadModelResult<Self> {
-        let metas =
-            serde_json::from_slice::<VoiceModelMeta>(metas).map_err(|source| LoadModelError {
-                path: path.to_owned(),
-                context: LoadModelErrorKind::InvalidModelFormat,
-                source: Some(
-                    anyhow::Error::from(source)
-                        .context(format!("{}が不正です", manifest.metas_filename())),
-                ),
-            })?;
+        let error = |context, source| LoadModelError {
+            path: path.to_owned(),
+            context,
+            source: Some(source),
+        };
+
+        let metas = serde_json::from_slice::<VoiceModelMeta>(metas).map_err(|source| {
+            error(
+                LoadModelErrorKind::InvalidModelFormat,
+                anyhow::Error::from(source)
+                    .context(format!("{}が不正です", manifest.metas_filename())),
+            )
+        })?;
 
         manifest
             .domains()
             .check_acceptable(&metas)
-            .map_err(|style_type| LoadModelError {
-                path: path.to_owned(),
-                context: LoadModelErrorKind::InvalidModelFormat,
-                source: Some(anyhow!(
-                    "{metas_filename}には`{style_type}`のスタイルが存在しますが、manifest.jsonでの\
-                     対応がありません",
-                    metas_filename = manifest.metas_filename(),
-                )),
+            .map_err(|style_type| {
+                error(
+                    LoadModelErrorKind::InvalidModelFormat,
+                    anyhow!(
+                        "{metas_filename}には`{style_type}`のスタイルが存在しますが、manifest.json\
+                         での対応がありません",
+                        metas_filename = manifest.metas_filename(),
+                    ),
+                )
             })?;
 
         Ok(Self {
@@ -98,7 +339,7 @@ impl VoiceModelHeader {
     }
 }
 
-impl ManifestDomains {
+impl InferenceDomainMap<ManifestDomains> {
     /// manifestとして対応していない`StyleType`に対してエラーを発する。
     ///
     /// `Status`はこのバリデーションを信頼し、`InferenceDomain`の不足時にパニックする。
@@ -141,360 +382,142 @@ impl ManifestDomains {
 }
 
 pub(crate) mod blocking {
-    use std::{
-        io::{self, Cursor},
-        path::Path,
-    };
+    use std::path::Path;
 
     use easy_ext::ext;
-    use enum_map::EnumMap;
-    use ouroboros::self_referencing;
-    use rayon::iter::{IntoParallelIterator as _, ParallelIterator as _};
-    use serde::de::DeserializeOwned;
     use uuid::Uuid;
 
     use crate::{
-        error::{LoadModelError, LoadModelErrorKind, LoadModelResult},
-        infer::domains::InferenceDomainMap,
-        manifest::{Manifest, TalkManifest},
-        VoiceModelMeta,
+        asyncs::SingleTasked, error::LoadModelResult, future::FutureExt as _,
+        infer::domains::InferenceDomainMap, VoiceModelMeta,
     };
 
-    use super::{ModelBytesWithInnerVoiceIdsByDomain, VoiceModelHeader, VoiceModelId};
+    use super::{Inner, ModelBytesWithInnerVoiceIdsByDomain, VoiceModelHeader, VoiceModelId};
 
     /// 音声モデル。
     ///
     /// VVMファイルと対応する。
-    #[derive(Clone)]
-    pub struct VoiceModel {
-        header: VoiceModelHeader,
-    }
+    pub struct VoiceModel(Inner<SingleTasked>);
 
     impl self::VoiceModel {
         pub(crate) fn read_inference_models(
             &self,
         ) -> LoadModelResult<InferenceDomainMap<ModelBytesWithInnerVoiceIdsByDomain>> {
-            let reader = BlockingVvmEntryReader::open(&self.header.path)?;
-
-            let talk = self
-                .header
-                .manifest
-                .domains()
-                .talk
-                .as_ref()
-                .map(
-                    |TalkManifest {
-                         predict_duration_filename,
-                         predict_intonation_filename,
-                         decode_filename,
-                         style_id_to_inner_voice_id,
-                     }| {
-                        let model_bytes = [
-                            predict_duration_filename,
-                            predict_intonation_filename,
-                            decode_filename,
-                        ]
-                        .into_par_iter()
-                        .map(|filename| reader.read_vvm_entry(filename))
-                        .collect::<std::result::Result<Vec<_>, _>>()?
-                        .try_into()
-                        .unwrap_or_else(|_| panic!("should be same length"));
-
-                        let model_bytes = EnumMap::from_array(model_bytes);
-
-                        Ok((style_id_to_inner_voice_id.clone(), model_bytes))
-                    },
-                )
-                .transpose()?;
-
-            Ok(InferenceDomainMap { talk })
+            self.0.read_inference_models().block_on()
         }
 
         /// VVMファイルから`VoiceModel`をコンストラクトする。
         pub fn from_path(path: impl AsRef<Path>) -> crate::Result<Self> {
-            let path = path.as_ref();
-            let reader = BlockingVvmEntryReader::open(path)?;
-            let manifest = reader.read_vvm_json::<Manifest>("manifest.json")?;
-            let metas = &reader.read_vvm_entry(manifest.metas_filename())?;
-            let header = VoiceModelHeader::new(manifest, metas, path)?;
-            Ok(Self { header })
+            Inner::from_path(path).block_on().map(Self)
         }
 
         /// ID。
         pub fn id(&self) -> VoiceModelId {
-            self.header.manifest.id
+            self.0.id()
         }
 
         /// メタ情報。
         pub fn metas(&self) -> &VoiceModelMeta {
-            &self.header.metas
+            self.0.metas()
         }
 
         pub(crate) fn header(&self) -> &VoiceModelHeader {
-            &self.header
-        }
-    }
-
-    #[self_referencing]
-    struct BlockingVvmEntryReader {
-        path: std::path::PathBuf,
-        zip: Vec<u8>,
-        #[covariant]
-        #[borrows(zip)]
-        reader: zip::ZipArchive<Cursor<&'this [u8]>>,
-    }
-
-    impl BlockingVvmEntryReader {
-        fn open(path: &Path) -> LoadModelResult<Self> {
-            (|| {
-                let zip = std::fs::read(path)?;
-                Self::try_new(path.to_owned(), zip, |zip| {
-                    zip::ZipArchive::new(Cursor::new(zip))
-                })
-            })()
-            .map_err(|source| LoadModelError {
-                path: path.to_owned(),
-                context: LoadModelErrorKind::OpenZipFile,
-                source: Some(source.into()),
-            })
-        }
-
-        // FIXME: manifest.json専用になっているので、そういう関数名にする
-        fn read_vvm_json<T: DeserializeOwned>(&self, filename: &str) -> LoadModelResult<T> {
-            let bytes = &self.read_vvm_entry(filename)?;
-            serde_json::from_slice(bytes).map_err(|source| LoadModelError {
-                path: self.borrow_path().clone(),
-                context: LoadModelErrorKind::InvalidModelFormat,
-                source: Some(anyhow::Error::from(source).context(format!("{filename}が不正です"))),
-            })
-        }
-
-        fn read_vvm_entry(&self, filename: &str) -> LoadModelResult<Vec<u8>> {
-            (|| {
-                let mut reader = self.borrow_reader().clone();
-                let mut entry = reader.by_name(filename)?;
-                let mut buf = Vec::with_capacity(entry.size() as _);
-                io::copy(&mut entry, &mut buf)?;
-                Ok(buf)
-            })()
-            .map_err(|source| LoadModelError {
-                path: self.borrow_path().clone(),
-                context: LoadModelErrorKind::OpenZipFile,
-                source: Some(source),
-            })
+            self.0.header()
         }
     }
 
     #[ext(IdRef)]
     pub impl VoiceModel {
         fn id_ref(&self) -> &Uuid {
-            &self.header.manifest.id.0
+            &self.header().manifest.id.0
         }
     }
 }
 
 pub(crate) mod tokio {
-    use std::{collections::HashMap, io, path::Path};
-
-    use derive_new::new;
-    use enum_map::EnumMap;
-    use futures::future::{join3, OptionFuture};
-    use serde::de::DeserializeOwned;
+    use std::path::Path;
 
     use crate::{
-        error::{LoadModelError, LoadModelErrorKind, LoadModelResult},
-        infer::domains::InferenceDomainMap,
-        manifest::{Manifest, TalkManifest},
+        asyncs::BlockingThreadPool, error::LoadModelResult, infer::domains::InferenceDomainMap,
         Result, VoiceModelMeta,
     };
 
-    use super::{ModelBytesWithInnerVoiceIdsByDomain, VoiceModelHeader, VoiceModelId};
+    use super::{Inner, ModelBytesWithInnerVoiceIdsByDomain, VoiceModelHeader, VoiceModelId};
 
     /// 音声モデル。
     ///
     /// VVMファイルと対応する。
-    #[derive(Clone)]
-    pub struct VoiceModel {
-        header: VoiceModelHeader,
-    }
+    pub struct VoiceModel(Inner<BlockingThreadPool>);
 
     impl self::VoiceModel {
         pub(crate) async fn read_inference_models(
             &self,
         ) -> LoadModelResult<InferenceDomainMap<ModelBytesWithInnerVoiceIdsByDomain>> {
-            let reader = AsyncVvmEntryReader::open(&self.header.path).await?;
-
-            let talk = OptionFuture::from(self.header.manifest.domains().talk.as_ref().map(
-                |TalkManifest {
-                     predict_duration_filename,
-                     predict_intonation_filename,
-                     decode_filename,
-                     style_id_to_inner_voice_id,
-                 }| async {
-                    let (
-                        decode_model_result,
-                        predict_duration_model_result,
-                        predict_intonation_model_result,
-                    ) = join3(
-                        reader.read_vvm_entry(decode_filename),
-                        reader.read_vvm_entry(predict_duration_filename),
-                        reader.read_vvm_entry(predict_intonation_filename),
-                    )
-                    .await;
-
-                    let model_bytes = EnumMap::from_array([
-                        predict_duration_model_result?,
-                        predict_intonation_model_result?,
-                        decode_model_result?,
-                    ]);
-
-                    Ok((style_id_to_inner_voice_id.clone(), model_bytes))
-                },
-            ))
-            .await
-            .transpose()?;
-
-            Ok(InferenceDomainMap { talk })
+            self.0.read_inference_models().await
         }
         /// VVMファイルから`VoiceModel`をコンストラクトする。
         pub async fn from_path(path: impl AsRef<Path>) -> Result<Self> {
-            let reader = AsyncVvmEntryReader::open(path.as_ref()).await?;
-            let manifest = reader.read_vvm_json::<Manifest>("manifest.json").await?;
-            let metas = &reader.read_vvm_entry(manifest.metas_filename()).await?;
-            let header = VoiceModelHeader::new(manifest, metas, path.as_ref())?;
-            Ok(Self { header })
+            Inner::from_path(path).await.map(Self)
         }
 
         /// ID。
         pub fn id(&self) -> VoiceModelId {
-            self.header.manifest.id
+            self.0.id()
         }
 
         /// メタ情報。
         pub fn metas(&self) -> &VoiceModelMeta {
-            &self.header.metas
+            self.0.metas()
         }
 
         pub(crate) fn header(&self) -> &VoiceModelHeader {
-            &self.header
-        }
-    }
-
-    struct AsyncVvmEntry {
-        index: usize,
-        entry: async_zip::ZipEntry,
-    }
-
-    #[derive(new)]
-    struct AsyncVvmEntryReader<'a> {
-        path: &'a Path,
-        reader: async_zip::base::read::mem::ZipFileReader,
-        entry_map: HashMap<String, AsyncVvmEntry>,
-    }
-
-    impl<'a> AsyncVvmEntryReader<'a> {
-        async fn open(path: &'a Path) -> LoadModelResult<Self> {
-            let reader = async {
-                let file = fs_err::tokio::read(path).await?;
-                async_zip::base::read::mem::ZipFileReader::new(file).await
-            }
-            .await
-            .map_err(|source| LoadModelError {
-                path: path.to_owned(),
-                context: LoadModelErrorKind::OpenZipFile,
-                source: Some(source.into()),
-            })?;
-            let entry_map: HashMap<_, _> = reader
-                .file()
-                .entries()
-                .iter()
-                .flat_map(|e| {
-                    // 非UTF-8のファイルを利用することはないため、無視する
-                    let filename = e.filename().as_str().ok()?;
-                    (!e.dir().ok()?).then_some(())?;
-                    Some((filename.to_owned(), (**e).clone()))
-                })
-                .enumerate()
-                .map(|(i, (filename, entry))| (filename, AsyncVvmEntry { index: i, entry }))
-                .collect();
-            Ok(AsyncVvmEntryReader::new(path, reader, entry_map))
-        }
-        // FIXME: manifest.json専用になっているので、そういう関数名にする
-        async fn read_vvm_json<T: DeserializeOwned>(&self, filename: &str) -> LoadModelResult<T> {
-            let bytes = self.read_vvm_entry(filename).await?;
-            serde_json::from_slice(&bytes).map_err(|source| LoadModelError {
-                path: self.path.to_owned(),
-                context: LoadModelErrorKind::InvalidModelFormat,
-                source: Some(anyhow::Error::from(source).context(format!("{filename}が不正です"))),
-            })
-        }
-
-        async fn read_vvm_entry(&self, filename: &str) -> LoadModelResult<Vec<u8>> {
-            async {
-                let me = self
-                    .entry_map
-                    .get(filename)
-                    .ok_or_else(|| io::Error::from(io::ErrorKind::NotFound))?;
-                let mut manifest_reader = self.reader.reader_with_entry(me.index).await?;
-                let mut buf = Vec::with_capacity(me.entry.uncompressed_size() as usize);
-                manifest_reader.read_to_end_checked(&mut buf).await?;
-                Ok::<_, anyhow::Error>(buf)
-            }
-            .await
-            .map_err(|source| LoadModelError {
-                path: self.path.to_owned(),
-                context: LoadModelErrorKind::ReadZipEntry {
-                    filename: filename.to_owned(),
-                },
-                source: Some(source),
-            })
+            self.0.header()
         }
     }
 }
 
 #[cfg(test)]
 mod tests {
-    use std::sync::LazyLock;
-
     use rstest::{fixture, rstest};
     use serde_json::json;
 
     use crate::{
+        infer::domains::InferenceDomainMap,
         manifest::{ManifestDomains, TalkManifest},
         SpeakerMeta, StyleType,
     };
 
     #[rstest]
     #[case(
-        &ManifestDomains {
+        &InferenceDomainMap {
             talk: None,
         },
         &[],
         Ok(())
     )]
     #[case(
-        &ManifestDomains {
-            talk: Some(TALK_MANIFEST.clone()),
+        &InferenceDomainMap {
+            talk: Some(TalkManifest::default()),
         },
         &[speaker(&[StyleType::Talk])],
         Ok(())
     )]
     #[case(
-        &ManifestDomains {
-            talk: Some(TALK_MANIFEST.clone()),
+        &InferenceDomainMap {
+            talk: Some(TalkManifest::default()),
         },
         &[speaker(&[StyleType::Talk, StyleType::Sing])],
         Ok(())
     )]
     #[case(
-        &ManifestDomains {
+        &InferenceDomainMap {
             talk: None,
         },
         &[speaker(&[StyleType::Talk])],
         Err(())
     )]
     fn check_acceptable_works(
-        #[case] manifest: &ManifestDomains,
+        #[case] manifest: &InferenceDomainMap<ManifestDomains>,
         #[case] metas: &[SpeakerMeta],
         #[case] expected: std::result::Result<(), ()>,
     ) {
@@ -502,13 +525,7 @@ mod tests {
         assert_eq!(expected, actual);
     }
 
-    static TALK_MANIFEST: LazyLock<TalkManifest> = LazyLock::new(|| TalkManifest {
-        predict_duration_filename: "".to_owned(),
-        predict_intonation_filename: "".to_owned(),
-        decode_filename: "".to_owned(),
-        style_id_to_inner_voice_id: Default::default(),
-    });
-
+    // FIXME: Isn't this unused?
     #[fixture]
     fn talk_speaker() -> SpeakerMeta {
         serde_json::from_value(json!({
diff --git a/crates/voicevox_core_c_api/Cargo.toml b/crates/voicevox_core_c_api/Cargo.toml
index 996367a5f..1b74bfdf5 100644
--- a/crates/voicevox_core_c_api/Cargo.toml
+++ b/crates/voicevox_core_c_api/Cargo.toml
@@ -26,7 +26,6 @@ const_format.workspace = true
 cstr.workspace = true
 derive-getters.workspace = true
 easy-ext.workspace = true
-futures.workspace = true
 itertools.workspace = true
 libc.workspace = true
 process_path.workspace = true
diff --git a/crates/voicevox_core_c_api/src/compatible_engine.rs b/crates/voicevox_core_c_api/src/compatible_engine.rs
index 68b836f2f..9fdff0c92 100644
--- a/crates/voicevox_core_c_api/src/compatible_engine.rs
+++ b/crates/voicevox_core_c_api/src/compatible_engine.rs
@@ -2,7 +2,7 @@ use std::{
     collections::BTreeMap,
     env,
     ffi::{c_char, CString},
-    sync::{LazyLock, Mutex, MutexGuard},
+    sync::{Arc, LazyLock, Mutex, MutexGuard},
 };
 
 use libc::c_int;
@@ -35,10 +35,10 @@ static ONNXRUNTIME: LazyLock<&'static voicevox_core::blocking::Onnxruntime> = La
 });
 
 struct VoiceModelSet {
-    all_vvms: Vec<voicevox_core::blocking::VoiceModel>,
+    all_vvms: Vec<Arc<voicevox_core::blocking::VoiceModel>>,
     all_metas_json: CString,
     style_model_map: BTreeMap<StyleId, VoiceModelId>,
-    model_map: BTreeMap<VoiceModelId, voicevox_core::blocking::VoiceModel>,
+    model_map: BTreeMap<VoiceModelId, Arc<voicevox_core::blocking::VoiceModel>>,
 }
 
 static VOICE_MODEL_SET: LazyLock<VoiceModelSet> = LazyLock::new(|| {
@@ -66,7 +66,7 @@ static VOICE_MODEL_SET: LazyLock<VoiceModelSet> = LazyLock::new(|| {
     /// # Panics
     ///
     /// 失敗したらパニックする
-    fn get_all_models() -> Vec<voicevox_core::blocking::VoiceModel> {
+    fn get_all_models() -> Vec<Arc<voicevox_core::blocking::VoiceModel>> {
         let root_dir = if let Some(root_dir) = env::var_os(ROOT_DIR_ENV_NAME) {
             root_dir.into()
         } else {
@@ -84,7 +84,7 @@ static VOICE_MODEL_SET: LazyLock<VoiceModelSet> = LazyLock::new(|| {
             .unwrap_or_else(|e| panic!("{}が読めませんでした: {e}", root_dir.display()))
             .into_iter()
             .filter(|entry| entry.path().extension().map_or(false, |ext| ext == "vvm"))
-            .map(|entry| voicevox_core::blocking::VoiceModel::from_path(entry.path()))
+            .map(|entry| voicevox_core::blocking::VoiceModel::from_path(entry.path()).map(Arc::new))
             .collect::<std::result::Result<_, _>>()
             .unwrap()
     }
diff --git a/crates/voicevox_core_macros/src/extract.rs b/crates/voicevox_core_macros/src/extract.rs
new file mode 100644
index 000000000..e9b480630
--- /dev/null
+++ b/crates/voicevox_core_macros/src/extract.rs
@@ -0,0 +1,31 @@
+use syn::{
+    spanned::Spanned as _, Attribute, Data, DataEnum, DataStruct, DataUnion, Field, Fields, Type,
+};
+
+pub(crate) fn struct_fields(data: &Data) -> syn::Result<Vec<(&[Attribute], &syn::Ident, &Type)>> {
+    let fields = match data {
+        Data::Struct(DataStruct {
+            fields: Fields::Named(fields),
+            ..
+        }) => fields,
+        Data::Struct(DataStruct { fields, .. }) => {
+            return Err(syn::Error::new(fields.span(), "expect named fields"));
+        }
+        Data::Enum(DataEnum { enum_token, .. }) => {
+            return Err(syn::Error::new(enum_token.span(), "expected a struct"));
+        }
+        Data::Union(DataUnion { union_token, .. }) => {
+            return Err(syn::Error::new(union_token.span(), "expected a struct"));
+        }
+    };
+
+    Ok(fields
+        .named
+        .iter()
+        .map(
+            |Field {
+                 attrs, ident, ty, ..
+             }| (&**attrs, ident.as_ref().expect("should be named"), ty),
+        )
+        .collect())
+}
diff --git a/crates/voicevox_core_macros/src/inference_domain.rs b/crates/voicevox_core_macros/src/inference_domain.rs
index d24a20ab1..f959982e4 100644
--- a/crates/voicevox_core_macros/src/inference_domain.rs
+++ b/crates/voicevox_core_macros/src/inference_domain.rs
@@ -3,8 +3,8 @@ use quote::quote;
 use syn::{
     parse::{Parse, ParseStream},
     spanned::Spanned as _,
-    Attribute, Data, DataEnum, DataStruct, DataUnion, DeriveInput, Field, Fields, Generics,
-    ItemType, Type, Variant,
+    Attribute, Data, DataEnum, DataStruct, DataUnion, DeriveInput, Fields, Generics, ItemType,
+    Type, Variant,
 };
 
 pub(crate) fn derive_inference_operation(
@@ -178,11 +178,11 @@ pub(crate) fn derive_inference_input_signature(
 
     let (impl_generics, ty_generics, where_clause) = generics.split_for_impl();
 
-    let fields = struct_fields(data)?;
+    let fields = crate::extract::struct_fields(data)?;
 
     let param_infos = fields
         .iter()
-        .map(|(name, ty)| {
+        .map(|(_, name, ty)| {
             let name = name.to_string();
             quote! {
                 crate::infer::ParamInfo {
@@ -194,7 +194,7 @@ pub(crate) fn derive_inference_input_signature(
         })
         .collect::<proc_macro2::TokenStream>();
 
-    let field_names = fields.iter().map(|(name, _)| name);
+    let field_names = fields.iter().map(|(_, name, _)| name);
 
     return Ok(quote! {
         impl #impl_generics crate::infer::InferenceInputSignature for #ident #ty_generics
@@ -277,12 +277,12 @@ pub(crate) fn derive_inference_output_signature(
 
     let (impl_generics, ty_generics, where_clause) = generics.split_for_impl();
 
-    let fields = struct_fields(data)?;
+    let fields = crate::extract::struct_fields(data)?;
     let num_fields = fields.len();
 
     let param_infos = fields
         .iter()
-        .map(|(name, ty)| {
+        .map(|(_, name, ty)| {
             let name = name.to_string();
             quote! {
                 crate::infer::ParamInfo {
@@ -294,7 +294,7 @@ pub(crate) fn derive_inference_output_signature(
         })
         .collect::<proc_macro2::TokenStream>();
 
-    let field_names = fields.iter().map(|(name, _)| name);
+    let field_names = fields.iter().map(|(_, name, _)| name);
 
     Ok(quote! {
         impl #impl_generics crate::infer::InferenceOutputSignature for #ident #ty_generics
@@ -349,30 +349,6 @@ pub(crate) fn derive_inference_output_signature(
     })
 }
 
-fn struct_fields(data: &Data) -> syn::Result<Vec<(&syn::Ident, &Type)>> {
-    let fields = match data {
-        Data::Struct(DataStruct {
-            fields: Fields::Named(fields),
-            ..
-        }) => fields,
-        Data::Struct(DataStruct { fields, .. }) => {
-            return Err(syn::Error::new(fields.span(), "expect named fields"));
-        }
-        Data::Enum(DataEnum { enum_token, .. }) => {
-            return Err(syn::Error::new(enum_token.span(), "expected a struct"));
-        }
-        Data::Union(DataUnion { union_token, .. }) => {
-            return Err(syn::Error::new(union_token.span(), "expected a struct"));
-        }
-    };
-
-    Ok(fields
-        .named
-        .iter()
-        .map(|Field { ident, ty, .. }| (ident.as_ref().expect("should be named"), ty))
-        .collect())
-}
-
 fn unit_enum_variants(data: &Data) -> syn::Result<Vec<(&[Attribute], &syn::Ident)>> {
     let variants = match data {
         Data::Struct(DataStruct { struct_token, .. }) => {
diff --git a/crates/voicevox_core_macros/src/lib.rs b/crates/voicevox_core_macros/src/lib.rs
index 98a2fdc5c..ff0b83037 100644
--- a/crates/voicevox_core_macros/src/lib.rs
+++ b/crates/voicevox_core_macros/src/lib.rs
@@ -1,6 +1,8 @@
 #![warn(rust_2018_idioms)]
 
+mod extract;
 mod inference_domain;
+mod manifest;
 
 use syn::parse_macro_input;
 
@@ -100,6 +102,35 @@ pub fn derive_inference_output_signature(
     from_syn(inference_domain::derive_inference_output_signature(input))
 }
 
+/// Derives an implementation of `std::ops::Index` through which the struct's fields can be obtained.
+///
+/// # Example
+///
+/// ```
+/// use macros::IndexForFields;
+///
+/// #[derive(IndexForFields)]
+/// #[index_for_fields(TalkOperation)]
+/// pub(crate) struct TalkManifest {
+///     #[index_for_fields(TalkOperation::PredictDuration)]
+///     pub(crate) predict_duration_filename: Arc<str>,
+///
+///     #[index_for_fields(TalkOperation::PredictIntonation)]
+///     pub(crate) predict_intonation_filename: Arc<str>,
+///
+///     #[index_for_fields(TalkOperation::Decode)]
+///     pub(crate) decode_filename: Arc<str>,
+///
+///     // …
+/// }
+/// ```
+#[cfg(not(doctest))]
+#[proc_macro_derive(IndexForFields, attributes(index_for_fields))]
+pub fn derive_index_for_fields(input: proc_macro::TokenStream) -> proc_macro::TokenStream {
+    let input = &parse_macro_input!(input);
+    from_syn(manifest::derive_index_for_fields(input))
+}
+
 fn from_syn(result: syn::Result<proc_macro2::TokenStream>) -> proc_macro::TokenStream {
     result.unwrap_or_else(|e| e.to_compile_error()).into()
 }
diff --git a/crates/voicevox_core_macros/src/manifest.rs b/crates/voicevox_core_macros/src/manifest.rs
new file mode 100644
index 000000000..9560b1fd4
--- /dev/null
+++ b/crates/voicevox_core_macros/src/manifest.rs
@@ -0,0 +1,88 @@
+use proc_macro2::Span;
+use quote::quote;
+use syn::{Attribute, DeriveInput, Expr, Meta, Type};
+
+/// Generates an `impl ::std::ops::Index<Idx>` for the struct described by `input`.
+///
+/// `Idx` is the type given in the struct-level `#[index_for_fields(…)]` attribute. Each field
+/// that has its own `#[index_for_fields(…)]` yields one `match` arm from the attribute's
+/// argument to a reference to that field; fields without the attribute are skipped. `Output`
+/// is the declared type of the first field that has the attribute.
+///
+/// # Errors
+///
+/// Returns a [`syn::Error`] if the struct-level attribute is missing or is not a type, if
+/// `input` is not a struct with named fields, if a field-level argument is not an expression,
+/// or if no field has the attribute.
+pub(crate) fn derive_index_for_fields(
+    input: &DeriveInput,
+) -> syn::Result<proc_macro2::TokenStream> {
+    const ATTR_NAME: &str = "index_for_fields";
+
+    let DeriveInput {
+        attrs,
+        ident,
+        generics,
+        data,
+        ..
+    } = input;
+
+    // The index type comes from the first list-style `#[index_for_fields(…)]` on the struct.
+    let idx = attrs
+        .iter()
+        .find_map(|Attribute { meta, .. }| match meta {
+            Meta::List(list) if list.path.is_ident(ATTR_NAME) => Some(list),
+            _ => None,
+        })
+        .ok_or_else(|| {
+            syn::Error::new(
+                Span::call_site(),
+                format!("missing `#[{ATTR_NAME}(…)]` in the struct itself"),
+            )
+        })?
+        .parse_args::<Type>()?;
+
+    let (impl_generics, ty_generics, where_clause) = generics.split_for_impl();
+
+    // `(key, field name, field type)` for each field that has the attribute.
+    let targets = crate::extract::struct_fields(data)?
+        .into_iter()
+        .filter_map(|(attrs, name, output)| {
+            let meta = attrs.iter().find_map(|Attribute { meta, .. }| match meta {
+                Meta::List(meta) if meta.path.is_ident(ATTR_NAME) => Some(meta),
+                _ => None,
+            })?;
+            Some((meta, name, output))
+        })
+        .map(|(meta, name, output)| {
+            let key = meta.parse_args::<Expr>()?;
+            Ok((key, name, output))
+        })
+        .collect::<syn::Result<Vec<_>>>()?;
+
+    // The type of the first annotated field serves as `Output`.
+    let (_, _, output) = targets.first().ok_or_else(|| {
+        syn::Error::new(
+            Span::call_site(),
+            format!("no fields have `#[{ATTR_NAME}(…)]`"),
+        )
+    })?;
+
+    // Building an arm cannot fail, so no `syn::Result` is involved here.
+    let arms = targets
+        .iter()
+        .map(|(key, name, _)| quote!(#key => &self.#name))
+        .collect::<Vec<_>>();
+
+    Ok(quote! {
+        impl #impl_generics ::std::ops::Index<#idx> for #ident #ty_generics #where_clause {
+            type Output = #output;
+
+            fn index(&self, index: #idx) -> &Self::Output {
+                match index {
+                    #(#arms),*
+                }
+            }
+        }
+    })
+}
diff --git a/crates/voicevox_core_python_api/src/lib.rs b/crates/voicevox_core_python_api/src/lib.rs
index 9eabae6a3..b4aa65c9b 100644
--- a/crates/voicevox_core_python_api/src/lib.rs
+++ b/crates/voicevox_core_python_api/src/lib.rs
@@ -160,14 +160,16 @@ mod blocking {
     #[pyclass]
     #[derive(Clone)]
     pub(crate) struct VoiceModel {
-        model: voicevox_core::blocking::VoiceModel,
+        model: Arc<voicevox_core::blocking::VoiceModel>,
     }
 
     #[pymethods]
     impl VoiceModel {
         #[staticmethod]
         fn from_path(py: Python<'_>, path: PathBuf) -> PyResult<Self> {
-            let model = voicevox_core::blocking::VoiceModel::from_path(path).into_py_result(py)?;
+            let model = voicevox_core::blocking::VoiceModel::from_path(path)
+                .into_py_result(py)?
+                .into();
             Ok(Self { model })
         }
 
@@ -660,7 +662,7 @@ mod asyncio {
     #[pyclass]
     #[derive(Clone)]
     pub(crate) struct VoiceModel {
-        model: voicevox_core::tokio::VoiceModel,
+        model: Arc<voicevox_core::tokio::VoiceModel>,
     }
 
     #[pymethods]
@@ -669,7 +671,7 @@ mod asyncio {
         fn from_path(py: Python<'_>, path: PathBuf) -> PyResult<&PyAny> {
             pyo3_asyncio::tokio::future_into_py(py, async move {
                 let model = voicevox_core::tokio::VoiceModel::from_path(path).await;
-                let model = Python::with_gil(|py| model.into_py_result(py))?;
+                let model = Python::with_gil(|py| model.into_py_result(py))?.into();
                 Ok(Self { model })
             })
         }

From b8118b9534f09549f7ae33ea69424b166d09e047 Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Sat, 14 Sep 2024 02:52:49 +0900
Subject: [PATCH 28/36] =?UTF-8?q?change:=20Rust=20API=E3=81=AE=E8=84=B1Tok?=
 =?UTF-8?q?io=E3=81=A8=E3=80=81`voicevox=5Fcore::`{`tokio`=E2=86=92`nonblo?=
 =?UTF-8?q?cking`}=20(#831)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Tokioに依存したプログラムは、async-stdやsmolで使うことはできない。一方、
現在のVOICEVOX CORE Rust APIのTokio依存部分は
`tokio::task::spawn_blocking`のみである。そのため
`tokio::task::spawn_blocking`を、同等の機能を持つblockingクレートのも
のに置き換えることでRust APIの"脱Tokio"を行う。

https://docs.rs/crate/blocking

またこの"脱Tokio"に伴い、Rust APIの`voicevox_core::tokio`を
`voicevox_core::nonblocking`にリネームする。

Python APIではpyo3-asyncioが現在Tokio版かasync-std版しかない状態なので、
Tokioに依存した状態のままにしてある。またtest_utilやdownloaderではこれま
で通りreqwestに依存する。

また将来`Synthesizer`や`OpenJtalk`なども`trait Async`をベースにした設計
にすることを考えているが、本PRではTODOコメントを残すのみにしてある。

https://github.com/VOICEVOX/voicevox_core/pull/830#discussion_r1750081919
---
 Cargo.lock                                    |  22 +++
 Cargo.toml                                    |   2 +
 crates/voicevox_core/Cargo.toml               |   5 +-
 .../src/__internal/doctest_fixtures.rs        |  12 +-
 crates/voicevox_core/src/asyncs.rs            |   6 +-
 crates/voicevox_core/src/devices.rs           |   4 +-
 .../src/engine/full_context_label.rs          |   4 +-
 crates/voicevox_core/src/engine/open_jtalk.rs |  28 +++-
 .../src/infer/runtimes/onnxruntime.rs         |  38 +++--
 crates/voicevox_core/src/lib.rs               |   2 +-
 crates/voicevox_core/src/nonblocking.rs       |  25 ++++
 crates/voicevox_core/src/status.rs            |   4 +-
 crates/voicevox_core/src/synthesizer.rs       | 138 ++++++++++--------
 crates/voicevox_core/src/task.rs              |  14 +-
 crates/voicevox_core/src/test_util.rs         |   2 +-
 crates/voicevox_core/src/tokio.rs             |  13 --
 crates/voicevox_core/src/user_dict/dict.rs    |  22 ++-
 crates/voicevox_core/src/voice_model.rs       |   9 +-
 crates/voicevox_core_python_api/src/lib.rs    |  48 +++---
 19 files changed, 257 insertions(+), 141 deletions(-)
 create mode 100644 crates/voicevox_core/src/nonblocking.rs
 delete mode 100644 crates/voicevox_core/src/tokio.rs

diff --git a/Cargo.lock b/Cargo.lock
index 53117ce5c..defbbe093 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -2767,6 +2767,26 @@ dependencies = [
  "time",
 ]
 
+[[package]]
+name = "pollster"
+version = "0.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "22686f4785f02a4fcc856d3b3bb19bf6c8160d103f7a99cc258bddd0251dc7f2"
+dependencies = [
+ "pollster-macro",
+]
+
+[[package]]
+name = "pollster-macro"
+version = "0.1.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ea78f0ef4193055a4b09814ce6bcb572ad1174d6023e2f00a9ea1a798d18d301"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 1.0.102",
+]
+
 [[package]]
 name = "portable-atomic"
 version = "0.3.19"
@@ -4345,6 +4365,7 @@ dependencies = [
  "anyhow",
  "async-fs",
  "async_zip",
+ "blocking",
  "camino",
  "const_format",
  "derive-getters",
@@ -4366,6 +4387,7 @@ dependencies = [
  "ndarray",
  "open_jtalk",
  "ouroboros",
+ "pollster",
  "pretty_assertions",
  "ref-cast",
  "regex",
diff --git a/Cargo.toml b/Cargo.toml
index 3a2fffb01..922c7ac09 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -12,6 +12,7 @@ async-fs = "2.1.2"
 async_zip = "=0.0.16"
 bindgen = "0.69.4"
 binstall-tar = "0.4.39"
+blocking = "1.6.1"
 bytes = "1.1.0"
 camino = "1.1.6"
 cargo_metadata = "0.18.1"
@@ -57,6 +58,7 @@ octocrab = { version = "0.19.0", default-features = false }
 once_cell = "1.19.0"
 ouroboros = "0.18.0"
 parse-display = "0.8.2"
+pollster = "0.3.0"
 pretty_assertions = "1.3.0"
 proc-macro2 = "1.0.69"
 pyo3 = "0.20.3"
diff --git a/crates/voicevox_core/Cargo.toml b/crates/voicevox_core/Cargo.toml
index 74feebb4b..e05b04c79 100644
--- a/crates/voicevox_core/Cargo.toml
+++ b/crates/voicevox_core/Cargo.toml
@@ -18,6 +18,7 @@ link-onnxruntime = []
 anyhow.workspace = true
 async-fs.workspace = true
 async_zip = { workspace = true, features = ["deflate"] }
+blocking.workspace = true
 camino.workspace = true
 const_format.workspace = true
 derive-getters.workspace = true
@@ -27,7 +28,7 @@ duplicate.workspace = true
 easy-ext.workspace = true
 educe.workspace = true
 enum-map.workspace = true
-fs-err = { workspace = true, features = ["tokio"] }
+fs-err.workspace = true
 futures-io.workspace = true
 futures-lite.workspace = true
 futures-util = { workspace = true, features = ["io"] }
@@ -46,7 +47,6 @@ smallvec.workspace = true
 strum = { workspace = true, features = ["derive"] }
 tempfile.workspace = true
 thiserror.workspace = true
-tokio = { workspace = true, features = ["rt"] } # FIXME: feature-gateする
 tracing.workspace = true
 uuid = { workspace = true, features = ["v4", "serde"] }
 voicevox-ort = { workspace = true, features = ["download-binaries", "__init-for-voicevox"] }
@@ -54,6 +54,7 @@ voicevox_core_macros = { path = "../voicevox_core_macros" }
 
 [dev-dependencies]
 heck.workspace = true
+pollster = { workspace = true, features = ["macro"] }
 pretty_assertions.workspace = true
 rstest.workspace = true
 rstest_reuse.workspace = true
diff --git a/crates/voicevox_core/src/__internal/doctest_fixtures.rs b/crates/voicevox_core/src/__internal/doctest_fixtures.rs
index 8f45cba73..253bb8d6f 100644
--- a/crates/voicevox_core/src/__internal/doctest_fixtures.rs
+++ b/crates/voicevox_core/src/__internal/doctest_fixtures.rs
@@ -10,23 +10,23 @@ pub async fn synthesizer_with_sample_voice_model(
         OsString,
     >,
     open_jtalk_dic_dir: impl AsRef<Utf8Path>,
-) -> anyhow::Result<crate::tokio::Synthesizer<crate::tokio::OpenJtalk>> {
-    let syntesizer = crate::tokio::Synthesizer::new(
+) -> anyhow::Result<crate::nonblocking::Synthesizer<crate::nonblocking::OpenJtalk>> {
+    let syntesizer = crate::nonblocking::Synthesizer::new(
         #[cfg(feature = "load-onnxruntime")]
-        crate::tokio::Onnxruntime::load_once()
+        crate::nonblocking::Onnxruntime::load_once()
             .filename(onnxruntime_dylib_path)
             .exec()
             .await?,
         #[cfg(feature = "link-onnxruntime")]
-        crate::tokio::Onnxruntime::init_once().await?,
-        crate::tokio::OpenJtalk::new(open_jtalk_dic_dir).await?,
+        crate::nonblocking::Onnxruntime::init_once().await?,
+        crate::nonblocking::OpenJtalk::new(open_jtalk_dic_dir).await?,
         &InitializeOptions {
             acceleration_mode: AccelerationMode::Cpu,
             ..Default::default()
         },
     )?;
 
-    let model = &crate::tokio::VoiceModel::from_path(voice_model_path).await?;
+    let model = &crate::nonblocking::VoiceModel::from_path(voice_model_path).await?;
     syntesizer.load_voice_model(model).await?;
 
     Ok(syntesizer)
diff --git a/crates/voicevox_core/src/asyncs.rs b/crates/voicevox_core/src/asyncs.rs
index 7bbabbb06..5f4d7fd21 100644
--- a/crates/voicevox_core/src/asyncs.rs
+++ b/crates/voicevox_core/src/asyncs.rs
@@ -11,8 +11,7 @@
 //! に[`SingleTasked`]を用意している。
 //!
 //! [ブロッキング版API]: crate::blocking
-//! [非同期版API]: crate::tokio
-//! [blocking]: https://docs.rs/crate/blocking
+//! [非同期版API]: crate::nonblocking
 
 use std::{
     io::{self, Read as _, Seek as _, SeekFrom},
@@ -71,8 +70,7 @@ impl Async for SingleTasked {
 ///
 /// [非同期版API]用。
 ///
-/// [blocking]: https://docs.rs/crate/blocking
-/// [非同期版API]: crate::tokio
+/// [非同期版API]: crate::nonblocking
 pub(crate) enum BlockingThreadPool {}
 
 impl Async for BlockingThreadPool {
diff --git a/crates/voicevox_core/src/devices.rs b/crates/voicevox_core/src/devices.rs
index 6c0e87d06..ebffcb360 100644
--- a/crates/voicevox_core/src/devices.rs
+++ b/crates/voicevox_core/src/devices.rs
@@ -52,9 +52,9 @@ fn test_gpu(
 /// しても`cuda`や`dml`は`true`を示しうる。
 ///
 /// ```
-/// # #[tokio::main]
+/// # #[pollster::main]
 /// # async fn main() -> anyhow::Result<()> {
-/// use voicevox_core::{tokio::Onnxruntime, SupportedDevices};
+/// use voicevox_core::{nonblocking::Onnxruntime, SupportedDevices};
 ///
 /// # voicevox_core::blocking::Onnxruntime::load_once()
 /// #     .filename(if cfg!(windows) {
diff --git a/crates/voicevox_core/src/engine/full_context_label.rs b/crates/voicevox_core/src/engine/full_context_label.rs
index 92617a8c1..dab5cbae5 100644
--- a/crates/voicevox_core/src/engine/full_context_label.rs
+++ b/crates/voicevox_core/src/engine/full_context_label.rs
@@ -425,7 +425,7 @@ mod tests {
     #[apply(label_cases)]
     #[tokio::test]
     async fn open_jtalk(text: &str, labels: &[&str], _accent_phrase: &[AccentPhrase]) {
-        let open_jtalk = crate::tokio::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
+        let open_jtalk = crate::nonblocking::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
             .await
             .unwrap();
         assert_eq!(&open_jtalk.extract_fullcontext(text).unwrap(), labels);
@@ -447,7 +447,7 @@ mod tests {
     #[apply(label_cases)]
     #[tokio::test]
     async fn extract_fullcontext(text: &str, _labels: &[&str], accent_phrase: &[AccentPhrase]) {
-        let open_jtalk = crate::tokio::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
+        let open_jtalk = crate::nonblocking::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
             .await
             .unwrap();
         assert_eq!(
diff --git a/crates/voicevox_core/src/engine/open_jtalk.rs b/crates/voicevox_core/src/engine/open_jtalk.rs
index 88d16f381..fb7f3ea59 100644
--- a/crates/voicevox_core/src/engine/open_jtalk.rs
+++ b/crates/voicevox_core/src/engine/open_jtalk.rs
@@ -1,3 +1,16 @@
+// TODO: `VoiceModel`のように、次のような設計にする。
+//
+// ```
+// pub(crate) mod blocking {
+//     pub struct OpenJtalk(Inner<SingleTasked>);
+//     // …
+// }
+// pub(crate) mod nonblocking {
+//     pub struct OpenJtalk(Inner<BlockingThreadPool>);
+//     // …
+// }
+// ```
+
 use ::open_jtalk::Text2MecabError;
 
 #[derive(thiserror::Error, Debug)]
@@ -183,12 +196,19 @@ pub(crate) mod blocking {
     }
 }
 
-pub(crate) mod tokio {
+pub(crate) mod nonblocking {
     use camino::Utf8Path;
 
     use super::FullcontextExtractor;
 
     /// テキスト解析器としてのOpen JTalk。
+    ///
+    /// # Performance
+    ///
+    /// [blocking]クレートにより動いている。詳しくは[`nonblocking`モジュールのドキュメント]を参照。
+    ///
+    /// [blocking]: https://docs.rs/crate/blocking
+    /// [`nonblocking`モジュールのドキュメント]: crate::nonblocking
     #[derive(Clone)]
     pub struct OpenJtalk(super::blocking::OpenJtalk);
 
@@ -206,7 +226,7 @@ pub(crate) mod tokio {
         /// この関数を呼び出した後にユーザー辞書を変更した場合は、再度この関数を呼ぶ必要がある。
         pub async fn use_user_dict(
             &self,
-            user_dict: &crate::tokio::UserDict,
+            user_dict: &crate::nonblocking::UserDict,
         ) -> crate::result::Result<()> {
             let inner = self.0 .0.clone();
             let words = user_dict.to_mecab_format();
@@ -325,7 +345,7 @@ mod tests {
         #[case] text: &str,
         #[case] expected: anyhow::Result<Vec<String>>,
     ) {
-        let open_jtalk = super::tokio::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
+        let open_jtalk = super::nonblocking::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
             .await
             .unwrap();
         let result = open_jtalk.extract_fullcontext(text);
@@ -339,7 +359,7 @@ mod tests {
         #[case] text: &str,
         #[case] expected: anyhow::Result<Vec<String>>,
     ) {
-        let open_jtalk = super::tokio::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
+        let open_jtalk = super::nonblocking::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
             .await
             .unwrap();
         for _ in 0..10 {
diff --git a/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs b/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs
index 7d975f7f7..91e435701 100644
--- a/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs
+++ b/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs
@@ -1,3 +1,16 @@
+// TODO: `VoiceModel`のように、次のような設計にする。
+//
+// ```
+// pub(crate) mod blocking {
+//     pub struct Onnxruntime(Inner<SingleTasked>);
+//     // …
+// }
+// pub(crate) mod nonblocking {
+//     pub struct Onnxruntime(Inner<BlockingThreadPool>);
+//     // …
+// }
+// ```
+
 use std::{fmt::Debug, vec};
 
 use anyhow::{anyhow, bail, ensure};
@@ -18,9 +31,6 @@ use super::super::{
     OutputScalarKind, OutputTensor, ParamInfo, PushInputTensor,
 };
 
-// TODO: `trait AsyncRuntime`みたいなものを作って抽象化しながら同期版と非同期版に別個の役割を
-// 持たせる
-// （なぜそうしたいかの理由の一つとしては<https://github.com/VOICEVOX/voicevox_core/issues/687>）
 impl InferenceRuntime for self::blocking::Onnxruntime {
     type Session = ort::Session;
     type RunContext<'a> = OnnxruntimeRunContext<'a>;
@@ -254,7 +264,7 @@ pub(crate) mod blocking {
     /// # Rust APIにおけるインスタンスの共有
     ///
     /// インスタンスは[voicevox-ort]側に作られる。Rustのクレートとしてこのライブラリを利用する場合、
-    /// Tokio版APIやvoicevox-ortを利用する他クレートともインスタンスが共有される。
+    /// 非同期版APIやvoicevox-ortを利用する他クレートともインスタンスが共有される。
     ///
     #[cfg_attr(feature = "load-onnxruntime", doc = "```")]
     #[cfg_attr(not(feature = "load-onnxruntime"), doc = "```compile_fail")]
@@ -268,7 +278,7 @@ pub(crate) mod blocking {
     /// #         .exec()?;
     /// # }
     /// let ort1 = voicevox_core::blocking::Onnxruntime::load_once().exec()?;
-    /// let ort2 = another_lib::tokio::Onnxruntime::get().expect("`ort1`と同一のはず");
+    /// let ort2 = another_lib::nonblocking::Onnxruntime::get().expect("`ort1`と同一のはず");
     /// assert_eq!(ptr_addr(ort1), ptr_addr(ort2));
     ///
     /// fn ptr_addr(obj: &impl Sized) -> usize {
@@ -430,7 +440,7 @@ pub(crate) mod blocking {
     }
 }
 
-pub(crate) mod tokio {
+pub(crate) mod nonblocking {
     use ref_cast::{ref_cast_custom, RefCastCustom};
 
     use crate::SupportedDevices;
@@ -448,7 +458,7 @@ pub(crate) mod tokio {
     #[cfg_attr(not(feature = "load-onnxruntime"), doc = "```compile_fail")]
     /// # use voicevox_core as another_lib;
     /// #
-    /// # #[tokio::main]
+    /// # #[pollster::main]
     /// # async fn main() -> anyhow::Result<()> {
     /// # if cfg!(windows) {
     /// #     // Windows\System32\onnxruntime.dllを回避
@@ -456,7 +466,9 @@ pub(crate) mod tokio {
     /// #         .filename(test_util::ONNXRUNTIME_DYLIB_PATH)
     /// #         .exec()?;
     /// # }
-    /// let ort1 = voicevox_core::tokio::Onnxruntime::load_once().exec().await?;
+    /// let ort1 = voicevox_core::nonblocking::Onnxruntime::load_once()
+    ///     .exec()
+    ///     .await?;
     /// let ort2 = another_lib::blocking::Onnxruntime::get().expect("`ort1`と同一のはず");
     /// assert_eq!(ptr_addr(ort1), ptr_addr(ort2));
     ///
@@ -467,7 +479,13 @@ pub(crate) mod tokio {
     /// # }
     /// ```
     ///
+    /// # Performance
+    ///
+    /// [blocking]クレートにより動いている。詳しくは[`nonblocking`モジュールのドキュメント]を参照。
+    ///
     /// [voicevox-ort]: https://github.com/VOICEVOX/ort
+    /// [blocking]: https://docs.rs/crate/blocking
+    /// [`nonblocking`モジュールのドキュメント]: crate::nonblocking
     #[derive(Debug, RefCastCustom)]
     #[repr(transparent)]
     pub struct Onnxruntime(pub(crate) super::blocking::Onnxruntime);
@@ -584,11 +602,11 @@ mod tests {
 
         assert_eq!(
             super::blocking::Onnxruntime::LIB_NAME,
-            super::tokio::Onnxruntime::LIB_NAME,
+            super::nonblocking::Onnxruntime::LIB_NAME,
         );
         assert_eq!(
             super::blocking::Onnxruntime::LIB_VERSION,
-            super::tokio::Onnxruntime::LIB_VERSION,
+            super::nonblocking::Onnxruntime::LIB_VERSION,
         );
     }
 
diff --git a/crates/voicevox_core/src/lib.rs b/crates/voicevox_core/src/lib.rs
index dad702cc6..c5ab200d7 100644
--- a/crates/voicevox_core/src/lib.rs
+++ b/crates/voicevox_core/src/lib.rs
@@ -69,7 +69,7 @@ mod voice_model;
 
 pub mod __internal;
 pub mod blocking;
-pub mod tokio;
+pub mod nonblocking;
 
 #[cfg(test)]
 mod test_util;
diff --git a/crates/voicevox_core/src/nonblocking.rs b/crates/voicevox_core/src/nonblocking.rs
new file mode 100644
index 000000000..501a44d04
--- /dev/null
+++ b/crates/voicevox_core/src/nonblocking.rs
@@ -0,0 +1,25 @@
+//! Asynchronous version of the API.
+//!
+//! # Performance
+//!
+//! These are powered by the [blocking] crate. They do not require any particular async runtime
+//! and can also be driven by, for example, [pollster].
+//!
+//! The thread pool and the executor are shared among all programs that depend on the blocking
+//! crate. The size of the thread pool can be adjusted through `$BLOCKING_MAX_THREADS`, as
+//! described in the documentation of the blocking crate.
+//!
+//! [blocking]: https://docs.rs/crate/blocking
+//! [pollster]: https://docs.rs/crate/pollster
+
+pub use crate::{
+    engine::open_jtalk::nonblocking::OpenJtalk,
+    infer::runtimes::onnxruntime::nonblocking::Onnxruntime, synthesizer::nonblocking::Synthesizer,
+    user_dict::dict::nonblocking::UserDict, voice_model::nonblocking::VoiceModel,
+};
+
+pub mod onnxruntime {
+    #[cfg(feature = "load-onnxruntime")]
+    #[cfg_attr(docsrs, doc(cfg(feature = "load-onnxruntime")))]
+    pub use crate::infer::runtimes::onnxruntime::nonblocking::LoadOnce;
+}
diff --git a/crates/voicevox_core/src/status.rs b/crates/voicevox_core/src/status.rs
index 419be52f5..5103e060e 100644
--- a/crates/voicevox_core/src/status.rs
+++ b/crates/voicevox_core/src/status.rs
@@ -408,7 +408,7 @@ mod tests {
                 talk: enum_map!(_ => InferenceSessionOptions::new(0, DeviceSpec::Cpu)),
             },
         );
-        let model = &crate::tokio::VoiceModel::sample().await.unwrap();
+        let model = &crate::nonblocking::VoiceModel::sample().await.unwrap();
         let model_contents = &model.read_inference_models().await.unwrap();
         let result = status.insert_model(model.header(), model_contents);
         assert_debug_fmt_eq!(Ok(()), result);
@@ -424,7 +424,7 @@ mod tests {
                 talk: enum_map!(_ => InferenceSessionOptions::new(0, DeviceSpec::Cpu)),
             },
         );
-        let vvm = &crate::tokio::VoiceModel::sample().await.unwrap();
+        let vvm = &crate::nonblocking::VoiceModel::sample().await.unwrap();
         let model_header = vvm.header();
         let model_contents = &vvm.read_inference_models().await.unwrap();
         assert!(
diff --git a/crates/voicevox_core/src/synthesizer.rs b/crates/voicevox_core/src/synthesizer.rs
index 3b9642c8a..7a1bb2ab8 100644
--- a/crates/voicevox_core/src/synthesizer.rs
+++ b/crates/voicevox_core/src/synthesizer.rs
@@ -1,7 +1,20 @@
-/// [`blocking::Synthesizer::synthesis`]および[`tokio::Synthesizer::synthesis`]のオプション。
+// TODO: `VoiceModel`のように、次のような設計にする。
+//
+// ```
+// pub(crate) mod blocking {
+//     pub struct Synthesizer(Inner<SingleTasked>);
+//     // …
+// }
+// pub(crate) mod nonblocking {
+//     pub struct Synthesizer(Inner<BlockingThreadPool>);
+//     // …
+// }
+// ```
+
+/// [`blocking::Synthesizer::synthesis`]および[`nonblocking::Synthesizer::synthesis`]のオプション。
 ///
 /// [`blocking::Synthesizer::synthesis`]: blocking::Synthesizer::synthesis
-/// [`tokio::Synthesizer::synthesis`]: tokio::Synthesizer::synthesis
+/// [`nonblocking::Synthesizer::synthesis`]: nonblocking::Synthesizer::synthesis
 #[derive(Clone)]
 pub struct SynthesisOptions {
     pub enable_interrogative_upspeak: bool,
@@ -21,10 +34,10 @@ impl From<&TtsOptions> for SynthesisOptions {
     }
 }
 
-/// [`blocking::Synthesizer::tts`]および[`tokio::Synthesizer::tts`]のオプション。
+/// [`blocking::Synthesizer::tts`]および[`nonblocking::Synthesizer::tts`]のオプション。
 ///
 /// [`blocking::Synthesizer::tts`]: blocking::Synthesizer::tts
-/// [`tokio::Synthesizer::tts`]: tokio::Synthesizer::tts
+/// [`nonblocking::Synthesizer::tts`]: nonblocking::Synthesizer::tts
 #[derive(Clone)]
 pub struct TtsOptions {
     pub enable_interrogative_upspeak: bool,
@@ -56,10 +69,10 @@ pub enum AccelerationMode {
     Gpu,
 }
 
-/// [`blocking::Synthesizer::new`]および[`tokio::Synthesizer::new`]のオプション。
+/// [`blocking::Synthesizer::new`]および[`nonblocking::Synthesizer::new`]のオプション。
 ///
 /// [`blocking::Synthesizer::new`]: blocking::Synthesizer::new
-/// [`tokio::Synthesizer::new`]: tokio::Synthesizer::new
+/// [`nonblocking::Synthesizer::new`]: nonblocking::Synthesizer::new
 #[derive(Default)]
 pub struct InitializeOptions {
     pub acceleration_mode: AccelerationMode,
@@ -67,7 +80,7 @@ pub struct InitializeOptions {
 }
 
 pub(crate) mod blocking {
-    // FIXME: ここのdocのコードブロックはasync版のものなので、`tokio`モジュールの方に移した上で、
+    // FIXME: ここのdocのコードブロックはasync版のものなので、`nonblocking`モジュールの方に移した上で、
     // (ブロッキング版をpublic APIにするならの話ではあるが)ブロッキング版はブロッキング版でコード例
     // を用意する
 
@@ -113,7 +126,7 @@ pub(crate) mod blocking {
         ///
         #[cfg_attr(feature = "load-onnxruntime", doc = "```")]
         #[cfg_attr(not(feature = "load-onnxruntime"), doc = "```compile_fail")]
-        /// # #[tokio::main]
+        /// # #[pollster::main]
         /// # async fn main() -> anyhow::Result<()> {
         /// # use test_util::{ONNXRUNTIME_DYLIB_PATH, OPEN_JTALK_DIC_DIR};
         /// #
@@ -122,7 +135,7 @@ pub(crate) mod blocking {
         /// use std::sync::Arc;
         ///
         /// use voicevox_core::{
-        ///     tokio::{Onnxruntime, OpenJtalk, Synthesizer},
+        ///     nonblocking::{Onnxruntime, OpenJtalk, Synthesizer},
         ///     AccelerationMode, InitializeOptions,
         /// };
         ///
@@ -466,7 +479,7 @@ pub(crate) mod blocking {
         /// # Example
         ///
         /// ```
-        /// # #[tokio::main]
+        /// # #[pollster::main]
         /// # async fn main() -> anyhow::Result<()> {
         /// # let synthesizer =
         /// #     voicevox_core::__internal::doctest_fixtures::synthesizer_with_sample_voice_model(
@@ -685,7 +698,7 @@ pub(crate) mod blocking {
         /// # Example
         ///
         /// ```
-        /// # #[tokio::main]
+        /// # #[pollster::main]
         /// # async fn main() -> anyhow::Result<()> {
         /// # let synthesizer =
         /// #     voicevox_core::__internal::doctest_fixtures::synthesizer_with_sample_voice_model(
@@ -729,7 +742,7 @@ pub(crate) mod blocking {
         /// # Example
         ///
         /// ```
-        /// # #[tokio::main]
+        /// # #[pollster::main]
         /// # async fn main() -> anyhow::Result<()> {
         /// # let synthesizer =
         /// #     voicevox_core::__internal::doctest_fixtures::synthesizer_with_sample_voice_model(
@@ -762,7 +775,7 @@ pub(crate) mod blocking {
         /// # Examples
         ///
         /// ```
-        /// # #[tokio::main]
+        /// # #[pollster::main]
         /// # async fn main() -> anyhow::Result<()> {
         /// # let synthesizer =
         /// #     voicevox_core::__internal::doctest_fixtures::synthesizer_with_sample_voice_model(
@@ -1127,7 +1140,7 @@ pub(crate) mod blocking {
     }
 }
 
-pub(crate) mod tokio {
+pub(crate) mod nonblocking {
     use std::sync::Arc;
 
     use crate::{
@@ -1138,13 +1151,20 @@ pub(crate) mod tokio {
     use super::{InitializeOptions, TtsOptions};
 
     /// 音声シンセサイザ。
+    ///
+    /// # Performance
+    ///
+    /// [blocking]クレートにより動いている。詳しくは[`nonblocking`モジュールのドキュメント]を参照。
+    ///
+    /// [blocking]: https://docs.rs/crate/blocking
+    /// [`nonblocking`モジュールのドキュメント]: crate::nonblocking
     #[derive(Clone)]
     pub struct Synthesizer<O>(pub(super) Arc<super::blocking::Synthesizer<O>>);
 
     // FIXME: docを書く
     impl<O: Send + Sync + 'static> self::Synthesizer<O> {
         pub fn new(
-            onnxruntime: &'static crate::tokio::Onnxruntime,
+            onnxruntime: &'static crate::nonblocking::Onnxruntime,
             open_jtalk: O,
             options: &InitializeOptions,
         ) -> Result<Self> {
@@ -1153,15 +1173,15 @@ pub(crate) mod tokio {
                 .map(Self)
         }
 
-        pub fn onnxruntime(&self) -> &'static crate::tokio::Onnxruntime {
-            crate::tokio::Onnxruntime::from_blocking(self.0.onnxruntime())
+        pub fn onnxruntime(&self) -> &'static crate::nonblocking::Onnxruntime {
+            crate::nonblocking::Onnxruntime::from_blocking(self.0.onnxruntime())
         }
 
         pub fn is_gpu_mode(&self) -> bool {
             self.0.is_gpu_mode()
         }
 
-        pub async fn load_voice_model(&self, model: &crate::tokio::VoiceModel) -> Result<()> {
+        pub async fn load_voice_model(&self, model: &crate::nonblocking::VoiceModel) -> Result<()> {
             let model_bytes = &model.read_inference_models().await?;
             self.0.status.insert_model(model.header(), model_bytes)
         }
@@ -1318,8 +1338,8 @@ mod tests {
     #[case(Ok(()))]
     #[tokio::test]
     async fn load_model_works(#[case] expected_result_at_initialized: Result<()>) {
-        let syntesizer = super::tokio::Synthesizer::new(
-            crate::tokio::Onnxruntime::from_test_util_data()
+        let syntesizer = super::nonblocking::Synthesizer::new(
+            crate::nonblocking::Onnxruntime::from_test_util_data()
                 .await
                 .unwrap(),
             (),
@@ -1331,7 +1351,7 @@ mod tests {
         .unwrap();
 
         let result = syntesizer
-            .load_voice_model(&crate::tokio::VoiceModel::sample().await.unwrap())
+            .load_voice_model(&crate::nonblocking::VoiceModel::sample().await.unwrap())
             .await;
 
         assert_debug_fmt_eq!(
@@ -1344,8 +1364,8 @@ mod tests {
     #[rstest]
     #[tokio::test]
     async fn is_use_gpu_works() {
-        let syntesizer = super::tokio::Synthesizer::new(
-            crate::tokio::Onnxruntime::from_test_util_data()
+        let syntesizer = super::nonblocking::Synthesizer::new(
+            crate::nonblocking::Onnxruntime::from_test_util_data()
                 .await
                 .unwrap(),
             (),
@@ -1363,8 +1383,8 @@ mod tests {
     #[tokio::test]
     async fn is_loaded_model_by_style_id_works(#[case] style_id: u32, #[case] expected: bool) {
         let style_id = StyleId::new(style_id);
-        let syntesizer = super::tokio::Synthesizer::new(
-            crate::tokio::Onnxruntime::from_test_util_data()
+        let syntesizer = super::nonblocking::Synthesizer::new(
+            crate::nonblocking::Onnxruntime::from_test_util_data()
                 .await
                 .unwrap(),
             (),
@@ -1379,7 +1399,7 @@ mod tests {
             "expected is_model_loaded to return false, but got true",
         );
         syntesizer
-            .load_voice_model(&crate::tokio::VoiceModel::sample().await.unwrap())
+            .load_voice_model(&crate::nonblocking::VoiceModel::sample().await.unwrap())
             .await
             .unwrap();
 
@@ -1394,8 +1414,8 @@ mod tests {
     #[rstest]
     #[tokio::test]
     async fn predict_duration_works() {
-        let syntesizer = super::tokio::Synthesizer::new(
-            crate::tokio::Onnxruntime::from_test_util_data()
+        let syntesizer = super::nonblocking::Synthesizer::new(
+            crate::nonblocking::Onnxruntime::from_test_util_data()
                 .await
                 .unwrap(),
             (),
@@ -1407,7 +1427,7 @@ mod tests {
         .unwrap();
 
         syntesizer
-            .load_voice_model(&crate::tokio::VoiceModel::sample().await.unwrap())
+            .load_voice_model(&crate::nonblocking::VoiceModel::sample().await.unwrap())
             .await
             .unwrap();
 
@@ -1428,8 +1448,8 @@ mod tests {
     #[rstest]
     #[tokio::test]
     async fn predict_intonation_works() {
-        let syntesizer = super::tokio::Synthesizer::new(
-            crate::tokio::Onnxruntime::from_test_util_data()
+        let syntesizer = super::nonblocking::Synthesizer::new(
+            crate::nonblocking::Onnxruntime::from_test_util_data()
                 .await
                 .unwrap(),
             (),
@@ -1440,7 +1460,7 @@ mod tests {
         )
         .unwrap();
         syntesizer
-            .load_voice_model(&crate::tokio::VoiceModel::sample().await.unwrap())
+            .load_voice_model(&crate::nonblocking::VoiceModel::sample().await.unwrap())
             .await
             .unwrap();
 
@@ -1470,8 +1490,8 @@ mod tests {
     #[rstest]
     #[tokio::test]
     async fn decode_works() {
-        let syntesizer = super::tokio::Synthesizer::new(
-            crate::tokio::Onnxruntime::from_test_util_data()
+        let syntesizer = super::nonblocking::Synthesizer::new(
+            crate::nonblocking::Onnxruntime::from_test_util_data()
                 .await
                 .unwrap(),
             (),
@@ -1482,7 +1502,7 @@ mod tests {
         )
         .unwrap();
         syntesizer
-            .load_voice_model(&crate::tokio::VoiceModel::sample().await.unwrap())
+            .load_voice_model(&crate::nonblocking::VoiceModel::sample().await.unwrap())
             .await
             .unwrap();
 
@@ -1565,11 +1585,11 @@ mod tests {
         #[case] expected_text_consonant_vowel_data: &TextConsonantVowelData,
         #[case] expected_kana_text: &str,
     ) {
-        let syntesizer = super::tokio::Synthesizer::new(
-            crate::tokio::Onnxruntime::from_test_util_data()
+        let syntesizer = super::nonblocking::Synthesizer::new(
+            crate::nonblocking::Onnxruntime::from_test_util_data()
                 .await
                 .unwrap(),
-            crate::tokio::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
+            crate::nonblocking::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
                 .await
                 .unwrap(),
             &InitializeOptions {
@@ -1579,7 +1599,7 @@ mod tests {
         )
         .unwrap();
 
-        let model = &crate::tokio::VoiceModel::sample().await.unwrap();
+        let model = &crate::nonblocking::VoiceModel::sample().await.unwrap();
         syntesizer.load_voice_model(model).await.unwrap();
 
         let query = match input {
@@ -1636,11 +1656,11 @@ mod tests {
         #[case] input: Input,
         #[case] expected_text_consonant_vowel_data: &TextConsonantVowelData,
     ) {
-        let syntesizer = super::tokio::Synthesizer::new(
-            crate::tokio::Onnxruntime::from_test_util_data()
+        let syntesizer = super::nonblocking::Synthesizer::new(
+            crate::nonblocking::Onnxruntime::from_test_util_data()
                 .await
                 .unwrap(),
-            crate::tokio::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
+            crate::nonblocking::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
                 .await
                 .unwrap(),
             &InitializeOptions {
@@ -1650,7 +1670,7 @@ mod tests {
         )
         .unwrap();
 
-        let model = &crate::tokio::VoiceModel::sample().await.unwrap();
+        let model = &crate::nonblocking::VoiceModel::sample().await.unwrap();
         syntesizer.load_voice_model(model).await.unwrap();
 
         let accent_phrases = match input {
@@ -1704,11 +1724,11 @@ mod tests {
     #[rstest]
     #[tokio::test]
     async fn create_accent_phrases_works_for_japanese_commas_and_periods() {
-        let syntesizer = super::tokio::Synthesizer::new(
-            crate::tokio::Onnxruntime::from_test_util_data()
+        let syntesizer = super::nonblocking::Synthesizer::new(
+            crate::nonblocking::Onnxruntime::from_test_util_data()
                 .await
                 .unwrap(),
-            crate::tokio::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
+            crate::nonblocking::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
                 .await
                 .unwrap(),
             &InitializeOptions {
@@ -1718,7 +1738,7 @@ mod tests {
         )
         .unwrap();
 
-        let model = &crate::tokio::VoiceModel::sample().await.unwrap();
+        let model = &crate::nonblocking::VoiceModel::sample().await.unwrap();
         syntesizer.load_voice_model(model).await.unwrap();
 
         let accent_phrases = syntesizer
@@ -1767,11 +1787,11 @@ mod tests {
     #[rstest]
     #[tokio::test]
     async fn mora_length_works() {
-        let syntesizer = super::tokio::Synthesizer::new(
-            crate::tokio::Onnxruntime::from_test_util_data()
+        let syntesizer = super::nonblocking::Synthesizer::new(
+            crate::nonblocking::Onnxruntime::from_test_util_data()
                 .await
                 .unwrap(),
-            crate::tokio::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
+            crate::nonblocking::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
                 .await
                 .unwrap(),
             &InitializeOptions {
@@ -1781,7 +1801,7 @@ mod tests {
         )
         .unwrap();
 
-        let model = &crate::tokio::VoiceModel::sample().await.unwrap();
+        let model = &crate::nonblocking::VoiceModel::sample().await.unwrap();
         syntesizer.load_voice_model(model).await.unwrap();
 
         let accent_phrases = syntesizer
@@ -1808,11 +1828,11 @@ mod tests {
     #[rstest]
     #[tokio::test]
     async fn mora_pitch_works() {
-        let syntesizer = super::tokio::Synthesizer::new(
-            crate::tokio::Onnxruntime::from_test_util_data()
+        let syntesizer = super::nonblocking::Synthesizer::new(
+            crate::nonblocking::Onnxruntime::from_test_util_data()
                 .await
                 .unwrap(),
-            crate::tokio::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
+            crate::nonblocking::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
                 .await
                 .unwrap(),
             &InitializeOptions {
@@ -1822,7 +1842,7 @@ mod tests {
         )
         .unwrap();
 
-        let model = &crate::tokio::VoiceModel::sample().await.unwrap();
+        let model = &crate::nonblocking::VoiceModel::sample().await.unwrap();
         syntesizer.load_voice_model(model).await.unwrap();
 
         let accent_phrases = syntesizer
@@ -1849,11 +1869,11 @@ mod tests {
     #[rstest]
     #[tokio::test]
     async fn mora_data_works() {
-        let syntesizer = super::tokio::Synthesizer::new(
-            crate::tokio::Onnxruntime::from_test_util_data()
+        let syntesizer = super::nonblocking::Synthesizer::new(
+            crate::nonblocking::Onnxruntime::from_test_util_data()
                 .await
                 .unwrap(),
-            crate::tokio::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
+            crate::nonblocking::OpenJtalk::new(OPEN_JTALK_DIC_DIR)
                 .await
                 .unwrap(),
             &InitializeOptions {
@@ -1863,7 +1883,7 @@ mod tests {
         )
         .unwrap();
 
-        let model = &crate::tokio::VoiceModel::sample().await.unwrap();
+        let model = &crate::nonblocking::VoiceModel::sample().await.unwrap();
         syntesizer.load_voice_model(model).await.unwrap();
 
         let accent_phrases = syntesizer
diff --git a/crates/voicevox_core/src/task.rs b/crates/voicevox_core/src/task.rs
index 951e3c19e..233c0de85 100644
--- a/crates/voicevox_core/src/task.rs
+++ b/crates/voicevox_core/src/task.rs
@@ -1,16 +1,6 @@
-use std::panic;
+// TODO: `Async::unblock`として取り回す
 
 /// ブロッキング操作を非同期化する。
-///
-/// # Panics
-///
-/// - `f`がパニックした場合、パニックがそのままunwindされる。
-/// - tokioのランタイムの都合で`f`の実行が"cancel"された場合パニックする。
 pub(crate) async fn asyncify<F: FnOnce() -> R + Send + 'static, R: Send + 'static>(f: F) -> R {
-    tokio::task::spawn_blocking(f)
-        .await
-        .unwrap_or_else(|err| match err.try_into_panic() {
-            Ok(panic) => panic::resume_unwind(panic),
-            Err(err) => panic!("{err}"), // FIXME: エラーとして回収する
-        })
+    blocking::unblock(f).await
 }
diff --git a/crates/voicevox_core/src/test_util.rs b/crates/voicevox_core/src/test_util.rs
index 5b97f21fc..f92c4ee0c 100644
--- a/crates/voicevox_core/src/test_util.rs
+++ b/crates/voicevox_core/src/test_util.rs
@@ -2,7 +2,7 @@ use ::test_util::SAMPLE_VOICE_MODEL_FILE_PATH;
 
 use crate::Result;
 
-impl crate::tokio::VoiceModel {
+impl crate::nonblocking::VoiceModel {
     pub(crate) async fn sample() -> Result<Self> {
         Self::from_path(SAMPLE_VOICE_MODEL_FILE_PATH).await
     }
diff --git a/crates/voicevox_core/src/tokio.rs b/crates/voicevox_core/src/tokio.rs
deleted file mode 100644
index 1e2fabada..000000000
--- a/crates/voicevox_core/src/tokio.rs
+++ /dev/null
@@ -1,13 +0,0 @@
-//! Tokio版API。
-
-pub use crate::{
-    engine::open_jtalk::tokio::OpenJtalk, infer::runtimes::onnxruntime::tokio::Onnxruntime,
-    synthesizer::tokio::Synthesizer, user_dict::dict::tokio::UserDict,
-    voice_model::tokio::VoiceModel,
-};
-
-pub mod onnxruntime {
-    #[cfg(feature = "load-onnxruntime")]
-    #[cfg_attr(docsrs, doc(cfg(feature = "load-onnxruntime")))]
-    pub use crate::infer::runtimes::onnxruntime::tokio::LoadOnce;
-}
diff --git a/crates/voicevox_core/src/user_dict/dict.rs b/crates/voicevox_core/src/user_dict/dict.rs
index 6997620f0..13c30540d 100644
--- a/crates/voicevox_core/src/user_dict/dict.rs
+++ b/crates/voicevox_core/src/user_dict/dict.rs
@@ -1,3 +1,16 @@
+// TODO: `VoiceModel`のように、次のような設計にする。
+//
+// ```
+// pub(crate) mod blocking {
+//     pub struct UserDict(Inner<SingleTasked>);
+//     // …
+// }
+// pub(crate) mod nonblocking {
+//     pub struct UserDict(Inner<BlockingThreadPool>);
+//     // …
+// }
+// ```
+
 pub(crate) mod blocking {
     use indexmap::IndexMap;
     use itertools::join;
@@ -102,7 +115,7 @@ pub(crate) mod blocking {
     }
 }
 
-pub(crate) mod tokio {
+pub(crate) mod nonblocking {
     use std::sync::Arc;
 
     use indexmap::IndexMap;
@@ -115,6 +128,13 @@ pub(crate) mod tokio {
     /// ユーザー辞書。
     ///
     /// 単語はJSONとの相互変換のために挿入された順序を保つ。
+    ///
+    /// # Performance
+    ///
+    /// [blocking]クレートにより動いている。詳しくは[`nonblocking`モジュールのドキュメント]を参照。
+    ///
+    /// [blocking]: https://docs.rs/crate/blocking
+    /// [`nonblocking`モジュールのドキュメント]: crate::nonblocking
     #[derive(Debug, Default)]
     pub struct UserDict(Arc<super::blocking::UserDict>);
 
diff --git a/crates/voicevox_core/src/voice_model.rs b/crates/voicevox_core/src/voice_model.rs
index ac49d2cdb..48c541439 100644
--- a/crates/voicevox_core/src/voice_model.rs
+++ b/crates/voicevox_core/src/voice_model.rs
@@ -434,7 +434,7 @@ pub(crate) mod blocking {
     }
 }
 
-pub(crate) mod tokio {
+pub(crate) mod nonblocking {
     use std::path::Path;
 
     use crate::{
@@ -447,6 +447,13 @@ pub(crate) mod tokio {
     /// 音声モデル。
     ///
     /// VVMファイルと対応する。
+    ///
+    /// # Performance
+    ///
+    /// [blocking]クレートにより動いている。詳しくは[`nonblocking`モジュールのドキュメント]を参照。
+    ///
+    /// [blocking]: https://docs.rs/crate/blocking
+    /// [`nonblocking`モジュールのドキュメント]: crate::nonblocking
     pub struct VoiceModel(Inner<BlockingThreadPool>);
 
     impl self::VoiceModel {
diff --git a/crates/voicevox_core_python_api/src/lib.rs b/crates/voicevox_core_python_api/src/lib.rs
index b4aa65c9b..c09fafdc8 100644
--- a/crates/voicevox_core_python_api/src/lib.rs
+++ b/crates/voicevox_core_python_api/src/lib.rs
@@ -662,7 +662,7 @@ mod asyncio {
     #[pyclass]
     #[derive(Clone)]
     pub(crate) struct VoiceModel {
-        model: Arc<voicevox_core::tokio::VoiceModel>,
+        model: Arc<voicevox_core::nonblocking::VoiceModel>,
     }
 
     #[pymethods]
@@ -670,7 +670,7 @@ mod asyncio {
         #[staticmethod]
         fn from_path(py: Python<'_>, path: PathBuf) -> PyResult<&PyAny> {
             pyo3_asyncio::tokio::future_into_py(py, async move {
-                let model = voicevox_core::tokio::VoiceModel::from_path(path).await;
+                let model = voicevox_core::nonblocking::VoiceModel::from_path(path).await;
                 let model = Python::with_gil(|py| model.into_py_result(py))?.into();
                 Ok(Self { model })
             })
@@ -693,33 +693,36 @@ mod asyncio {
 
     #[pyclass]
     #[derive(Clone)]
-    pub(crate) struct Onnxruntime(&'static voicevox_core::tokio::Onnxruntime);
+    pub(crate) struct Onnxruntime(&'static voicevox_core::nonblocking::Onnxruntime);
 
     #[pymethods]
     impl Onnxruntime {
         #[classattr]
-        const LIB_NAME: &'static str = voicevox_core::tokio::Onnxruntime::LIB_NAME;
+        const LIB_NAME: &'static str = voicevox_core::nonblocking::Onnxruntime::LIB_NAME;
 
         #[classattr]
-        const LIB_VERSION: &'static str = voicevox_core::tokio::Onnxruntime::LIB_VERSION;
+        const LIB_VERSION: &'static str = voicevox_core::nonblocking::Onnxruntime::LIB_VERSION;
 
         #[classattr]
         const LIB_VERSIONED_FILENAME: &'static str =
-            voicevox_core::tokio::Onnxruntime::LIB_VERSIONED_FILENAME;
+            voicevox_core::nonblocking::Onnxruntime::LIB_VERSIONED_FILENAME;
 
         #[classattr]
         const LIB_UNVERSIONED_FILENAME: &'static str =
-            voicevox_core::tokio::Onnxruntime::LIB_UNVERSIONED_FILENAME;
+            voicevox_core::nonblocking::Onnxruntime::LIB_UNVERSIONED_FILENAME;
 
         #[staticmethod]
         fn get(py: Python<'_>) -> PyResult<Option<Py<Self>>> {
-            let result = ONNXRUNTIME.get_or_try_init(|| {
-                match voicevox_core::tokio::Onnxruntime::get().map(|o| Py::new(py, Self(o))) {
-                    Some(Ok(this)) => Ok(this),
-                    Some(Err(err)) => Err(Some(err)),
-                    None => Err(None),
-                }
-            });
+            let result =
+                ONNXRUNTIME.get_or_try_init(
+                    || match voicevox_core::nonblocking::Onnxruntime::get()
+                        .map(|o| Py::new(py, Self(o)))
+                    {
+                        Some(Ok(this)) => Ok(this),
+                        Some(Err(err)) => Err(Some(err)),
+                        None => Err(None),
+                    },
+                );
 
             match result {
                 Ok(this) => Ok(Some(this.clone())),
@@ -732,7 +735,7 @@ mod asyncio {
         #[pyo3(signature = (*, filename = Self::LIB_VERSIONED_FILENAME.into()))]
         fn load_once(filename: OsString, py: Python<'_>) -> PyResult<&PyAny> {
             pyo3_asyncio::tokio::future_into_py(py, async move {
-                let inner = voicevox_core::tokio::Onnxruntime::load_once()
+                let inner = voicevox_core::nonblocking::Onnxruntime::load_once()
                     .filename(filename)
                     .exec()
                     .await;
@@ -756,7 +759,7 @@ mod asyncio {
     #[pyclass]
     #[derive(Clone)]
     pub(crate) struct OpenJtalk {
-        open_jtalk: voicevox_core::tokio::OpenJtalk,
+        open_jtalk: voicevox_core::nonblocking::OpenJtalk,
     }
 
     #[pymethods]
@@ -769,7 +772,8 @@ mod asyncio {
             py: Python<'_>,
         ) -> PyResult<&PyAny> {
             pyo3_asyncio::tokio::future_into_py(py, async move {
-                let open_jtalk = voicevox_core::tokio::OpenJtalk::new(open_jtalk_dict_dir).await;
+                let open_jtalk =
+                    voicevox_core::nonblocking::OpenJtalk::new(open_jtalk_dict_dir).await;
                 let open_jtalk = Python::with_gil(|py| open_jtalk.into_py_result(py))?;
                 Ok(Self { open_jtalk })
             })
@@ -787,8 +791,10 @@ mod asyncio {
 
     #[pyclass]
     pub(crate) struct Synthesizer {
-        synthesizer:
-            Closable<voicevox_core::tokio::Synthesizer<voicevox_core::tokio::OpenJtalk>, Self>,
+        synthesizer: Closable<
+            voicevox_core::nonblocking::Synthesizer<voicevox_core::nonblocking::OpenJtalk>,
+            Self,
+        >,
     }
 
     #[pymethods]
@@ -807,7 +813,7 @@ mod asyncio {
             acceleration_mode: AccelerationMode,
             cpu_num_threads: u16,
         ) -> PyResult<Self> {
-            let synthesizer = voicevox_core::tokio::Synthesizer::new(
+            let synthesizer = voicevox_core::nonblocking::Synthesizer::new(
                 onnxruntime.0,
                 open_jtalk.open_jtalk.clone(),
                 &InitializeOptions {
@@ -1146,7 +1152,7 @@ mod asyncio {
     #[pyclass]
     #[derive(Default, Debug, Clone)]
     pub(crate) struct UserDict {
-        dict: Arc<voicevox_core::tokio::UserDict>,
+        dict: Arc<voicevox_core::nonblocking::UserDict>,
     }
 
     #[pymethods]

From 967570a64948c31ab36294325d9e3ae1b1d8f06c Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Thu, 19 Sep 2024 09:47:59 +0900
Subject: [PATCH 29/36] =?UTF-8?q?change:=20`VoiceModel`=20=E2=86=92=20`Voi?=
 =?UTF-8?q?ceModelFile`=20(#832)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

現在の`VoiceModel`は、コンストラクトされるときに`id`, `manifest`,
`metas`の情報だけ取得してそれらと`path`だけ保持し、モデル本体は要求され
てから`path`を開いて読むという形になっている。このような責務になっている
ことをユーザーが今のAPIのシグネチャから察するのは困難である。このことか
ら、次の変更を行う。

1. `VoiceModel` → `VoiceModelFile`にリネーム
    * C APIの`voicevox_voice_model_…`は`voicevox_voice_model_file_…`に
2. `VoiceModel::from_path` → `VoiceModelFile::open`にリネーム
    * C APIも同様
3. Python APIには`__{,a}{enter,exit}__`、Java APIには`Closable`の実装
    * `id`と`metas`はクローズ後にもgetできるようにする
    * Rust APIの`blocking`のものを除き、`.close()`で閉じられるように
    * C APIの`delete`は`close`にリネーム

Python APIとJava APIで`Synthesizer::load_voice_model`中に
`VoiceModelFile::close`を行うときの挙動としては、`load_voice_model`がす
べて終わるのを待ってからクローズ処理を行う。実装には`RwLock`を用いる。
```py
    async with await VoiceModelFile.open(vvm_path) as model:
        _ = synthesizer.load_voice_model(model) # awaitしない
```
```console
[WARNING] voicevox_core_python_api: The `VoiceModelFile` is still in use. Waiting before closing
[DEBUG] voicevox_core_python_api: Closing a VoiceModelFile
# `load_voice_model`が無事完了している
```

ただしC APIでは`load_voice_model`中の`close`は現行のままUBとする。
`RwLock`でロックすることで安全なAPIにすることはfuture workとする。

実装の都合上、Python APIの`voicevox_core.asyncio.Synthesizer`も
`__{enter,exit}__`ではなく`__a{enter,exit}__`を持つようにして、
`VoiceModelFile`同様に`RwLock`でロック管理を行うようにする。

Resolves #829.
---
 Cargo.lock                                    |   3 +
 Cargo.toml                                    |   1 +
 crates/voicevox_core/Cargo.toml               |   3 +-
 .../src/__internal/doctest_fixtures.rs        |   2 +-
 .../voicevox_core/src/__internal/interop.rs   |   2 +
 .../src/__internal/interop/raii.rs            |  43 ++
 crates/voicevox_core/src/asyncs.rs            | 152 +++++--
 crates/voicevox_core/src/blocking.rs          |   2 +-
 crates/voicevox_core/src/engine/open_jtalk.rs |   2 +-
 .../src/infer/runtimes/onnxruntime.rs         |   2 +-
 crates/voicevox_core/src/nonblocking.rs       |   2 +-
 crates/voicevox_core/src/status.rs            |   4 +-
 crates/voicevox_core/src/synthesizer.rs       |  31 +-
 crates/voicevox_core/src/test_util.rs         |   4 +-
 crates/voicevox_core/src/user_dict/dict.rs    |   2 +-
 crates/voicevox_core/src/voice_model.rs       | 108 +++--
 .../include/voicevox_core.h                   |  36 +-
 crates/voicevox_core_c_api/src/c_impls.rs     |  11 +-
 .../src/compatible_engine.rs                  |   8 +-
 crates/voicevox_core_c_api/src/lib.rs         |  44 +-
 .../tests/e2e/testcases/simple_tts.rs         |   4 +-
 .../testcases/synthesizer_new_output_json.rs  |   2 +-
 .../e2e/testcases/tts_via_audio_query.rs      |   4 +-
 .../tests/e2e/testcases/user_dict_load.rs     |   4 +-
 .../hiroshiba/voicevoxcore/Synthesizer.java   |   9 +-
 .../{VoiceModel.java => VoiceModelFile.java}  |  24 +-
 .../jp/hiroshiba/voicevoxcore/MetaTest.java   |   5 +-
 .../voicevoxcore/SynthesizerTest.java         |  45 +-
 .../jp/hiroshiba/voicevoxcore/TestUtils.java  |   4 +-
 .../hiroshiba/voicevoxcore/UserDictTest.java  |  11 +-
 .../voicevoxcore/VoiceModelTest.java          |   5 +-
 crates/voicevox_core_java_api/src/common.rs   |  72 ++-
 .../voicevox_core_java_api/src/synthesizer.rs |   3 +-
 .../voicevox_core_java_api/src/voice_model.rs |  40 +-
 crates/voicevox_core_python_api/Cargo.toml    |   2 +
 .../python/test/test_asyncio_metas.py         |  10 +-
 .../test/test_asyncio_user_dict_load.py       |   2 +-
 .../python/test/test_blocking_metas.py        |  10 +-
 .../test/test_blocking_user_dict_load.py      |   2 +-
 ...est_pseudo_raii_for_asyncio_synthesizer.py |  26 +-
 .../python/voicevox_core/_rust/asyncio.pyi    |  26 +-
 .../python/voicevox_core/_rust/blocking.pyi   |  20 +-
 .../python/voicevox_core/asyncio.py           |   4 +-
 .../python/voicevox_core/blocking.py          |  10 +-
 .../voicevox_core_python_api/src/convert.rs   |  55 ++-
 crates/voicevox_core_python_api/src/lib.rs    | 415 +++++++++++++-----
 docs/usage.md                                 |  12 +-
 example/cpp/unix/simple_tts.cpp               |   6 +-
 example/cpp/windows/simple_tts/simple_tts.cpp |   7 +-
 example/kotlin/app/src/main/kotlin/app/App.kt |   2 +-
 example/python/run-asyncio.py                 |   6 +-
 example/python/run.py                         |   6 +-
 52 files changed, 943 insertions(+), 372 deletions(-)
 create mode 100644 crates/voicevox_core/src/__internal/interop/raii.rs
 rename crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/{VoiceModel.java => VoiceModelFile.java} (84%)

diff --git a/Cargo.lock b/Cargo.lock
index defbbe093..ae91b89bb 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -4364,6 +4364,7 @@ version = "0.0.0"
 dependencies = [
  "anyhow",
  "async-fs",
+ "async-lock",
  "async_zip",
  "blocking",
  "camino",
@@ -4486,6 +4487,7 @@ version = "0.0.0"
 dependencies = [
  "camino",
  "easy-ext",
+ "futures-lite",
  "log",
  "once_cell",
  "pyo3",
@@ -4493,6 +4495,7 @@ dependencies = [
  "pyo3-log",
  "serde",
  "serde_json",
+ "tokio",
  "tracing",
  "uuid",
  "voicevox_core",
diff --git a/Cargo.toml b/Cargo.toml
index 922c7ac09..9226aca03 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -9,6 +9,7 @@ anstyle-query = "1.0.0"
 anyhow = "1.0.65"
 assert_cmd = "2.0.8"
 async-fs = "2.1.2"
+async-lock = "3.4.0"
 async_zip = "=0.0.16"
 bindgen = "0.69.4"
 binstall-tar = "0.4.39"
diff --git a/crates/voicevox_core/Cargo.toml b/crates/voicevox_core/Cargo.toml
index e05b04c79..ba508ba44 100644
--- a/crates/voicevox_core/Cargo.toml
+++ b/crates/voicevox_core/Cargo.toml
@@ -16,7 +16,8 @@ link-onnxruntime = []
 
 [dependencies]
 anyhow.workspace = true
-async-fs.workspace = true
+async-fs.workspace = true # 今これを使っている箇所はどこにも無いが、`UserDict`にはこれを使った方がよいはず
+async-lock.workspace = true
 async_zip = { workspace = true, features = ["deflate"] }
 blocking.workspace = true
 camino.workspace = true
diff --git a/crates/voicevox_core/src/__internal/doctest_fixtures.rs b/crates/voicevox_core/src/__internal/doctest_fixtures.rs
index 253bb8d6f..57c28c7a9 100644
--- a/crates/voicevox_core/src/__internal/doctest_fixtures.rs
+++ b/crates/voicevox_core/src/__internal/doctest_fixtures.rs
@@ -26,7 +26,7 @@ pub async fn synthesizer_with_sample_voice_model(
         },
     )?;
 
-    let model = &crate::nonblocking::VoiceModel::from_path(voice_model_path).await?;
+    let model = &crate::nonblocking::VoiceModelFile::open(voice_model_path).await?;
     syntesizer.load_voice_model(model).await?;
 
     Ok(syntesizer)
diff --git a/crates/voicevox_core/src/__internal/interop.rs b/crates/voicevox_core/src/__internal/interop.rs
index 677f5515a..a218730cd 100644
--- a/crates/voicevox_core/src/__internal/interop.rs
+++ b/crates/voicevox_core/src/__internal/interop.rs
@@ -1,3 +1,5 @@
+pub mod raii;
+
 pub use crate::{
     metas::merge as merge_metas, synthesizer::blocking::PerformInference,
     voice_model::blocking::IdRef,
diff --git a/crates/voicevox_core/src/__internal/interop/raii.rs b/crates/voicevox_core/src/__internal/interop/raii.rs
new file mode 100644
index 000000000..220188ad2
--- /dev/null
+++ b/crates/voicevox_core/src/__internal/interop/raii.rs
@@ -0,0 +1,43 @@
+use std::{marker::PhantomData, ops::Deref};
+
+use ouroboros::self_referencing;
+
+pub enum MaybeClosed<T> {
+    Open(T),
+    Closed,
+}
+
+// [`mapped_lock_guards`]のようなことをやるためのユーティリティ。
+//
+// [`mapped_lock_guards`]: https://github.com/rust-lang/rust/issues/117108
+pub fn try_map_guard<'lock, G, F, T, E>(guard: G, f: F) -> Result<impl Deref<Target = T> + 'lock, E>
+where
+    G: 'lock,
+    F: FnOnce(&G) -> Result<&T, E>,
+    T: 'lock,
+{
+    return MappedLockTryBuilder {
+        guard,
+        target_builder: f,
+        marker: PhantomData,
+    }
+    .try_build();
+
+    #[self_referencing]
+    struct MappedLock<'lock, G: 'lock, T> {
+        guard: G,
+
+        #[borrows(guard)]
+        target: &'this T,
+
+        marker: PhantomData<&'lock T>,
+    }
+
+    impl<'lock, G: 'lock, T: 'lock> Deref for MappedLock<'lock, G, T> {
+        type Target = T;
+
+        fn deref(&self) -> &Self::Target {
+            self.borrow_target()
+        }
+    }
+}
diff --git a/crates/voicevox_core/src/asyncs.rs b/crates/voicevox_core/src/asyncs.rs
index 5f4d7fd21..d89aa7d4b 100644
--- a/crates/voicevox_core/src/asyncs.rs
+++ b/crates/voicevox_core/src/asyncs.rs
@@ -15,15 +15,29 @@
 
 use std::{
     io::{self, Read as _, Seek as _, SeekFrom},
+    ops::DerefMut,
     path::Path,
     pin::Pin,
     task::{self, Poll},
 };
 
+use blocking::Unblock;
 use futures_io::{AsyncRead, AsyncSeek};
+use futures_util::ready;
 
 pub(crate) trait Async: 'static {
-    async fn open_file(path: impl AsRef<Path>) -> io::Result<impl AsyncRead + AsyncSeek + Unpin>;
+    type Mutex<T: Send + Sync + Unpin>: Mutex<T>;
+    type RoFile: AsyncRead + AsyncSeek + Send + Sync + Unpin;
+
+    /// ファイルを読み取り専用(RO)で開く。
+    ///
+    /// `io::Error`は素（`i32`相当）のままにしておき、この関数を呼び出す側でfs-err風のメッセージを付
+    /// ける。
+    async fn open_file_ro(path: impl AsRef<Path>) -> io::Result<Self::RoFile>;
+}
+
+pub(crate) trait Mutex<T>: From<T> + Send + Sync + Unpin {
+    async fn lock(&self) -> impl DerefMut<Target = T>;
 }
 
 /// エグゼキュータが非同期タスクの並行実行をしないことを仮定する、[`Async`]の実装。
@@ -39,30 +53,47 @@ pub(crate) trait Async: 'static {
 pub(crate) enum SingleTasked {}
 
 impl Async for SingleTasked {
-    async fn open_file(path: impl AsRef<Path>) -> io::Result<impl AsyncRead + AsyncSeek + Unpin> {
-        return std::fs::File::open(path).map(BlockingFile);
-
-        struct BlockingFile(std::fs::File);
-
-        impl AsyncRead for BlockingFile {
-            fn poll_read(
-                mut self: Pin<&mut Self>,
-                _: &mut task::Context<'_>,
-                buf: &mut [u8],
-            ) -> Poll<io::Result<usize>> {
-                Poll::Ready(self.0.read(buf))
-            }
-        }
+    type Mutex<T: Send + Sync + Unpin> = StdMutex<T>;
+    type RoFile = StdFile;
 
-        impl AsyncSeek for BlockingFile {
-            fn poll_seek(
-                mut self: Pin<&mut Self>,
-                _: &mut task::Context<'_>,
-                pos: SeekFrom,
-            ) -> Poll<io::Result<u64>> {
-                Poll::Ready(self.0.seek(pos))
-            }
-        }
+    async fn open_file_ro(path: impl AsRef<Path>) -> io::Result<Self::RoFile> {
+        std::fs::File::open(path).map(StdFile)
+    }
+}
+
+pub(crate) struct StdMutex<T>(std::sync::Mutex<T>);
+
+impl<T> From<T> for StdMutex<T> {
+    fn from(inner: T) -> Self {
+        Self(inner.into())
+    }
+}
+
+impl<T: Send + Sync + Unpin> Mutex<T> for StdMutex<T> {
+    async fn lock(&self) -> impl DerefMut<Target = T> {
+        self.0.lock().unwrap_or_else(|e| panic!("{e}"))
+    }
+}
+
+pub(crate) struct StdFile(std::fs::File);
+
+impl AsyncRead for StdFile {
+    fn poll_read(
+        mut self: Pin<&mut Self>,
+        _: &mut task::Context<'_>,
+        buf: &mut [u8],
+    ) -> Poll<io::Result<usize>> {
+        Poll::Ready(self.0.read(buf))
+    }
+}
+
+impl AsyncSeek for StdFile {
+    fn poll_seek(
+        mut self: Pin<&mut Self>,
+        _: &mut task::Context<'_>,
+        pos: SeekFrom,
+    ) -> Poll<io::Result<u64>> {
+        Poll::Ready(self.0.seek(pos))
     }
 }
 
@@ -74,7 +105,76 @@ impl Async for SingleTasked {
 pub(crate) enum BlockingThreadPool {}
 
 impl Async for BlockingThreadPool {
-    async fn open_file(path: impl AsRef<Path>) -> io::Result<impl AsyncRead + AsyncSeek + Unpin> {
-        async_fs::File::open(path).await
+    type Mutex<T: Send + Sync + Unpin> = async_lock::Mutex<T>;
+    type RoFile = AsyncRoFile;
+
+    async fn open_file_ro(path: impl AsRef<Path>) -> io::Result<Self::RoFile> {
+        AsyncRoFile::open(path).await
+    }
+}
+
+impl<T: Send + Sync + Unpin> Mutex<T> for async_lock::Mutex<T> {
+    async fn lock(&self) -> impl DerefMut<Target = T> {
+        self.lock().await
+    }
+}
+
+// TODO: if something like `async_fs::File::into_std_file` existed, this type would not be needed. Open a PR?
+pub(crate) struct AsyncRoFile {
+    // Only `poll_read` and `poll_seek` are ever performed on this
+    unblock: Unblock<std::fs::File>,
+
+    // Keeps the "correct" seek position, as async-fs's implementation does. The file is known not to
+    // be a pipe, so smol-rs/async-fs#4 is not considered
+    real_seek_pos: Option<u64>,
+}
+
+impl AsyncRoFile {
+    async fn open(path: impl AsRef<Path>) -> io::Result<Self> {
+        let path = path.as_ref().to_owned();
+        let unblock = Unblock::new(blocking::unblock(|| std::fs::File::open(path)).await?);
+        Ok(Self {
+            unblock,
+            real_seek_pos: None,
+        })
+    }
+
+    pub(crate) async fn close(self) {
+        let file = self.unblock.into_inner().await;
+        blocking::unblock(|| drop(file)).await;
+    }
+}
+
+impl AsyncRead for AsyncRoFile {
+    fn poll_read(
+        mut self: Pin<&mut Self>,
+        cx: &mut task::Context<'_>,
+        buf: &mut [u8],
+    ) -> Poll<io::Result<usize>> {
+        if self.real_seek_pos.is_none() {
+            self.real_seek_pos = Some(ready!(
+                Pin::new(&mut self.unblock).poll_seek(cx, SeekFrom::Current(0))
+            )?);
+        }
+        let n = ready!(Pin::new(&mut self.unblock).poll_read(cx, buf))?;
+        *self.real_seek_pos.as_mut().expect("should be present") += n as u64;
+        Poll::Ready(Ok(n))
+    }
+}
+
+impl AsyncSeek for AsyncRoFile {
+    fn poll_seek(
+        mut self: Pin<&mut Self>,
+        cx: &mut task::Context<'_>,
+        pos: SeekFrom,
+    ) -> Poll<io::Result<u64>> {
+        // Perform a "reposition" like the one async-fs's implementation does.
+        // https://github.com/smol-rs/async-fs/issues/2#issuecomment-675595170
+        if let Some(real_seek_pos) = self.real_seek_pos {
+            ready!(Pin::new(&mut self.unblock).poll_seek(cx, SeekFrom::Start(real_seek_pos)))?;
+        }
+        self.real_seek_pos = None;
+
+        Pin::new(&mut self.unblock).poll_seek(cx, pos)
     }
 }
diff --git a/crates/voicevox_core/src/blocking.rs b/crates/voicevox_core/src/blocking.rs
index 8d0bc2129..3443e3085 100644
--- a/crates/voicevox_core/src/blocking.rs
+++ b/crates/voicevox_core/src/blocking.rs
@@ -3,7 +3,7 @@
 pub use crate::{
     engine::open_jtalk::blocking::OpenJtalk, infer::runtimes::onnxruntime::blocking::Onnxruntime,
     synthesizer::blocking::Synthesizer, user_dict::dict::blocking::UserDict,
-    voice_model::blocking::VoiceModel,
+    voice_model::blocking::VoiceModelFile,
 };
 
 pub mod onnxruntime {
diff --git a/crates/voicevox_core/src/engine/open_jtalk.rs b/crates/voicevox_core/src/engine/open_jtalk.rs
index fb7f3ea59..f27e9b0a6 100644
--- a/crates/voicevox_core/src/engine/open_jtalk.rs
+++ b/crates/voicevox_core/src/engine/open_jtalk.rs
@@ -1,4 +1,4 @@
-// TODO: `VoiceModel`のように、次のような設計にする。
+// TODO: `VoiceModelFile`のように、次のような設計にする。
 //
 // ```
 // pub(crate) mod blocking {
diff --git a/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs b/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs
index 91e435701..f7f92355e 100644
--- a/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs
+++ b/crates/voicevox_core/src/infer/runtimes/onnxruntime.rs
@@ -1,4 +1,4 @@
-// TODO: `VoiceModel`のように、次のような設計にする。
+// TODO: `VoiceModelFile`のように、次のような設計にする。
 //
 // ```
 // pub(crate) mod blocking {
diff --git a/crates/voicevox_core/src/nonblocking.rs b/crates/voicevox_core/src/nonblocking.rs
index 501a44d04..7187c57fa 100644
--- a/crates/voicevox_core/src/nonblocking.rs
+++ b/crates/voicevox_core/src/nonblocking.rs
@@ -15,7 +15,7 @@
 pub use crate::{
     engine::open_jtalk::nonblocking::OpenJtalk,
     infer::runtimes::onnxruntime::nonblocking::Onnxruntime, synthesizer::nonblocking::Synthesizer,
-    user_dict::dict::nonblocking::UserDict, voice_model::nonblocking::VoiceModel,
+    user_dict::dict::nonblocking::UserDict, voice_model::nonblocking::VoiceModelFile,
 };
 
 pub mod onnxruntime {
diff --git a/crates/voicevox_core/src/status.rs b/crates/voicevox_core/src/status.rs
index 5103e060e..40e1ae6d2 100644
--- a/crates/voicevox_core/src/status.rs
+++ b/crates/voicevox_core/src/status.rs
@@ -408,7 +408,7 @@ mod tests {
                 talk: enum_map!(_ => InferenceSessionOptions::new(0, DeviceSpec::Cpu)),
             },
         );
-        let model = &crate::nonblocking::VoiceModel::sample().await.unwrap();
+        let model = &crate::nonblocking::VoiceModelFile::sample().await.unwrap();
         let model_contents = &model.read_inference_models().await.unwrap();
         let result = status.insert_model(model.header(), model_contents);
         assert_debug_fmt_eq!(Ok(()), result);
@@ -424,7 +424,7 @@ mod tests {
                 talk: enum_map!(_ => InferenceSessionOptions::new(0, DeviceSpec::Cpu)),
             },
         );
-        let vvm = &crate::nonblocking::VoiceModel::sample().await.unwrap();
+        let vvm = &crate::nonblocking::VoiceModelFile::sample().await.unwrap();
         let model_header = vvm.header();
         let model_contents = &vvm.read_inference_models().await.unwrap();
         assert!(
diff --git a/crates/voicevox_core/src/synthesizer.rs b/crates/voicevox_core/src/synthesizer.rs
index 7a1bb2ab8..045a2d9ea 100644
--- a/crates/voicevox_core/src/synthesizer.rs
+++ b/crates/voicevox_core/src/synthesizer.rs
@@ -1,4 +1,4 @@
-// TODO: `VoiceModel`のように、次のような設計にする。
+// TODO: `VoiceModelFile`のように、次のような設計にする。
 //
 // ```
 // pub(crate) mod blocking {
@@ -235,7 +235,7 @@ pub(crate) mod blocking {
         }
 
         /// 音声モデルを読み込む。
-        pub fn load_voice_model(&self, model: &crate::blocking::VoiceModel) -> Result<()> {
+        pub fn load_voice_model(&self, model: &crate::blocking::VoiceModelFile) -> Result<()> {
             let model_bytes = &model.read_inference_models()?;
             self.status.insert_model(model.header(), model_bytes)
         }
@@ -1181,7 +1181,10 @@ pub(crate) mod nonblocking {
             self.0.is_gpu_mode()
         }
 
-        pub async fn load_voice_model(&self, model: &crate::nonblocking::VoiceModel) -> Result<()> {
+        pub async fn load_voice_model(
+            &self,
+            model: &crate::nonblocking::VoiceModelFile,
+        ) -> Result<()> {
             let model_bytes = &model.read_inference_models().await?;
             self.0.status.insert_model(model.header(), model_bytes)
         }
@@ -1351,7 +1354,7 @@ mod tests {
         .unwrap();
 
         let result = syntesizer
-            .load_voice_model(&crate::nonblocking::VoiceModel::sample().await.unwrap())
+            .load_voice_model(&crate::nonblocking::VoiceModelFile::sample().await.unwrap())
             .await;
 
         assert_debug_fmt_eq!(
@@ -1399,7 +1402,7 @@ mod tests {
             "expected is_model_loaded to return false, but got true",
         );
         syntesizer
-            .load_voice_model(&crate::nonblocking::VoiceModel::sample().await.unwrap())
+            .load_voice_model(&crate::nonblocking::VoiceModelFile::sample().await.unwrap())
             .await
             .unwrap();
 
@@ -1427,7 +1430,7 @@ mod tests {
         .unwrap();
 
         syntesizer
-            .load_voice_model(&crate::nonblocking::VoiceModel::sample().await.unwrap())
+            .load_voice_model(&crate::nonblocking::VoiceModelFile::sample().await.unwrap())
             .await
             .unwrap();
 
@@ -1460,7 +1463,7 @@ mod tests {
         )
         .unwrap();
         syntesizer
-            .load_voice_model(&crate::nonblocking::VoiceModel::sample().await.unwrap())
+            .load_voice_model(&crate::nonblocking::VoiceModelFile::sample().await.unwrap())
             .await
             .unwrap();
 
@@ -1502,7 +1505,7 @@ mod tests {
         )
         .unwrap();
         syntesizer
-            .load_voice_model(&crate::nonblocking::VoiceModel::sample().await.unwrap())
+            .load_voice_model(&crate::nonblocking::VoiceModelFile::sample().await.unwrap())
             .await
             .unwrap();
 
@@ -1599,7 +1602,7 @@ mod tests {
         )
         .unwrap();
 
-        let model = &crate::nonblocking::VoiceModel::sample().await.unwrap();
+        let model = &crate::nonblocking::VoiceModelFile::sample().await.unwrap();
         syntesizer.load_voice_model(model).await.unwrap();
 
         let query = match input {
@@ -1670,7 +1673,7 @@ mod tests {
         )
         .unwrap();
 
-        let model = &crate::nonblocking::VoiceModel::sample().await.unwrap();
+        let model = &crate::nonblocking::VoiceModelFile::sample().await.unwrap();
         syntesizer.load_voice_model(model).await.unwrap();
 
         let accent_phrases = match input {
@@ -1738,7 +1741,7 @@ mod tests {
         )
         .unwrap();
 
-        let model = &crate::nonblocking::VoiceModel::sample().await.unwrap();
+        let model = &crate::nonblocking::VoiceModelFile::sample().await.unwrap();
         syntesizer.load_voice_model(model).await.unwrap();
 
         let accent_phrases = syntesizer
@@ -1801,7 +1804,7 @@ mod tests {
         )
         .unwrap();
 
-        let model = &crate::nonblocking::VoiceModel::sample().await.unwrap();
+        let model = &crate::nonblocking::VoiceModelFile::sample().await.unwrap();
         syntesizer.load_voice_model(model).await.unwrap();
 
         let accent_phrases = syntesizer
@@ -1842,7 +1845,7 @@ mod tests {
         )
         .unwrap();
 
-        let model = &crate::nonblocking::VoiceModel::sample().await.unwrap();
+        let model = &crate::nonblocking::VoiceModelFile::sample().await.unwrap();
         syntesizer.load_voice_model(model).await.unwrap();
 
         let accent_phrases = syntesizer
@@ -1883,7 +1886,7 @@ mod tests {
         )
         .unwrap();
 
-        let model = &crate::nonblocking::VoiceModel::sample().await.unwrap();
+        let model = &crate::nonblocking::VoiceModelFile::sample().await.unwrap();
         syntesizer.load_voice_model(model).await.unwrap();
 
         let accent_phrases = syntesizer
diff --git a/crates/voicevox_core/src/test_util.rs b/crates/voicevox_core/src/test_util.rs
index f92c4ee0c..e38f14c5c 100644
--- a/crates/voicevox_core/src/test_util.rs
+++ b/crates/voicevox_core/src/test_util.rs
@@ -2,8 +2,8 @@ use ::test_util::SAMPLE_VOICE_MODEL_FILE_PATH;
 
 use crate::Result;
 
-impl crate::nonblocking::VoiceModel {
+impl crate::nonblocking::VoiceModelFile {
     pub(crate) async fn sample() -> Result<Self> {
-        Self::from_path(SAMPLE_VOICE_MODEL_FILE_PATH).await
+        Self::open(SAMPLE_VOICE_MODEL_FILE_PATH).await
     }
 }
diff --git a/crates/voicevox_core/src/user_dict/dict.rs b/crates/voicevox_core/src/user_dict/dict.rs
index 13c30540d..0e1c89ca2 100644
--- a/crates/voicevox_core/src/user_dict/dict.rs
+++ b/crates/voicevox_core/src/user_dict/dict.rs
@@ -1,4 +1,4 @@
-// TODO: `VoiceModel`のように、次のような設計にする。
+// TODO: `VoiceModelFile`のように、次のような設計にする。
 //
 // ```
 // pub(crate) mod blocking {
diff --git a/crates/voicevox_core/src/voice_model.rs b/crates/voicevox_core/src/voice_model.rs
index 48c541439..cf2c0f078 100644
--- a/crates/voicevox_core/src/voice_model.rs
+++ b/crates/voicevox_core/src/voice_model.rs
@@ -3,7 +3,7 @@
 //! VVM ファイルの定義と形式は[ドキュメント](../../../docs/vvm.md)を参照。
 
 use std::{
-    marker::PhantomData,
+    collections::HashMap,
     path::{Path, PathBuf},
     sync::Arc,
 };
@@ -12,7 +12,7 @@ use anyhow::{anyhow, Context as _};
 use derive_more::From;
 use easy_ext::ext;
 use enum_map::{enum_map, EnumMap};
-use futures_io::{AsyncBufRead, AsyncSeek};
+use futures_io::{AsyncBufRead, AsyncRead, AsyncSeek};
 use futures_util::future::{OptionFuture, TryFutureExt as _};
 use itertools::Itertools as _;
 use ouroboros::self_referencing;
@@ -20,7 +20,7 @@ use serde::Deserialize;
 use uuid::Uuid;
 
 use crate::{
-    asyncs::Async,
+    asyncs::{Async, Mutex as _},
     error::{LoadModelError, LoadModelErrorKind, LoadModelResult},
     infer::{
         domains::{InferenceDomainMap, TalkDomain, TalkOperation},
@@ -61,20 +61,18 @@ impl VoiceModelId {
 }
 
 #[self_referencing]
-struct Inner<A> {
+struct Inner<A: Async> {
     header: VoiceModelHeader,
 
     #[borrows(header)]
     #[not_covariant]
     inference_model_entries: InferenceDomainMap<InferenceModelEntries<'this>>,
 
-    // `_marker`とすると、`borrow__marker`のような名前のメソッドが生成されて`non_snake_case`が
-    // 起動してしまう
-    marker: PhantomData<fn(A) -> A>,
+    zip: A::Mutex<A::RoFile>,
 }
 
 impl<A: Async> Inner<A> {
-    async fn from_path(path: impl AsRef<Path>) -> crate::Result<Self> {
+    async fn open(path: impl AsRef<Path>) -> crate::Result<Self> {
         const MANIFEST_FILENAME: &str = "manifest.json";
 
         let path = path.as_ref();
@@ -89,8 +87,16 @@ impl<A: Async> Inner<A> {
             .await
             .map_err(|source| error(LoadModelErrorKind::OpenZipFile, source))?;
 
+        let indices = zip.entry_indices_by_utf8_filenames();
+        let find_entry_index = |filename: &str| {
+            indices
+                .get(filename)
+                .with_context(|| format!("could not find `{filename}`"))
+                .copied()
+        };
+
         let manifest = &async {
-            let idx = zip.find_entry_index(MANIFEST_FILENAME)?;
+            let idx = find_entry_index(MANIFEST_FILENAME)?;
             zip.read_file(idx).await
         }
         .await
@@ -106,7 +112,7 @@ impl<A: Async> Inner<A> {
             .map_err(|source| error(LoadModelErrorKind::InvalidModelFormat, source.into()))?;
 
         let metas = &async {
-            let idx = zip.find_entry_index(manifest.metas_filename())?;
+            let idx = find_entry_index(manifest.metas_filename())?;
             zip.read_file(idx).await
         }
         .await
@@ -133,13 +139,13 @@ impl<A: Async> Inner<A> {
                                 .map(|manifest| {
                                     let indices = enum_map! {
                                         TalkOperation::PredictDuration => {
-                                            zip.find_entry_index(&manifest.predict_duration_filename)?
+                                            find_entry_index(&manifest.predict_duration_filename)?
+                                        }
+                                        TalkOperation::PredictIntonation => {
+                                            find_entry_index(&manifest.predict_intonation_filename)?
                                         }
-                                        TalkOperation::PredictIntonation => zip.find_entry_index(
-                                            &manifest.predict_intonation_filename,
-                                        )?,
                                         TalkOperation::Decode => {
-                                            zip.find_entry_index(&manifest.decode_filename)?
+                                            find_entry_index(&manifest.decode_filename)?
                                         }
                                     };
 
@@ -159,7 +165,7 @@ impl<A: Async> Inner<A> {
                     .collect()
                     .map_err(crate::Error::from)
             },
-            marker: PhantomData,
+            zip: zip.into_inner().into_inner().into(),
         }
         .try_build()
     }
@@ -187,9 +193,10 @@ impl<A: Async> Inner<A> {
             source: Some(source),
         };
 
-        let mut zip = A::open_zip(path)
+        let zip = &mut *self.borrow_zip().lock().await;
+        let mut zip = async_zip::base::read::seek::ZipFileReader::with_bufreader(zip)
             .await
-            .map_err(|source| error(LoadModelErrorKind::OpenZipFile, source))?;
+            .map_err(|source| error(LoadModelErrorKind::OpenZipFile, source.into()))?;
 
         macro_rules! read_file {
             ($entry:expr $(,)?) => {{
@@ -255,29 +262,40 @@ struct InferenceModelEntry<D: InferenceDomain, M> {
 impl<A: Async> A {
     async fn open_zip(
         path: &Path,
-    ) -> anyhow::Result<async_zip::base::read::seek::ZipFileReader<impl AsyncBufRead + AsyncSeek>>
-    {
-        let zip = Self::open_file(path).await.with_context(|| {
+    ) -> anyhow::Result<
+        async_zip::base::read::seek::ZipFileReader<futures_util::io::BufReader<A::RoFile>>,
+    > {
+        let zip = Self::open_file_ro(path).await.with_context(|| {
             // fs-errのと同じにする
             format!("failed to open file `{}`", path.display())
         })?;
-        let zip = futures_util::io::BufReader::new(zip); // async_zip v0.0.16では不要、v0.0.17では必要
-        let zip = async_zip::base::read::seek::ZipFileReader::new(zip).await?;
+        let zip = async_zip::base::read::seek::ZipFileReader::with_bufreader(zip).await?;
         Ok(zip)
     }
 }
 
+// The `BufReader` is unnecessary with async_zip v0.0.16 but required with v0.0.17
+#[ext]
+impl<R: AsyncRead + AsyncSeek + Unpin>
+    async_zip::base::read::seek::ZipFileReader<futures_util::io::BufReader<R>>
+{
+    async fn with_bufreader(rdr: R) -> async_zip::error::Result<Self>
+    where
+        Self: Sized, // trivial
+    {
+        Self::new(futures_util::io::BufReader::new(rdr)).await
+    }
+}
+
 #[ext]
 impl<R: AsyncBufRead + AsyncSeek + Unpin> async_zip::base::read::seek::ZipFileReader<R> {
-    fn find_entry_index(&self, filename: &str) -> anyhow::Result<usize> {
-        let (idx, _) = self
-            .file()
+    fn entry_indices_by_utf8_filenames(&self) -> HashMap<String, usize> {
+        self.file()
             .entries()
             .iter()
             .enumerate()
-            .find(|(_, e)| e.filename().as_str().ok() == Some(filename))
-            .with_context(|| "could not find `{filename}`")?;
-        Ok(idx)
+            .flat_map(|(i, e)| e.filename().as_str().map(|s| (s.to_owned(), i)))
+            .collect()
     }
 
     async fn read_file(&mut self, index: usize) -> anyhow::Result<Vec<u8>> {
@@ -394,21 +412,21 @@ pub(crate) mod blocking {
 
     use super::{Inner, ModelBytesWithInnerVoiceIdsByDomain, VoiceModelHeader, VoiceModelId};
 
-    /// 音声モデル。
+    /// 音声モデルファイル。
     ///
     /// VVMファイルと対応する。
-    pub struct VoiceModel(Inner<SingleTasked>);
+    pub struct VoiceModelFile(Inner<SingleTasked>);
 
-    impl self::VoiceModel {
+    impl self::VoiceModelFile {
         pub(crate) fn read_inference_models(
             &self,
         ) -> LoadModelResult<InferenceDomainMap<ModelBytesWithInnerVoiceIdsByDomain>> {
             self.0.read_inference_models().block_on()
         }
 
-        /// VVMファイルから`VoiceModel`をコンストラクトする。
-        pub fn from_path(path: impl AsRef<Path>) -> crate::Result<Self> {
-            Inner::from_path(path).block_on().map(Self)
+        /// VVMファイルを開く。
+        pub fn open(path: impl AsRef<Path>) -> crate::Result<Self> {
+            Inner::open(path).block_on().map(Self)
         }
 
         /// ID。
@@ -427,7 +445,7 @@ pub(crate) mod blocking {
     }
 
     #[ext(IdRef)]
-    pub impl VoiceModel {
+    pub impl VoiceModelFile {
         fn id_ref(&self) -> &Uuid {
             &self.header().manifest.id.0
         }
@@ -444,7 +462,7 @@ pub(crate) mod nonblocking {
 
     use super::{Inner, ModelBytesWithInnerVoiceIdsByDomain, VoiceModelHeader, VoiceModelId};
 
-    /// 音声モデル。
+    /// 音声モデルファイル。
     ///
     /// VVMファイルと対応する。
     ///
@@ -454,17 +472,23 @@ pub(crate) mod nonblocking {
     ///
     /// [blocking]: https://docs.rs/crate/blocking
     /// [`nonblocking`モジュールのドキュメント]: crate::nonblocking
-    pub struct VoiceModel(Inner<BlockingThreadPool>);
+    pub struct VoiceModelFile(Inner<BlockingThreadPool>);
 
-    impl self::VoiceModel {
+    impl self::VoiceModelFile {
         pub(crate) async fn read_inference_models(
             &self,
         ) -> LoadModelResult<InferenceDomainMap<ModelBytesWithInnerVoiceIdsByDomain>> {
             self.0.read_inference_models().await
         }
-        /// VVMファイルから`VoiceModel`をコンストラクトする。
-        pub async fn from_path(path: impl AsRef<Path>) -> Result<Self> {
-            Inner::from_path(path).await.map(Self)
+
+        /// VVMファイルを開く。
+        pub async fn open(path: impl AsRef<Path>) -> Result<Self> {
+            Inner::open(path).await.map(Self)
+        }
+
+        /// VVMファイルを閉じる。
+        pub async fn close(self) {
+            self.0.into_heads().zip.into_inner().close().await;
         }
 
         /// ID。
diff --git a/crates/voicevox_core_c_api/include/voicevox_core.h b/crates/voicevox_core_c_api/include/voicevox_core.h
index 422f32978..e158ebb6a 100644
--- a/crates/voicevox_core_c_api/include/voicevox_core.h
+++ b/crates/voicevox_core_c_api/include/voicevox_core.h
@@ -295,12 +295,12 @@ typedef struct VoicevoxSynthesizer VoicevoxSynthesizer;
 typedef struct VoicevoxUserDict VoicevoxUserDict;
 
 /**
- * 音声モデル。
+ * 音声モデルファイル。
  *
  * VVMファイルと対応する。
- * <b>構築</b>(_construction_)は ::voicevox_voice_model_new_from_path で行い、<b>破棄</b>(_destruction_)は ::voicevox_voice_model_delete で行う。
+ * <b>構築</b>(_construction_)は ::voicevox_voice_model_file_open で行い、<b>破棄</b>(_destruction_)は ::voicevox_voice_model_file_close で行う。
  */
-typedef struct VoicevoxVoiceModel VoicevoxVoiceModel;
+typedef struct VoicevoxVoiceModelFile VoicevoxVoiceModelFile;
 
 #if defined(VOICEVOX_LOAD_ONNXRUNTIME)
 /**
@@ -593,7 +593,7 @@ __declspec(dllimport)
 const char *voicevox_get_version(void);
 
 /**
- * VVMファイルから ::VoicevoxVoiceModel を<b>構築</b>(_construct_)する。
+ * VVMファイルを開く。
  *
  * @param [in] path vvmファイルへのUTF-8のファイルパス
  * @param [out] out_model 構築先
@@ -608,56 +608,56 @@ const char *voicevox_get_version(void);
 #ifdef _WIN32
 __declspec(dllimport)
 #endif
-VoicevoxResultCode voicevox_voice_model_new_from_path(const char *path,
-                                                      struct VoicevoxVoiceModel **out_model);
+VoicevoxResultCode voicevox_voice_model_file_open(const char *path,
+                                                  struct VoicevoxVoiceModelFile **out_model);
 
 /**
- * ::VoicevoxVoiceModel からIDを取得する。
+ * ::VoicevoxVoiceModelFile からIDを取得する。
  *
  * @param [in] model 音声モデル
  *
  * @returns 音声モデルID
  *
  * \safety{
- * - `model`は ::voicevox_voice_model_new_from_path で得たものでなければならず、また ::voicevox_voice_model_delete で解放されていてはいけない。
+ * - `model`は ::voicevox_voice_model_file_open で得たものでなければならず、また ::voicevox_voice_model_file_close で解放されていてはいけない。
  * }
  */
 #ifdef _WIN32
 __declspec(dllimport)
 #endif
-VoicevoxVoiceModelId voicevox_voice_model_id(const struct VoicevoxVoiceModel *model);
+VoicevoxVoiceModelId voicevox_voice_model_file_id(const struct VoicevoxVoiceModelFile *model);
 
 /**
- * ::VoicevoxVoiceModel からメタ情報を取得する。
+ * ::VoicevoxVoiceModelFile からメタ情報を取得する。
  *
  * @param [in] model 音声モデル
  *
  * @returns メタ情報のJSON文字列
  *
  * \safety{
- * - `model`は ::voicevox_voice_model_new_from_path で得たものでなければならず、また ::voicevox_voice_model_delete で解放されていてはいけない。
+ * - `model`は ::voicevox_voice_model_file_open で得たものでなければならず、また ::voicevox_voice_model_file_close で解放されていてはいけない。
  * - 戻り値の文字列の<b>生存期間</b>(_lifetime_)は次にこの関数が呼ばれるか、`model`が破棄されるまでである。この生存期間を越えて文字列にアクセスしてはならない。
  * }
  */
 #ifdef _WIN32
 __declspec(dllimport)
 #endif
-const char *voicevox_voice_model_get_metas_json(const struct VoicevoxVoiceModel *model);
+const char *voicevox_voice_model_file_get_metas_json(const struct VoicevoxVoiceModelFile *model);
 
 /**
- * ::VoicevoxVoiceModel を<b>破棄</b>(_destruct_)する。
+ * ::VoicevoxVoiceModelFile を、所有しているファイルディスクリプタを閉じた上で<b>破棄</b>(_destruct_)する。
  *
  * @param [in] model 破棄対象
  *
  * \safety{
- * - `model`は ::voicevox_voice_model_new_from_path で得たものでなければならず、また既にこの関数で解放されていてはいけない。
+ * - `model`は ::voicevox_voice_model_file_open で得たものでなければならず、また既にこの関数で解放されていてはいけない。
  * - `model`は以後<b>ダングリングポインタ</b>(_dangling pointer_)として扱われなくてはならない。
  * }
  */
 #ifdef _WIN32
 __declspec(dllimport)
 #endif
-void voicevox_voice_model_delete(struct VoicevoxVoiceModel *model);
+void voicevox_voice_model_file_close(struct VoicevoxVoiceModelFile *model);
 
 /**
  * ::VoicevoxSynthesizer を<b>構築</b>(_construct_)する。
@@ -671,7 +671,7 @@ void voicevox_voice_model_delete(struct VoicevoxVoiceModel *model);
  *
  * \safety{
  * - `onnxruntime`は ::voicevox_onnxruntime_load_once または ::voicevox_onnxruntime_init_once で得たものでなければならない。
- * - `open_jtalk`は ::voicevox_voice_model_new_from_path で得たものでなければならず、また ::voicevox_open_jtalk_rc_new で解放されていてはいけない。
+ * - `open_jtalk`は ::voicevox_open_jtalk_rc_new で得たものでなければならず、また ::voicevox_open_jtalk_rc_delete で解放されていてはいけない。
  * - `out_synthesizer`は<a href="#voicevox-core-safety">書き込みについて有効</a>でなければならない。
  * }
  */
@@ -708,14 +708,14 @@ void voicevox_synthesizer_delete(struct VoicevoxSynthesizer *synthesizer);
  *
  * \safety{
  * - `synthesizer`は ::voicevox_synthesizer_new で得たものでなければならず、また ::voicevox_synthesizer_delete で解放されていてはいけない。
- * - `model`は ::voicevox_voice_model_new_from_path で得たものでなければならず、また ::voicevox_voice_model_delete で解放されていてはいけない。
+ * - `model`は ::voicevox_voice_model_file_open で得たものでなければならず、また ::voicevox_voice_model_file_close で解放されていてはいけない。
  * }
  */
 #ifdef _WIN32
 __declspec(dllimport)
 #endif
 VoicevoxResultCode voicevox_synthesizer_load_voice_model(const struct VoicevoxSynthesizer *synthesizer,
-                                                         const struct VoicevoxVoiceModel *model);
+                                                         const struct VoicevoxVoiceModelFile *model);
 
 /**
  * 音声モデルの読み込みを解除する。
diff --git a/crates/voicevox_core_c_api/src/c_impls.rs b/crates/voicevox_core_c_api/src/c_impls.rs
index 1adc402cd..0e9ff9a78 100644
--- a/crates/voicevox_core_c_api/src/c_impls.rs
+++ b/crates/voicevox_core_c_api/src/c_impls.rs
@@ -5,7 +5,8 @@ use ref_cast::ref_cast_custom;
 use voicevox_core::{InitializeOptions, Result, VoiceModelId};
 
 use crate::{
-    helpers::CApiResult, OpenJtalkRc, VoicevoxOnnxruntime, VoicevoxSynthesizer, VoicevoxVoiceModel,
+    helpers::CApiResult, OpenJtalkRc, VoicevoxOnnxruntime, VoicevoxSynthesizer,
+    VoicevoxVoiceModelFile,
 };
 
 // FIXME: 中身(Rust API)を直接操作するかラッパーメソッド越しにするのかが混在していて、一貫性を
@@ -87,7 +88,7 @@ impl VoicevoxSynthesizer {
 
     pub(crate) fn load_voice_model(
         &self,
-        model: &voicevox_core::blocking::VoiceModel,
+        model: &voicevox_core::blocking::VoiceModelFile,
     ) -> CApiResult<()> {
         self.synthesizer.load_voice_model(model)?;
         Ok(())
@@ -104,9 +105,9 @@ impl VoicevoxSynthesizer {
     }
 }
 
-impl VoicevoxVoiceModel {
-    pub(crate) fn from_path(path: impl AsRef<Path>) -> Result<Self> {
-        let model = voicevox_core::blocking::VoiceModel::from_path(path)?;
+impl VoicevoxVoiceModelFile {
+    pub(crate) fn open(path: impl AsRef<Path>) -> Result<Self> {
+        let model = voicevox_core::blocking::VoiceModelFile::open(path)?;
         let metas = CString::new(serde_json::to_string(model.metas()).unwrap()).unwrap();
         Ok(Self { model, metas })
     }
diff --git a/crates/voicevox_core_c_api/src/compatible_engine.rs b/crates/voicevox_core_c_api/src/compatible_engine.rs
index 9fdff0c92..7b1a03e7e 100644
--- a/crates/voicevox_core_c_api/src/compatible_engine.rs
+++ b/crates/voicevox_core_c_api/src/compatible_engine.rs
@@ -35,10 +35,10 @@ static ONNXRUNTIME: LazyLock<&'static voicevox_core::blocking::Onnxruntime> = La
 });
 
 struct VoiceModelSet {
-    all_vvms: Vec<Arc<voicevox_core::blocking::VoiceModel>>,
+    all_vvms: Vec<Arc<voicevox_core::blocking::VoiceModelFile>>,
     all_metas_json: CString,
     style_model_map: BTreeMap<StyleId, VoiceModelId>,
-    model_map: BTreeMap<VoiceModelId, Arc<voicevox_core::blocking::VoiceModel>>,
+    model_map: BTreeMap<VoiceModelId, Arc<voicevox_core::blocking::VoiceModelFile>>,
 }
 
 static VOICE_MODEL_SET: LazyLock<VoiceModelSet> = LazyLock::new(|| {
@@ -66,7 +66,7 @@ static VOICE_MODEL_SET: LazyLock<VoiceModelSet> = LazyLock::new(|| {
     /// # Panics
     ///
     /// 失敗したらパニックする
-    fn get_all_models() -> Vec<Arc<voicevox_core::blocking::VoiceModel>> {
+    fn get_all_models() -> Vec<Arc<voicevox_core::blocking::VoiceModelFile>> {
         let root_dir = if let Some(root_dir) = env::var_os(ROOT_DIR_ENV_NAME) {
             root_dir.into()
         } else {
@@ -84,7 +84,7 @@ static VOICE_MODEL_SET: LazyLock<VoiceModelSet> = LazyLock::new(|| {
             .unwrap_or_else(|e| panic!("{}が読めませんでした: {e}", root_dir.display()))
             .into_iter()
             .filter(|entry| entry.path().extension().map_or(false, |ext| ext == "vvm"))
-            .map(|entry| voicevox_core::blocking::VoiceModel::from_path(entry.path()).map(Arc::new))
+            .map(|entry| voicevox_core::blocking::VoiceModelFile::open(entry.path()).map(Arc::new))
             .collect::<std::result::Result<_, _>>()
             .unwrap()
     }
diff --git a/crates/voicevox_core_c_api/src/lib.rs b/crates/voicevox_core_c_api/src/lib.rs
index 161af38e9..63f344553 100644
--- a/crates/voicevox_core_c_api/src/lib.rs
+++ b/crates/voicevox_core_c_api/src/lib.rs
@@ -399,13 +399,13 @@ pub extern "C" fn voicevox_get_version() -> *const c_char {
     };
 }
 
-/// 音声モデル。
+/// 音声モデルファイル。
 ///
 /// VVMファイルと対応する。
-/// <b>構築</b>(_construction_)は ::voicevox_voice_model_new_from_path で行い、<b>破棄</b>(_destruction_)は ::voicevox_voice_model_delete で行う。
+/// <b>構築</b>(_construction_)は ::voicevox_voice_model_file_open で行い、<b>破棄</b>(_destruction_)は ::voicevox_voice_model_file_close で行う。
 #[derive(Getters)]
-pub struct VoicevoxVoiceModel {
-    model: voicevox_core::blocking::VoiceModel,
+pub struct VoicevoxVoiceModelFile {
+    model: voicevox_core::blocking::VoiceModelFile,
     metas: CString,
 }
 
@@ -417,7 +417,7 @@ pub type VoicevoxVoiceModelId<'a> = &'a [u8; 16];
 /// VOICEVOXにおける、ある<b>話者</b>(_speaker_)のある<b>スタイル</b>(_style_)を指す。
 pub type VoicevoxStyleId = u32;
 
-/// VVMファイルから ::VoicevoxVoiceModel を<b>構築</b>(_construct_)する。
+/// VVMファイルを開く。
 ///
 /// @param [in] path vvmファイルへのUTF-8のファイルパス
 /// @param [out] out_model 構築先
@@ -429,60 +429,64 @@ pub type VoicevoxStyleId = u32;
 /// - `out_model`は<a href="#voicevox-core-safety">書き込みについて有効</a>でなければならない。
 /// }
 #[no_mangle]
-pub unsafe extern "C" fn voicevox_voice_model_new_from_path(
+pub unsafe extern "C" fn voicevox_voice_model_file_open(
     path: *const c_char,
-    out_model: NonNull<Box<VoicevoxVoiceModel>>,
+    out_model: NonNull<Box<VoicevoxVoiceModelFile>>,
 ) -> VoicevoxResultCode {
     init_logger_once();
     into_result_code_with_error((|| {
         let path = ensure_utf8(CStr::from_ptr(path))?;
-        let model = VoicevoxVoiceModel::from_path(path)?.into();
+        let model = VoicevoxVoiceModelFile::open(path)?.into();
         out_model.write_unaligned(model);
         Ok(())
     })())
 }
 
-/// ::VoicevoxVoiceModel からIDを取得する。
+/// ::VoicevoxVoiceModelFile からIDを取得する。
 ///
 /// @param [in] model 音声モデル
 ///
 /// @returns 音声モデルID
 ///
 /// \safety{
-/// - `model`は ::voicevox_voice_model_new_from_path で得たものでなければならず、また ::voicevox_voice_model_delete で解放されていてはいけない。
+/// - `model`は ::voicevox_voice_model_file_open で得たものでなければならず、また ::voicevox_voice_model_file_close で解放されていてはいけない。
 /// }
 #[no_mangle]
-pub extern "C" fn voicevox_voice_model_id(model: &VoicevoxVoiceModel) -> VoicevoxVoiceModelId<'_> {
+pub extern "C" fn voicevox_voice_model_file_id(
+    model: &VoicevoxVoiceModelFile,
+) -> VoicevoxVoiceModelId<'_> {
     init_logger_once();
     model.model.id_ref().as_bytes()
 }
 
-/// ::VoicevoxVoiceModel からメタ情報を取得する。
+/// ::VoicevoxVoiceModelFile からメタ情報を取得する。
 ///
 /// @param [in] model 音声モデル
 ///
 /// @returns メタ情報のJSON文字列
 ///
 /// \safety{
-/// - `model`は ::voicevox_voice_model_new_from_path で得たものでなければならず、また ::voicevox_voice_model_delete で解放されていてはいけない。
+/// - `model`は ::voicevox_voice_model_file_open で得たものでなければならず、また ::voicevox_voice_model_file_close で解放されていてはいけない。
 /// - 戻り値の文字列の<b>生存期間</b>(_lifetime_)は次にこの関数が呼ばれるか、`model`が破棄されるまでである。この生存期間を越えて文字列にアクセスしてはならない。
 /// }
 #[no_mangle]
-pub extern "C" fn voicevox_voice_model_get_metas_json(model: &VoicevoxVoiceModel) -> *const c_char {
+pub extern "C" fn voicevox_voice_model_file_get_metas_json(
+    model: &VoicevoxVoiceModelFile,
+) -> *const c_char {
     init_logger_once();
     model.metas().as_ptr()
 }
 
-/// ::VoicevoxVoiceModel を<b>破棄</b>(_destruct_)する。
+/// ::VoicevoxVoiceModelFile を、所有しているファイルディスクリプタを閉じた上で<b>破棄</b>(_destruct_)する。
 ///
 /// @param [in] model 破棄対象
 ///
 /// \safety{
-/// - `model`は ::voicevox_voice_model_new_from_path で得たものでなければならず、また既にこの関数で解放されていてはいけない。
+/// - `model`は ::voicevox_voice_model_file_open で得たものでなければならず、また既にこの関数で解放されていてはいけない。
 /// - `model`は以後<b>ダングリングポインタ</b>(_dangling pointer_)として扱われなくてはならない。
 /// }
 #[no_mangle]
-pub extern "C" fn voicevox_voice_model_delete(model: Box<VoicevoxVoiceModel>) {
+pub extern "C" fn voicevox_voice_model_file_close(model: Box<VoicevoxVoiceModelFile>) {
     init_logger_once();
     drop(model);
 }
@@ -506,7 +510,7 @@ pub struct VoicevoxSynthesizer {
 ///
 /// \safety{
 /// - `onnxruntime`は ::voicevox_onnxruntime_load_once または ::voicevox_onnxruntime_init_once で得たものでなければならない。
-/// - `open_jtalk`は ::voicevox_voice_model_new_from_path で得たものでなければならず、また ::voicevox_open_jtalk_rc_new で解放されていてはいけない。
+/// - `open_jtalk`は ::voicevox_open_jtalk_rc_new で得たものでなければならず、また ::voicevox_open_jtalk_rc_delete で解放されていてはいけない。
 /// - `out_synthesizer`は<a href="#voicevox-core-safety">書き込みについて有効</a>でなければならない。
 /// }
 #[no_mangle]
@@ -549,12 +553,12 @@ pub extern "C" fn voicevox_synthesizer_delete(synthesizer: Box<VoicevoxSynthesiz
 ///
 /// \safety{
 /// - `synthesizer`は ::voicevox_synthesizer_new で得たものでなければならず、また ::voicevox_synthesizer_delete で解放されていてはいけない。
-/// - `model`は ::voicevox_voice_model_new_from_path で得たものでなければならず、また ::voicevox_voice_model_delete で解放されていてはいけない。
+/// - `model`は ::voicevox_voice_model_file_open で得たものでなければならず、また ::voicevox_voice_model_file_close で解放されていてはいけない。
 /// }
 #[no_mangle]
 pub extern "C" fn voicevox_synthesizer_load_voice_model(
     synthesizer: &VoicevoxSynthesizer,
-    model: &VoicevoxVoiceModel,
+    model: &VoicevoxVoiceModelFile,
 ) -> VoicevoxResultCode {
     init_logger_once();
     into_result_code_with_error(synthesizer.load_voice_model(model.model()))
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/simple_tts.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/simple_tts.rs
index a4381f74d..1997d30e9 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/simple_tts.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/simple_tts.rs
@@ -29,7 +29,7 @@ impl assert_cdylib::TestCase for TestCase {
 
         let model = {
             let mut model = MaybeUninit::uninit();
-            assert_ok(lib.voicevox_voice_model_new_from_path(
+            assert_ok(lib.voicevox_voice_model_file_open(
                 c_api::SAMPLE_VOICE_MODEL_FILE_PATH.as_ptr(),
                 model.as_mut_ptr(),
             ));
@@ -88,7 +88,7 @@ impl assert_cdylib::TestCase for TestCase {
 
         std::assert_eq!(SNAPSHOTS.output[&self.text].wav_length, wav_length);
 
-        lib.voicevox_voice_model_delete(model);
+        lib.voicevox_voice_model_file_close(model);
         lib.voicevox_open_jtalk_rc_delete(openjtalk);
         lib.voicevox_synthesizer_delete(synthesizer);
         lib.voicevox_wav_free(wav);
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/synthesizer_new_output_json.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/synthesizer_new_output_json.rs
index 9ac8f4b35..ac662d06e 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/synthesizer_new_output_json.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/synthesizer_new_output_json.rs
@@ -63,7 +63,7 @@ impl assert_cdylib::TestCase for TestCase {
 
         let model = {
             let mut model = MaybeUninit::uninit();
-            assert_ok(lib.voicevox_voice_model_new_from_path(
+            assert_ok(lib.voicevox_voice_model_file_open(
                 c_api::SAMPLE_VOICE_MODEL_FILE_PATH.as_ptr(),
                 model.as_mut_ptr(),
             ));
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/tts_via_audio_query.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/tts_via_audio_query.rs
index 0f2ff5fc8..2536a73d3 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/tts_via_audio_query.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/tts_via_audio_query.rs
@@ -29,7 +29,7 @@ impl assert_cdylib::TestCase for TestCase {
 
         let model = {
             let mut model = MaybeUninit::uninit();
-            assert_ok(lib.voicevox_voice_model_new_from_path(
+            assert_ok(lib.voicevox_voice_model_file_open(
                 c_api::SAMPLE_VOICE_MODEL_FILE_PATH.as_ptr(),
                 model.as_mut_ptr(),
             ));
@@ -99,7 +99,7 @@ impl assert_cdylib::TestCase for TestCase {
 
         std::assert_eq!(SNAPSHOTS.output[&self.text].wav_length, wav_length);
 
-        lib.voicevox_voice_model_delete(model);
+        lib.voicevox_voice_model_file_close(model);
         lib.voicevox_open_jtalk_rc_delete(openjtalk);
         lib.voicevox_synthesizer_delete(synthesizer);
         lib.voicevox_json_free(audio_query);
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_load.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_load.rs
index 64e062251..d044962ae 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_load.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_load.rs
@@ -47,7 +47,7 @@ impl assert_cdylib::TestCase for TestCase {
 
         let model = {
             let mut model = MaybeUninit::uninit();
-            assert_ok(lib.voicevox_voice_model_new_from_path(
+            assert_ok(lib.voicevox_voice_model_file_open(
                 c_api::SAMPLE_VOICE_MODEL_FILE_PATH.as_ptr(),
                 model.as_mut_ptr(),
             ));
@@ -119,7 +119,7 @@ impl assert_cdylib::TestCase for TestCase {
             audio_query_with_dict.get("kana")
         );
 
-        lib.voicevox_voice_model_delete(model);
+        lib.voicevox_voice_model_file_close(model);
         lib.voicevox_open_jtalk_rc_delete(openjtalk);
         lib.voicevox_synthesizer_delete(synthesizer);
         lib.voicevox_user_dict_delete(dict);
diff --git a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/Synthesizer.java b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/Synthesizer.java
index 2fac70741..c59f8ca1e 100644
--- a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/Synthesizer.java
+++ b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/Synthesizer.java
@@ -54,10 +54,11 @@ public boolean isGpuMode() {
    * @return メタ情報。
    */
   @Nonnull
-  public VoiceModel.SpeakerMeta[] metas() {
+  public VoiceModelFile.SpeakerMeta[] metas() {
     Gson gson = new Gson();
     String metasJson = rsGetMetasJson();
-    VoiceModel.SpeakerMeta[] rawMetas = gson.fromJson(metasJson, VoiceModel.SpeakerMeta[].class);
+    VoiceModelFile.SpeakerMeta[] rawMetas =
+        gson.fromJson(metasJson, VoiceModelFile.SpeakerMeta[].class);
     if (rawMetas == null) {
       throw new NullPointerException("metas");
     }
@@ -70,7 +71,7 @@ public VoiceModel.SpeakerMeta[] metas() {
    * @param voiceModel 読み込むモデル。
    * @throws InvalidModelDataException 無効なモデルデータの場合。
    */
-  public void loadVoiceModel(VoiceModel voiceModel) throws InvalidModelDataException {
+  public void loadVoiceModel(VoiceModelFile voiceModel) throws InvalidModelDataException {
     rsLoadVoiceModel(voiceModel);
   }
 
@@ -284,7 +285,7 @@ public TtsConfigurator tts(String text, int styleId) {
   @Nonnull
   private native String rsGetMetasJson();
 
-  private native void rsLoadVoiceModel(VoiceModel voiceModel) throws InvalidModelDataException;
+  private native void rsLoadVoiceModel(VoiceModelFile voiceModel) throws InvalidModelDataException;
 
   private native void rsUnloadVoiceModel(UUID voiceModelId);
 
diff --git a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/VoiceModel.java b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/VoiceModelFile.java
similarity index 84%
rename from crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/VoiceModel.java
rename to crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/VoiceModelFile.java
index d8c002f0f..b2cceca3f 100644
--- a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/VoiceModel.java
+++ b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/VoiceModelFile.java
@@ -5,10 +5,11 @@
 import com.google.gson.annotations.SerializedName;
 import jakarta.annotation.Nonnull;
 import jakarta.annotation.Nullable;
+import java.io.Closeable;
 import java.util.UUID;
 
-/** 音声モデル。 */
-public class VoiceModel extends Dll {
+/** 音声モデルファイル。 */
+public class VoiceModelFile extends Dll implements Closeable {
   private long handle;
 
   /** ID。 */
@@ -17,8 +18,8 @@ public class VoiceModel extends Dll {
   /** メタ情報。 */
   @Nonnull public final SpeakerMeta[] metas;
 
-  public VoiceModel(String modelPath) {
-    rsFromPath(modelPath);
+  public VoiceModelFile(String modelPath) {
+    rsOpen(modelPath);
     id = rsGetId();
     String metasJson = rsGetMetasJson();
     Gson gson = new Gson();
@@ -29,12 +30,23 @@ public VoiceModel(String modelPath) {
     metas = rawMetas;
   }
 
+  /**
+   * VVMファイルを閉じる。
+   *
+   * <p>このメソッドが呼ばれた段階で{@link Synthesizer#loadVoiceModel}からのアクセスが継続中の場合、アクセスが終わるまで待つ。
+   */
+  @Override
+  public void close() {
+    rsClose();
+  }
+
+  @Override
   protected void finalize() throws Throwable {
     rsDrop();
     super.finalize();
   }
 
-  private native void rsFromPath(String modelPath);
+  private native void rsOpen(String modelPath);
 
   @Nonnull
   private native UUID rsGetId();
@@ -42,6 +54,8 @@ protected void finalize() throws Throwable {
   @Nonnull
   private native String rsGetMetasJson();
 
+  private native void rsClose();
+
   private native void rsDrop();
 
   /** 話者（speaker）のメタ情報。 */
diff --git a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/MetaTest.java b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/MetaTest.java
index 60df7359f..ece3a87ff 100644
--- a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/MetaTest.java
+++ b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/MetaTest.java
@@ -14,7 +14,8 @@ void checkLoad() {
     // cwdはvoicevox_core/crates/voicevox_core_java_api/lib
     String cwd = System.getProperty("user.dir");
     File path = new File(cwd + "/../../test_util/data/model/sample.vvm");
-    VoiceModel model = new VoiceModel(path.getAbsolutePath());
-    assertNotNull(model.metas);
+    try (VoiceModelFile model = new VoiceModelFile(path.getAbsolutePath())) {
+      assertNotNull(model.metas);
+    }
   }
 }
diff --git a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/SynthesizerTest.java b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/SynthesizerTest.java
index 0dfa17ea3..4c7d16f56 100644
--- a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/SynthesizerTest.java
+++ b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/SynthesizerTest.java
@@ -49,58 +49,62 @@ boolean checkAllMoras(
   @Test
   void checkModel() throws InvalidModelDataException {
     Onnxruntime onnxruntime = loadOnnxruntime();
-    VoiceModel model = loadModel();
     OpenJtalk openJtalk = loadOpenJtalk();
     Synthesizer synthesizer = Synthesizer.builder(onnxruntime, openJtalk).build();
 
     assertTrue(synthesizer.metas().length == 0);
 
-    synthesizer.loadVoiceModel(model);
+    try (VoiceModelFile model = openModel()) {
+      synthesizer.loadVoiceModel(model);
 
-    assertTrue(synthesizer.metas().length >= 1);
-    assertTrue(synthesizer.isLoadedVoiceModel(model.id));
+      assertTrue(synthesizer.metas().length >= 1);
+      assertTrue(synthesizer.isLoadedVoiceModel(model.id));
 
-    synthesizer.unloadVoiceModel(model.id);
+      synthesizer.unloadVoiceModel(model.id);
 
-    assertTrue(synthesizer.metas().length == 0);
-    assertFalse(synthesizer.isLoadedVoiceModel(model.id));
+      assertTrue(synthesizer.metas().length == 0);
+      assertFalse(synthesizer.isLoadedVoiceModel(model.id));
+    }
   }
 
   @Test
   void checkAudioQuery() throws RunModelException, InvalidModelDataException {
-    VoiceModel model = loadModel();
     Onnxruntime onnxruntime = loadOnnxruntime();
     OpenJtalk openJtalk = loadOpenJtalk();
     Synthesizer synthesizer = Synthesizer.builder(onnxruntime, openJtalk).build();
-    synthesizer.loadVoiceModel(model);
-    AudioQuery query = synthesizer.createAudioQuery("こんにちは", model.metas[0].styles[0].id);
 
-    synthesizer.synthesis(query, model.metas[0].styles[0].id).execute();
+    try (VoiceModelFile model = openModel()) {
+      synthesizer.loadVoiceModel(model);
+    }
+
+    AudioQuery query = synthesizer.createAudioQuery("こんにちは", synthesizer.metas()[0].styles[0].id);
+    synthesizer.synthesis(query, synthesizer.metas()[0].styles[0].id).execute();
   }
 
   @Test
   void checkAccentPhrases() throws RunModelException, InvalidModelDataException {
-    VoiceModel model = loadModel();
     OpenJtalk openJtalk = loadOpenJtalk();
     Onnxruntime onnxruntime = loadOnnxruntime();
     Synthesizer synthesizer = Synthesizer.builder(onnxruntime, openJtalk).build();
-    synthesizer.loadVoiceModel(model);
+    try (VoiceModelFile model = openModel()) {
+      synthesizer.loadVoiceModel(model);
+    }
     List<AccentPhrase> accentPhrases =
-        synthesizer.createAccentPhrases("こんにちは", model.metas[0].styles[0].id);
+        synthesizer.createAccentPhrases("こんにちは", synthesizer.metas()[0].styles[0].id);
     List<AccentPhrase> accentPhrases2 =
-        synthesizer.replaceMoraPitch(accentPhrases, model.metas[1].styles[0].id);
+        synthesizer.replaceMoraPitch(accentPhrases, synthesizer.metas()[1].styles[0].id);
     assertTrue(
         checkAllMoras(
             accentPhrases, accentPhrases2, (mora, otherMora) -> mora.pitch != otherMora.pitch));
     List<AccentPhrase> accentPhrases3 =
-        synthesizer.replacePhonemeLength(accentPhrases, model.metas[1].styles[0].id);
+        synthesizer.replacePhonemeLength(accentPhrases, synthesizer.metas()[1].styles[0].id);
     assertTrue(
         checkAllMoras(
             accentPhrases,
             accentPhrases3,
             (mora, otherMora) -> mora.vowelLength != otherMora.vowelLength));
     List<AccentPhrase> accentPhrases4 =
-        synthesizer.replaceMoraData(accentPhrases, model.metas[1].styles[0].id);
+        synthesizer.replaceMoraData(accentPhrases, synthesizer.metas()[1].styles[0].id);
     assertTrue(
         checkAllMoras(
             accentPhrases,
@@ -111,11 +115,12 @@ void checkAccentPhrases() throws RunModelException, InvalidModelDataException {
 
   @Test
   void checkTts() throws RunModelException, InvalidModelDataException {
-    VoiceModel model = loadModel();
     Onnxruntime onnxruntime = loadOnnxruntime();
     OpenJtalk openJtalk = loadOpenJtalk();
     Synthesizer synthesizer = Synthesizer.builder(onnxruntime, openJtalk).build();
-    synthesizer.loadVoiceModel(model);
-    synthesizer.tts("こんにちは", model.metas[0].styles[0].id);
+    try (VoiceModelFile model = openModel()) {
+      synthesizer.loadVoiceModel(model);
+    }
+    synthesizer.tts("こんにちは", synthesizer.metas()[0].styles[0].id);
   }
 }
diff --git a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/TestUtils.java b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/TestUtils.java
index 9ab731cd9..f505c327f 100644
--- a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/TestUtils.java
+++ b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/TestUtils.java
@@ -3,13 +3,13 @@
 import java.io.File;
 
 class TestUtils {
-  VoiceModel loadModel() {
+  VoiceModelFile openModel() {
     // cwdはvoicevox_core/crates/voicevox_core_java_api/lib
     String cwd = System.getProperty("user.dir");
     File path = new File(cwd + "/../../test_util/data/model/sample.vvm");
 
     try {
-      return new VoiceModel(path.getCanonicalPath());
+      return new VoiceModelFile(path.getCanonicalPath());
     } catch (Exception e) {
       throw new RuntimeException(e);
     }
diff --git a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/UserDictTest.java b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/UserDictTest.java
index 2fcfc06ab..ed9a94e8e 100644
--- a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/UserDictTest.java
+++ b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/UserDictTest.java
@@ -15,21 +15,24 @@ class UserDictTest extends TestUtils {
   // 辞書ロード前後でkanaが異なることを確認する
   @Test
   void checkLoad() throws RunModelException, InvalidModelDataException, LoadUserDictException {
-    VoiceModel model = loadModel();
     Onnxruntime onnxruntime = loadOnnxruntime();
     OpenJtalk openJtalk = loadOpenJtalk();
     Synthesizer synthesizer = Synthesizer.builder(onnxruntime, openJtalk).build();
     UserDict userDict = new UserDict();
-    synthesizer.loadVoiceModel(model);
+    try (VoiceModelFile model = openModel()) {
+      synthesizer.loadVoiceModel(model);
+    }
     AudioQuery query1 =
         synthesizer.createAudioQuery(
-            "this_word_should_not_exist_in_default_dictionary", model.metas[0].styles[0].id);
+            "this_word_should_not_exist_in_default_dictionary",
+            synthesizer.metas()[0].styles[0].id);
 
     userDict.addWord(new UserDict.Word("this_word_should_not_exist_in_default_dictionary", "テスト"));
     openJtalk.useUserDict(userDict);
     AudioQuery query2 =
         synthesizer.createAudioQuery(
-            "this_word_should_not_exist_in_default_dictionary", model.metas[0].styles[0].id);
+            "this_word_should_not_exist_in_default_dictionary",
+            synthesizer.metas()[0].styles[0].id);
     assertTrue(query1.kana != query2.kana);
   }
 
diff --git a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/VoiceModelTest.java b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/VoiceModelTest.java
index 5a720b07f..2bdba9c28 100644
--- a/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/VoiceModelTest.java
+++ b/crates/voicevox_core_java_api/lib/src/test/java/jp/hiroshiba/voicevoxcore/VoiceModelTest.java
@@ -17,7 +17,10 @@ class VoiceModelTest extends TestUtils {
   @Test
   void idShouldBePreservedAsIs() throws IOException {
     UUID expected = UUID.fromString(Manifest.readJson().id);
-    UUID actual = loadModel().id;
+    UUID actual;
+    try (VoiceModelFile model = openModel()) {
+      actual = model.id;
+    }
     assertEquals(expected, actual);
   }
 
diff --git a/crates/voicevox_core_java_api/src/common.rs b/crates/voicevox_core_java_api/src/common.rs
index 1b45dd44d..cb2a89a7f 100644
--- a/crates/voicevox_core_java_api/src/common.rs
+++ b/crates/voicevox_core_java_api/src/common.rs
@@ -1,4 +1,4 @@
-use std::{error::Error as _, iter};
+use std::{error::Error as _, iter, mem, ops::Deref};
 
 use derive_more::From;
 use easy_ext::ext;
@@ -6,7 +6,9 @@ use jni::{
     objects::{JObject, JThrowable},
     JNIEnv,
 };
+use tracing::{debug, warn};
 use uuid::Uuid;
+use voicevox_core::__internal::interop::raii::MaybeClosed;
 
 #[macro_export]
 macro_rules! object {
@@ -154,6 +156,9 @@ where
                             env.throw_new("java/lang/IllegalArgumentException", error.to_string())
                         )
                     }
+                    JavaApiError::IllegalState(msg) => {
+                        or_panic!(env.throw_new("java/lang/IllegalStateException", msg))
+                    }
                 };
             }
             fallback
@@ -161,6 +166,8 @@ where
     }
 }
 
+type JavaApiResult<T> = Result<T, JavaApiError>;
+
 #[derive(From, Debug)]
 pub(crate) enum JavaApiError {
     #[from]
@@ -173,6 +180,69 @@ pub(crate) enum JavaApiError {
     Uuid(uuid::Error),
 
     DeJson(serde_json::Error),
+
+    IllegalState(String),
+}
+
+pub(crate) struct Closable<T: HasJavaClassIdent>(std::sync::RwLock<MaybeClosed<T>>);
+
+impl<T: HasJavaClassIdent> Closable<T> {
+    pub(crate) fn new(content: T) -> Self {
+        Self(MaybeClosed::Open(content).into())
+    }
+
+    pub(crate) fn read(&self) -> JavaApiResult<impl Deref<Target = T> + '_> {
+        let lock = self.0.try_read().map_err(|e| match e {
+            std::sync::TryLockError::Poisoned(e) => panic!("{e}"),
+            std::sync::TryLockError::WouldBlock => {
+                JavaApiError::IllegalState(format!("The `{}` is being closed", T::JAVA_CLASS_IDENT))
+            }
+        })?;
+
+        voicevox_core::__internal::interop::raii::try_map_guard(lock, |lock| match &**lock {
+            MaybeClosed::Open(content) => Ok(content),
+            MaybeClosed::Closed => Err(JavaApiError::IllegalState(format!(
+                "The `{}` is closed",
+                T::JAVA_CLASS_IDENT,
+            ))),
+        })
+    }
+
+    pub(crate) fn close(&self) {
+        let lock = &mut *match self.0.try_write() {
+            Ok(lock) => lock,
+            Err(std::sync::TryLockError::Poisoned(e)) => panic!("{e}"),
+            Err(std::sync::TryLockError::WouldBlock) => {
+                self.0.write().unwrap_or_else(|e| panic!("{e}"))
+            }
+        };
+
+        if matches!(*lock, MaybeClosed::Open(_)) {
+            debug!("Closing a `{}`", T::JAVA_CLASS_IDENT);
+        }
+        drop(mem::replace(lock, MaybeClosed::Closed));
+    }
+}
+
+impl<T: HasJavaClassIdent> Drop for Closable<T> {
+    fn drop(&mut self) {
+        let content = mem::replace(
+            self.0.get_mut().unwrap_or_else(|e| panic!("{e}")),
+            MaybeClosed::Closed,
+        );
+        if let MaybeClosed::Open(content) = content {
+            warn!(
+                "デストラクタにより`{}`のクローズを行います。通常は、可能な限り`close`でクローズす\
+                 るようにして下さい",
+                T::JAVA_CLASS_IDENT,
+            );
+            drop(content);
+        }
+    }
+}
+
+pub(crate) trait HasJavaClassIdent {
+    const JAVA_CLASS_IDENT: &str;
 }
 
 #[ext(JNIEnvExt)]
diff --git a/crates/voicevox_core_java_api/src/synthesizer.rs b/crates/voicevox_core_java_api/src/synthesizer.rs
index 9ebd98e47..32cdf1200 100644
--- a/crates/voicevox_core_java_api/src/synthesizer.rs
+++ b/crates/voicevox_core_java_api/src/synthesizer.rs
@@ -107,8 +107,9 @@ unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_Synthesizer_rsLoadVoice
 ) {
     throw_if_err(env, (), |env| {
         let model = env
-            .get_rust_field::<_, _, Arc<voicevox_core::blocking::VoiceModel>>(&model, "handle")?
+            .get_rust_field::<_, _, crate::voice_model::VoiceModelFile>(&model, "handle")?
             .clone();
+        let model = model.read()?;
         let internal = env
             .get_rust_field::<_, _, Arc<voicevox_core::blocking::Synthesizer<voicevox_core::blocking::OpenJtalk>>>(
                 &this, "handle",
diff --git a/crates/voicevox_core_java_api/src/voice_model.rs b/crates/voicevox_core_java_api/src/voice_model.rs
index 1ea90ba8c..ef24edbfe 100644
--- a/crates/voicevox_core_java_api/src/voice_model.rs
+++ b/crates/voicevox_core_java_api/src/voice_model.rs
@@ -1,14 +1,20 @@
 use std::{borrow::Cow, sync::Arc};
 
-use crate::common::{throw_if_err, JNIEnvExt as _};
+use crate::common::{throw_if_err, Closable, HasJavaClassIdent, JNIEnvExt as _};
 use jni::{
     objects::{JObject, JString},
     sys::jobject,
     JNIEnv,
 };
 
+pub(crate) type VoiceModelFile = Arc<Closable<voicevox_core::blocking::VoiceModelFile>>;
+
+impl HasJavaClassIdent for voicevox_core::blocking::VoiceModelFile {
+    const JAVA_CLASS_IDENT: &str = "VoiceModelFile";
+}
+
 #[no_mangle]
-unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_VoiceModel_rsFromPath<'local>(
+unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_VoiceModelFile_rsOpen<'local>(
     env: JNIEnv<'local>,
     this: JObject<'local>,
     model_path: JString<'local>,
@@ -17,23 +23,24 @@ unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_VoiceModel_rsFromPath<'
         let model_path = env.get_string(&model_path)?;
         let model_path = &*Cow::from(&model_path);
 
-        let internal = voicevox_core::blocking::VoiceModel::from_path(model_path)?;
-
-        env.set_rust_field(&this, "handle", Arc::new(internal))?;
+        let internal = voicevox_core::blocking::VoiceModelFile::open(model_path)?;
+        let internal = Arc::new(Closable::new(internal));
+        env.set_rust_field(&this, "handle", internal)?;
 
         Ok(())
     })
 }
 
 #[no_mangle]
-unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_VoiceModel_rsGetId<'local>(
+unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_VoiceModelFile_rsGetId<'local>(
     env: JNIEnv<'local>,
     this: JObject<'local>,
 ) -> jobject {
     throw_if_err(env, std::ptr::null_mut(), |env| {
         let internal = env
-            .get_rust_field::<_, _, Arc<voicevox_core::blocking::VoiceModel>>(&this, "handle")?
+            .get_rust_field::<_, _, VoiceModelFile>(&this, "handle")?
             .clone();
+        let internal = internal.read()?;
 
         let id = env.new_uuid(internal.id().raw_voice_model_id())?;
 
@@ -42,14 +49,15 @@ unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_VoiceModel_rsGetId<'loc
 }
 
 #[no_mangle]
-unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_VoiceModel_rsGetMetasJson<'local>(
+unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_VoiceModelFile_rsGetMetasJson<'local>(
     env: JNIEnv<'local>,
     this: JObject<'local>,
 ) -> jobject {
     throw_if_err(env, std::ptr::null_mut(), |env| {
         let internal = env
-            .get_rust_field::<_, _, Arc<voicevox_core::blocking::VoiceModel>>(&this, "handle")?
+            .get_rust_field::<_, _, VoiceModelFile>(&this, "handle")?
             .clone();
+        let internal = internal.read()?;
 
         let metas = internal.metas();
         let metas_json = serde_json::to_string(&metas).expect("should not fail");
@@ -58,7 +66,25 @@ unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_VoiceModel_rsGetMetasJs
 }
 
 #[no_mangle]
-unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_VoiceModel_rsDrop<'local>(
+unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_VoiceModelFile_rsClose<'local>(
+    env: JNIEnv<'local>,
+    this: JObject<'local>,
+) {
+    throw_if_err(env, (), |env| {
+        // Close through a clone of the `Arc` and leave the `handle` field set. Taking the
+        // field would null it out, so a repeated `close()` (which `java.io.Closeable`
+        // requires to be a no-op) and any later access would fail with a JNI null-pointer
+        // error instead of observing `MaybeClosed::Closed`.
+        let internal = env
+            .get_rust_field::<_, _, VoiceModelFile>(&this, "handle")?
+            .clone();
+        internal.close();
+        Ok(())
+    })
+}
+
+#[no_mangle]
+unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_VoiceModelFile_rsDrop<'local>(
     env: JNIEnv<'local>,
     this: JObject<'local>,
 ) {
diff --git a/crates/voicevox_core_python_api/Cargo.toml b/crates/voicevox_core_python_api/Cargo.toml
index e0877b623..a2c6f7405 100644
--- a/crates/voicevox_core_python_api/Cargo.toml
+++ b/crates/voicevox_core_python_api/Cargo.toml
@@ -10,6 +10,7 @@ crate-type = ["cdylib"]
 [dependencies]
 camino.workspace = true
 easy-ext.workspace = true
+futures-lite.workspace = true
 log.workspace = true
 once_cell.workspace = true
 pyo3 = { workspace = true, features = ["abi3-py38", "extension-module"] }
@@ -17,6 +18,7 @@ pyo3-asyncio = { workspace = true, features = ["tokio-runtime"] }
 pyo3-log.workspace = true
 serde = { workspace = true, features = ["derive"] }
 serde_json.workspace = true
+tokio = { workspace = true, features = ["rt", "sync"] }
 tracing = { workspace = true, features = ["log"] }
 uuid.workspace = true
 voicevox_core = { workspace = true, features = ["load-onnxruntime"] }
diff --git a/crates/voicevox_core_python_api/python/test/test_asyncio_metas.py b/crates/voicevox_core_python_api/python/test/test_asyncio_metas.py
index aea4af999..3b6f857e3 100644
--- a/crates/voicevox_core_python_api/python/test/test_asyncio_metas.py
+++ b/crates/voicevox_core_python_api/python/test/test_asyncio_metas.py
@@ -7,15 +7,15 @@
 import conftest
 import pytest
 import pytest_asyncio
-from voicevox_core.asyncio import Onnxruntime, OpenJtalk, Synthesizer, VoiceModel
+from voicevox_core.asyncio import Onnxruntime, OpenJtalk, Synthesizer, VoiceModelFile
 
 
-def test_voice_model_metas_works(voice_model: VoiceModel) -> None:
+def test_voice_model_metas_works(voice_model: VoiceModelFile) -> None:
     _ = voice_model.metas
 
 
 @pytest.mark.asyncio
-async def test_synthesizer_metas_works(voice_model: VoiceModel) -> None:
+async def test_synthesizer_metas_works(voice_model: VoiceModelFile) -> None:
     synthesizer = Synthesizer(
         await Onnxruntime.load_once(filename=conftest.onnxruntime_filename),
         await OpenJtalk.new(conftest.open_jtalk_dic_dir),
@@ -25,5 +25,5 @@ async def test_synthesizer_metas_works(voice_model: VoiceModel) -> None:
 
 
 @pytest_asyncio.fixture
-async def voice_model() -> VoiceModel:
-    return await VoiceModel.from_path(conftest.model_dir)
+async def voice_model() -> VoiceModelFile:
+    return await VoiceModelFile.open(conftest.model_dir)
diff --git a/crates/voicevox_core_python_api/python/test/test_asyncio_user_dict_load.py b/crates/voicevox_core_python_api/python/test/test_asyncio_user_dict_load.py
index d6906a6ac..b6fe50986 100644
--- a/crates/voicevox_core_python_api/python/test/test_asyncio_user_dict_load.py
+++ b/crates/voicevox_core_python_api/python/test/test_asyncio_user_dict_load.py
@@ -19,7 +19,7 @@ async def test_user_dict_load() -> None:
         filename=conftest.onnxruntime_filename
     )
     open_jtalk = await voicevox_core.asyncio.OpenJtalk.new(conftest.open_jtalk_dic_dir)
-    model = await voicevox_core.asyncio.VoiceModel.from_path(conftest.model_dir)
+    model = await voicevox_core.asyncio.VoiceModelFile.open(conftest.model_dir)
     synthesizer = voicevox_core.asyncio.Synthesizer(onnxruntime, open_jtalk)
 
     await synthesizer.load_voice_model(model)
diff --git a/crates/voicevox_core_python_api/python/test/test_blocking_metas.py b/crates/voicevox_core_python_api/python/test/test_blocking_metas.py
index 00eade04b..a6aa6441d 100644
--- a/crates/voicevox_core_python_api/python/test/test_blocking_metas.py
+++ b/crates/voicevox_core_python_api/python/test/test_blocking_metas.py
@@ -6,14 +6,14 @@
 
 import conftest
 import pytest
-from voicevox_core.blocking import Onnxruntime, OpenJtalk, Synthesizer, VoiceModel
+from voicevox_core.blocking import Onnxruntime, OpenJtalk, Synthesizer, VoiceModelFile
 
 
-def test_voice_model_metas_works(voice_model: VoiceModel) -> None:
+def test_voice_model_metas_works(voice_model: VoiceModelFile) -> None:
     _ = voice_model.metas
 
 
-def test_synthesizer_metas_works(voice_model: VoiceModel) -> None:
+def test_synthesizer_metas_works(voice_model: VoiceModelFile) -> None:
     synthesizer = Synthesizer(
         Onnxruntime.load_once(filename=conftest.onnxruntime_filename),
         OpenJtalk(conftest.open_jtalk_dic_dir),
@@ -23,5 +23,5 @@ def test_synthesizer_metas_works(voice_model: VoiceModel) -> None:
 
 
 @pytest.fixture
-def voice_model() -> VoiceModel:
-    return VoiceModel.from_path(conftest.model_dir)
+def voice_model() -> VoiceModelFile:
+    return VoiceModelFile.open(conftest.model_dir)
diff --git a/crates/voicevox_core_python_api/python/test/test_blocking_user_dict_load.py b/crates/voicevox_core_python_api/python/test/test_blocking_user_dict_load.py
index 198becbe2..e8a5bd350 100644
--- a/crates/voicevox_core_python_api/python/test/test_blocking_user_dict_load.py
+++ b/crates/voicevox_core_python_api/python/test/test_blocking_user_dict_load.py
@@ -17,7 +17,7 @@ def test_user_dict_load() -> None:
         filename=conftest.onnxruntime_filename
     )
     open_jtalk = voicevox_core.blocking.OpenJtalk(conftest.open_jtalk_dic_dir)
-    model = voicevox_core.blocking.VoiceModel.from_path(conftest.model_dir)
+    model = voicevox_core.blocking.VoiceModelFile.open(conftest.model_dir)
     synthesizer = voicevox_core.blocking.Synthesizer(onnxruntime, open_jtalk)
 
     synthesizer.load_voice_model(model)
diff --git a/crates/voicevox_core_python_api/python/test/test_pseudo_raii_for_asyncio_synthesizer.py b/crates/voicevox_core_python_api/python/test/test_pseudo_raii_for_asyncio_synthesizer.py
index 26d389477..bfadf8471 100644
--- a/crates/voicevox_core_python_api/python/test/test_pseudo_raii_for_asyncio_synthesizer.py
+++ b/crates/voicevox_core_python_api/python/test/test_pseudo_raii_for_asyncio_synthesizer.py
@@ -10,28 +10,32 @@
 from voicevox_core.asyncio import Onnxruntime, OpenJtalk, Synthesizer
 
 
-def test_enter_returns_workable_self(synthesizer: Synthesizer) -> None:
-    with synthesizer as ctx:
+@pytest.mark.asyncio
+async def test_enter_returns_workable_self(synthesizer: Synthesizer) -> None:
+    async with synthesizer as ctx:
         assert ctx is synthesizer
         _ = synthesizer.metas
 
 
-def test_closing_multiple_times_is_allowed(synthesizer: Synthesizer) -> None:
-    with synthesizer:
-        with synthesizer:
+@pytest.mark.asyncio
+async def test_closing_multiple_times_is_allowed(synthesizer: Synthesizer) -> None:
+    async with synthesizer:
+        async with synthesizer:
             pass
-    synthesizer.close()
-    synthesizer.close()
+    await synthesizer.close()
+    await synthesizer.close()
 
 
-def test_access_after_close_denied(synthesizer: Synthesizer) -> None:
-    synthesizer.close()
+@pytest.mark.asyncio
+async def test_access_after_close_denied(synthesizer: Synthesizer) -> None:
+    await synthesizer.close()
     with pytest.raises(ValueError, match="^The `Synthesizer` is closed$"):
         _ = synthesizer.metas
 
 
-def test_access_after_exit_denied(synthesizer: Synthesizer) -> None:
-    with synthesizer:
+@pytest.mark.asyncio
+async def test_access_after_exit_denied(synthesizer: Synthesizer) -> None:
+    async with synthesizer:
         pass
     with pytest.raises(ValueError, match="^The `Synthesizer` is closed$"):
         _ = synthesizer.metas
diff --git a/crates/voicevox_core_python_api/python/voicevox_core/_rust/asyncio.pyi b/crates/voicevox_core_python_api/python/voicevox_core/_rust/asyncio.pyi
index 7652a7d2c..b386d2d5a 100644
--- a/crates/voicevox_core_python_api/python/voicevox_core/_rust/asyncio.pyi
+++ b/crates/voicevox_core_python_api/python/voicevox_core/_rust/asyncio.pyi
@@ -14,14 +14,14 @@ if TYPE_CHECKING:
         VoiceModelId,
     )
 
-class VoiceModel:
+class VoiceModelFile:
     """
-    音声モデル。"""
+    音声モデルファイル。"""
 
     @staticmethod
-    async def from_path(path: Union[str, PathLike[str]]) -> VoiceModel:
+    async def open(path: Union[str, PathLike[str]]) -> VoiceModelFile:
         """
-        VVMファイルから ``VoiceModel`` を生成する。
+        VVMファイルを開く。
 
         Parameters
         ----------
@@ -29,6 +29,14 @@ class VoiceModel:
             VVMファイルへのパス。
         """
         ...
+    async def close(self) -> None:
+        """
+        Close the VVM file.
+
+        If an access from :meth:`Synthesizer.load_voice_model` is still in progress
+        when this method is called, wait until that access has finished.
+        """
+        ...
     @property
     def id(self) -> VoiceModelId:
         """ID。"""
@@ -37,6 +45,8 @@ class VoiceModel:
     def metas(self) -> List[SpeakerMeta]:
         """メタ情報。"""
         ...
+    async def __aenter__(self) -> "VoiceModelFile": ...
+    async def __aexit__(self, exc_type, exc_value, traceback) -> None: ...
 
 class Onnxruntime:
     """
@@ -160,8 +170,8 @@ class Synthesizer:
         cpu_num_threads: int = 0,
     ) -> None: ...
     def __repr__(self) -> str: ...
-    def __enter__(self) -> "Synthesizer": ...
-    def __exit__(self, exc_type, exc_value, traceback) -> None: ...
+    async def __aenter__(self) -> "Synthesizer": ...
+    async def __aexit__(self, exc_type, exc_value, traceback) -> None: ...
     @property
     def onnxruntime(self) -> Onnxruntime:
         """ONNX Runtime。"""
@@ -174,7 +184,7 @@ class Synthesizer:
     def metas(self) -> List[SpeakerMeta]:
         """メタ情報。"""
         ...
-    async def load_voice_model(self, model: VoiceModel) -> None:
+    async def load_voice_model(self, model: VoiceModelFile) -> None:
         """
         モデルを読み込む。
 
@@ -411,7 +421,7 @@ class Synthesizer:
         WAVデータ。
         """
         ...
-    def close(self) -> None: ...
+    async def close(self) -> None: ...
 
 class UserDict:
     """ユーザー辞書。"""
diff --git a/crates/voicevox_core_python_api/python/voicevox_core/_rust/blocking.pyi b/crates/voicevox_core_python_api/python/voicevox_core/_rust/blocking.pyi
index 602ff31bc..891ceb05e 100644
--- a/crates/voicevox_core_python_api/python/voicevox_core/_rust/blocking.pyi
+++ b/crates/voicevox_core_python_api/python/voicevox_core/_rust/blocking.pyi
@@ -14,14 +14,14 @@ if TYPE_CHECKING:
         VoiceModelId,
     )
 
-class VoiceModel:
+class VoiceModelFile:
     """
-    音声モデル。"""
+    音声モデルファイル。"""
 
     @staticmethod
-    def from_path(path: Union[str, PathLike[str]]) -> VoiceModel:
+    def open(path: Union[str, PathLike[str]]) -> VoiceModelFile:
         """
-        VVMファイルから ``VoiceModel`` を生成する。
+        VVMファイルを開く。
 
         Parameters
         ----------
@@ -29,6 +29,14 @@ class VoiceModel:
             VVMファイルへのパス。
         """
         ...
+    def close(self) -> None:
+        """
+        Close the VVM file.
+
+        If an access from :meth:`Synthesizer.load_voice_model` is still in progress
+        when this method is called, wait until that access has finished.
+        """
+        ...
     @property
     def id(self) -> VoiceModelId:
         """ID。"""
@@ -37,6 +45,8 @@ class VoiceModel:
     def metas(self) -> List[SpeakerMeta]:
         """メタ情報。"""
         ...
+    def __enter__(self) -> "VoiceModelFile": ...
+    def __exit__(self, exc_type, exc_value, traceback) -> None: ...
 
 class Onnxruntime:
     """
@@ -169,7 +179,7 @@ class Synthesizer:
     def metas(self) -> List[SpeakerMeta]:
         """メタ情報。"""
         ...
-    def load_voice_model(self, model: VoiceModel) -> None:
+    def load_voice_model(self, model: VoiceModelFile) -> None:
         """
         モデルを読み込む。
 
diff --git a/crates/voicevox_core_python_api/python/voicevox_core/asyncio.py b/crates/voicevox_core_python_api/python/voicevox_core/asyncio.py
index 2cff19cdf..0dc5e0adb 100644
--- a/crates/voicevox_core_python_api/python/voicevox_core/asyncio.py
+++ b/crates/voicevox_core_python_api/python/voicevox_core/asyncio.py
@@ -1,4 +1,4 @@
 # pyright: reportMissingModuleSource=false
-from ._rust.asyncio import Onnxruntime, OpenJtalk, Synthesizer, UserDict, VoiceModel
+from ._rust.asyncio import Onnxruntime, OpenJtalk, Synthesizer, UserDict, VoiceModelFile
 
-__all__ = ["Onnxruntime", "OpenJtalk", "Synthesizer", "UserDict", "VoiceModel"]
+__all__ = ["Onnxruntime", "OpenJtalk", "Synthesizer", "UserDict", "VoiceModelFile"]
diff --git a/crates/voicevox_core_python_api/python/voicevox_core/blocking.py b/crates/voicevox_core_python_api/python/voicevox_core/blocking.py
index 7fed5fac7..01ea45029 100644
--- a/crates/voicevox_core_python_api/python/voicevox_core/blocking.py
+++ b/crates/voicevox_core_python_api/python/voicevox_core/blocking.py
@@ -1,4 +1,10 @@
 # pyright: reportMissingModuleSource=false
-from ._rust.blocking import Onnxruntime, OpenJtalk, Synthesizer, UserDict, VoiceModel
+from ._rust.blocking import (
+    Onnxruntime,
+    OpenJtalk,
+    Synthesizer,
+    UserDict,
+    VoiceModelFile,
+)
 
-__all__ = ["Onnxruntime", "OpenJtalk", "Synthesizer", "UserDict", "VoiceModel"]
+__all__ = ["Onnxruntime", "OpenJtalk", "Synthesizer", "UserDict", "VoiceModelFile"]
diff --git a/crates/voicevox_core_python_api/src/convert.rs b/crates/voicevox_core_python_api/src/convert.rs
index e57f2fb13..8152bc980 100644
--- a/crates/voicevox_core_python_api/src/convert.rs
+++ b/crates/voicevox_core_python_api/src/convert.rs
@@ -1,11 +1,11 @@
-use std::{error::Error as _, future::Future, iter, path::PathBuf};
+use std::{error::Error as _, future::Future, iter, panic, path::PathBuf};
 
 use camino::Utf8PathBuf;
 use easy_ext::ext;
 use pyo3::{
-    exceptions::{PyException, PyValueError},
-    types::PyList,
-    FromPyObject as _, PyAny, PyObject, PyResult, Python, ToPyObject,
+    exceptions::{PyException, PyRuntimeError, PyValueError},
+    types::{IntoPyDict as _, PyList},
+    FromPyObject as _, IntoPy, PyAny, PyObject, PyResult, Python, ToPyObject,
 };
 use serde::{de::DeserializeOwned, Serialize};
 use serde_json::json;
@@ -60,16 +60,17 @@ pub(crate) fn from_dataclass<T: DeserializeOwned>(ob: &PyAny) -> PyResult<T> {
 pub(crate) fn to_pydantic_voice_model_meta<'py>(
     metas: &VoiceModelMeta,
     py: Python<'py>,
-) -> PyResult<Vec<&'py PyAny>> {
+) -> PyResult<&'py PyList> {
     let class = py
         .import("voicevox_core")?
         .getattr("SpeakerMeta")?
         .downcast()?;
 
-    metas
+    let metas = metas
         .iter()
         .map(|m| to_pydantic_dataclass(m, class))
-        .collect::<PyResult<Vec<_>>>()
+        .collect::<PyResult<Vec<_>>>()?;
+    Ok(PyList::new(py, metas))
 }
 
 pub(crate) fn to_pydantic_dataclass(x: impl Serialize, class: &PyAny) -> PyResult<&PyAny> {
@@ -144,7 +145,6 @@ pub(crate) fn to_rust_uuid(ob: &PyAny) -> PyResult<Uuid> {
     let uuid = ob.getattr("hex")?.extract::<String>()?;
     uuid.parse::<Uuid>().into_py_value_result()
 }
-// FIXME: `to_object`は必要無いのでは?
 pub(crate) fn to_py_uuid(py: Python<'_>, uuid: Uuid) -> PyResult<PyObject> {
     let uuid = uuid.hyphenated().to_string();
     let uuid = py.import("uuid")?.call_method1("UUID", (uuid,))?;
@@ -176,6 +176,45 @@ pub(crate) fn to_rust_word_type(word_type: &PyAny) -> PyResult<UserDictWordType>
     serde_json::from_value::<UserDictWordType>(json!(name)).into_py_value_result()
 }
 
+/// Obtains an awaitable roughly equivalent to `f(x)` in the following code.
+///
+/// ```py
+/// async def f(x_):
+///     return x_
+///
+/// return f(x)
+/// ```
+pub(crate) fn ready(x: impl IntoPy<PyObject>, py: Python<'_>) -> PyResult<&PyAny> {
+    // ```py
+    // from asyncio import Future
+    //
+    // running_loop = asyncio.get_running_loop()
+    // fut = Future(loop=running_loop)
+    // fut.set_result(x)
+    // return fut
+    // ```
+
+    let asyncio_future = py.import("asyncio")?.getattr("Future")?;
+
+    let running_loop = pyo3_asyncio::get_running_loop(py)?;
+    let fut = asyncio_future.call((), Some([("loop", running_loop)].into_py_dict(py)))?;
+    fut.call_method1("set_result", (x,))?;
+    Ok(fut)
+}
+
+pub(crate) async fn run_in_executor<F, R>(f: F) -> PyResult<R>
+where
+    F: FnOnce() -> R + Send + 'static,
+    R: Send + 'static,
+{
+    tokio::task::spawn_blocking(f)
+        .await
+        .map_err(|e| match e.try_into_panic() {
+            Ok(p) => panic::resume_unwind(p),
+            Err(e) => PyRuntimeError::new_err(e.to_string()),
+        })
+}
+
 #[ext(VoicevoxCoreResultExt)]
 pub(crate) impl<T> voicevox_core::Result<T> {
     fn into_py_result(self, py: Python<'_>) -> PyResult<T> {
diff --git a/crates/voicevox_core_python_api/src/lib.rs b/crates/voicevox_core_python_api/src/lib.rs
index c09fafdc8..00b6e7102 100644
--- a/crates/voicevox_core_python_api/src/lib.rs
+++ b/crates/voicevox_core_python_api/src/lib.rs
@@ -1,16 +1,21 @@
-use std::marker::PhantomData;
+use std::{
+    marker::PhantomData,
+    mem,
+    ops::{Deref, DerefMut},
+};
 
 mod convert;
 use self::convert::{from_utf8_path, VoicevoxCoreResultExt as _};
 use easy_ext::ext;
-use log::debug;
+use log::{debug, warn};
 use pyo3::{
     create_exception,
     exceptions::{PyException, PyKeyError, PyValueError},
     pyfunction, pymodule,
-    types::PyModule,
-    wrap_pyfunction, PyResult, PyTypeInfo, Python,
+    types::{PyList, PyModule},
+    wrap_pyfunction, Py, PyObject, PyResult, PyTypeInfo, Python,
 };
+use voicevox_core::__internal::interop::raii::MaybeClosed;
 
 #[pymodule]
 #[pyo3(name = "_rust")]
@@ -27,7 +32,7 @@ fn rust(py: Python<'_>, module: &PyModule) -> PyResult<()> {
     blocking_module.add_class::<self::blocking::Synthesizer>()?;
     blocking_module.add_class::<self::blocking::Onnxruntime>()?;
     blocking_module.add_class::<self::blocking::OpenJtalk>()?;
-    blocking_module.add_class::<self::blocking::VoiceModel>()?;
+    blocking_module.add_class::<self::blocking::VoiceModelFile>()?;
     blocking_module.add_class::<self::blocking::UserDict>()?;
     module.add_and_register_submodule(blocking_module)?;
 
@@ -35,7 +40,7 @@ fn rust(py: Python<'_>, module: &PyModule) -> PyResult<()> {
     asyncio_module.add_class::<self::asyncio::Synthesizer>()?;
     asyncio_module.add_class::<self::asyncio::Onnxruntime>()?;
     asyncio_module.add_class::<self::asyncio::OpenJtalk>()?;
-    asyncio_module.add_class::<self::asyncio::VoiceModel>()?;
+    asyncio_module.add_class::<self::asyncio::VoiceModelFile>()?;
     asyncio_module.add_class::<self::asyncio::UserDict>()?;
     module.add_and_register_submodule(asyncio_module)
 }
@@ -88,48 +93,165 @@ exceptions! {
     InvalidWordError: PyValueError;
 }
 
-struct Closable<T, C: PyTypeInfo> {
-    content: MaybeClosed<T>,
-    marker: PhantomData<C>,
-}
-
-enum MaybeClosed<T> {
-    Open(T),
-    Closed,
+struct Closable<T, C: PyTypeInfo, A: Async> {
+    content: A::RwLock<MaybeClosed<T>>,
+    marker: PhantomData<(C, A)>,
 }
 
-impl<T, C: PyTypeInfo> Closable<T, C> {
+impl<T, C: PyTypeInfo, A: Async> Closable<T, C, A> {
     fn new(content: T) -> Self {
         Self {
-            content: MaybeClosed::Open(content),
+            content: MaybeClosed::Open(content).into(),
             marker: PhantomData,
         }
     }
 
-    fn get(&self) -> PyResult<&T> {
-        match &self.content {
+    fn read(&self) -> PyResult<impl Deref<Target = T> + '_> {
+        let lock = self
+            .content
+            .try_read_()
+            .map_err(|_| PyValueError::new_err(format!("The `{}` is being closed", C::NAME)))?;
+
+        voicevox_core::__internal::interop::raii::try_map_guard(lock, |lock| match &**lock {
             MaybeClosed::Open(content) => Ok(content),
             MaybeClosed::Closed => Err(PyValueError::new_err(format!(
                 "The `{}` is closed",
                 C::NAME,
             ))),
-        }
+        })
     }
 
-    fn close(&mut self) {
-        if matches!(self.content, MaybeClosed::Open(_)) {
+    async fn close_(&self) -> Option<T> {
+        let lock = &mut *match self.content.try_write_() {
+            Ok(lock) => lock,
+            Err(()) => {
+                warn!("The `{}` is still in use. Waiting before closing", C::NAME);
+                self.content.write_().await
+            }
+        };
+
+        if matches!(*lock, MaybeClosed::Open(_)) {
             debug!("Closing a {}", C::NAME);
         }
-        self.content = MaybeClosed::Closed;
+        match mem::replace(lock, MaybeClosed::Closed) {
+            MaybeClosed::Open(content) => Some(content),
+            MaybeClosed::Closed => None,
+        }
+    }
+}
+
+impl<T, C: PyTypeInfo> Closable<T, C, SingleTasked> {
+    #[must_use = "中身は明示的に`drop`でdropすること"]
+    fn close(&self) -> Option<T> {
+        futures_lite::future::block_on(self.close_())
+    }
+}
+
+impl<T, C: PyTypeInfo> Closable<T, C, Tokio> {
+    #[must_use = "中身は明示的に`drop`でdropすること"]
+    async fn close(&self) -> Option<T> {
+        self.close_().await
     }
 }
 
-impl<T, C: PyTypeInfo> Drop for Closable<T, C> {
+impl<T, C: PyTypeInfo, A: Async> Drop for Closable<T, C, A> {
     fn drop(&mut self) {
-        self.close();
+        let content = mem::replace(self.content.get_mut_(), MaybeClosed::Closed);
+        if matches!(content, MaybeClosed::Open(_)) {
+            warn!(
+                "デストラクタにより`{}`のクローズを行います。通常は、可能な限り`{}`でクローズする\
+                 ようにして下さい",
+                C::NAME,
+                A::EXIT_METHOD,
+            );
+            drop(content);
+        }
     }
 }
 
+trait Async { // Type-level switch between the blocking and the Tokio-backed `Closable`.
+    const EXIT_METHOD: &'static str; // Python method name quoted in the `Drop` warning.
+    type RwLock<T>: RwLock<Item = T>; // Lock type guarding the `MaybeClosed` content.
+}
+
+enum SingleTasked {} // Uninhabited marker: `std::sync::RwLock`, exit via `__exit__`.
+enum Tokio {} // Uninhabited marker: `tokio::sync::RwLock`, exit via `__aexit__`.
+
+impl Async for SingleTasked {
+    const EXIT_METHOD: &'static str = "__exit__";
+    type RwLock<T> = std::sync::RwLock<T>;
+}
+
+impl Async for Tokio {
+    const EXIT_METHOD: &'static str = "__aexit__";
+    type RwLock<T> = tokio::sync::RwLock<T>;
+}
+
+trait RwLock: From<Self::Item> {
+    type Item;
+    type RwLockWriteGuard<'a>: DerefMut<Target = Self::Item>
+    where
+        Self: 'a;
+    fn try_read_(&self) -> Result<impl Deref<Target = Self::Item>, ()>;
+    async fn write_(&self) -> Self::RwLockWriteGuard<'_>;
+    fn try_write_(&self) -> Result<Self::RwLockWriteGuard<'_>, ()>;
+    fn get_mut_(&mut self) -> &mut Self::Item;
+}
+
+impl<T> RwLock for std::sync::RwLock<T> {
+    type Item = T;
+    type RwLockWriteGuard<'a> = std::sync::RwLockWriteGuard<'a, Self::Item> where Self: 'a;
+
+    fn try_read_(&self) -> Result<impl Deref<Target = Self::Item>, ()> {
+        self.try_read().map_err(|e| match e {
+            std::sync::TryLockError::Poisoned(e) => panic!("{e}"),
+            std::sync::TryLockError::WouldBlock => (),
+        })
+    }
+
+    async fn write_(&self) -> Self::RwLockWriteGuard<'_> {
+        self.write().unwrap_or_else(|e| panic!("{e}"))
+    }
+
+    fn try_write_(&self) -> Result<Self::RwLockWriteGuard<'_>, ()> {
+        self.try_write().map_err(|e| match e {
+            std::sync::TryLockError::Poisoned(e) => panic!("{e}"),
+            std::sync::TryLockError::WouldBlock => (),
+        })
+    }
+
+    fn get_mut_(&mut self) -> &mut Self::Item {
+        self.get_mut().unwrap_or_else(|e| panic!("{e}"))
+    }
+}
+
+impl<T> RwLock for tokio::sync::RwLock<T> {
+    type Item = T;
+    type RwLockWriteGuard<'a> = tokio::sync::RwLockWriteGuard<'a, Self::Item> where Self: 'a;
+
+    fn try_read_(&self) -> Result<impl Deref<Target = Self::Item>, ()> {
+        self.try_read().map_err(|_| ())
+    }
+
+    async fn write_(&self) -> Self::RwLockWriteGuard<'_> {
+        self.write().await
+    }
+
+    fn try_write_(&self) -> Result<Self::RwLockWriteGuard<'_>, ()> {
+        self.try_write().map_err(|_| ())
+    }
+
+    fn get_mut_(&mut self) -> &mut Self::Item {
+        self.get_mut()
+    }
+}
+
+#[derive(Clone)]
+struct VoiceModelFilePyFields {
+    id: PyObject,      // `NewType("VoiceModelId", UUID)`
+    metas: Py<PyList>, // `list[SpeakerMeta]`
+}
+
 #[pyfunction]
 fn _validate_pronunciation(pronunciation: &str, py: Python<'_>) -> PyResult<()> {
     voicevox_core::__internal::validate_pronunciation(pronunciation).into_py_result(py)
@@ -155,33 +277,61 @@ mod blocking {
         UserDictWord,
     };
 
-    use crate::{convert::VoicevoxCoreResultExt as _, Closable};
+    use crate::{
+        convert::VoicevoxCoreResultExt as _, Closable, SingleTasked, VoiceModelFilePyFields,
+    };
 
     #[pyclass]
     #[derive(Clone)]
-    pub(crate) struct VoiceModel {
-        model: Arc<voicevox_core::blocking::VoiceModel>,
+    pub(crate) struct VoiceModelFile {
+        model: Arc<Closable<voicevox_core::blocking::VoiceModelFile, Self, SingleTasked>>,
+        fields: VoiceModelFilePyFields,
     }
 
     #[pymethods]
-    impl VoiceModel {
+    impl VoiceModelFile {
         #[staticmethod]
-        fn from_path(py: Python<'_>, path: PathBuf) -> PyResult<Self> {
-            let model = voicevox_core::blocking::VoiceModel::from_path(path)
-                .into_py_result(py)?
-                .into();
-            Ok(Self { model })
+        fn open(py: Python<'_>, path: PathBuf) -> PyResult<Self> {
+            let model = voicevox_core::blocking::VoiceModelFile::open(path).into_py_result(py)?;
+
+            let id = crate::convert::to_py_uuid(py, model.id().raw_voice_model_id())?;
+            let metas = crate::convert::to_pydantic_voice_model_meta(model.metas(), py)?.into();
+
+            let model = Closable::new(model).into();
+
+            Ok(Self {
+                model,
+                fields: VoiceModelFilePyFields { id, metas },
+            })
+        }
+
+        fn close(&self) {
+            let this = self.model.close();
+            drop(this);
         }
 
         #[getter]
-        fn id(&self, py: Python<'_>) -> PyResult<PyObject> {
-            let id = self.model.id().raw_voice_model_id();
-            crate::convert::to_py_uuid(py, id)
+        fn id(&self) -> PyObject {
+            self.fields.id.clone()
         }
 
         #[getter]
-        fn metas<'py>(&self, py: Python<'py>) -> Vec<&'py PyAny> {
-            crate::convert::to_pydantic_voice_model_meta(self.model.metas(), py).unwrap()
+        fn metas(&self) -> Py<PyList> {
+            self.fields.metas.clone()
+        }
+
+        fn __enter__(slf: PyRef<'_, Self>) -> PyResult<PyRef<'_, Self>> {
+            slf.model.read()?;
+            Ok(slf)
+        }
+
+        fn __exit__(
+            &self,
+            #[expect(unused_variables, reason = "`__exit__`としては必要")] exc_type: &PyAny,
+            #[expect(unused_variables, reason = "`__exit__`としては必要")] exc_value: &PyAny,
+            #[expect(unused_variables, reason = "`__exit__`としては必要")] traceback: &PyAny,
+        ) {
+            self.close();
         }
     }
 
@@ -279,6 +429,7 @@ mod blocking {
         synthesizer: Closable<
             voicevox_core::blocking::Synthesizer<voicevox_core::blocking::OpenJtalk>,
             Self,
+            SingleTasked,
         >,
     }
 
@@ -318,7 +469,7 @@ mod blocking {
         }
 
         fn __enter__(slf: PyRef<'_, Self>) -> PyResult<PyRef<'_, Self>> {
-            slf.synthesizer.get()?;
+            slf.synthesizer.read()?;
             Ok(slf)
         }
 
@@ -338,22 +489,21 @@ mod blocking {
 
         #[getter]
         fn is_gpu_mode(&self) -> PyResult<bool> {
-            let synthesizer = self.synthesizer.get()?;
+            let synthesizer = self.synthesizer.read()?;
             Ok(synthesizer.is_gpu_mode())
         }
 
         #[getter]
-        fn metas<'py>(&self, py: Python<'py>) -> PyResult<Vec<&'py PyAny>> {
-            let synthesizer = self.synthesizer.get()?;
+        fn metas<'py>(&self, py: Python<'py>) -> PyResult<&'py PyList> {
+            let synthesizer = self.synthesizer.read()?;
             crate::convert::to_pydantic_voice_model_meta(&synthesizer.metas(), py)
         }
 
         fn load_voice_model(&mut self, model: &PyAny, py: Python<'_>) -> PyResult<()> {
-            let model: VoiceModel = model.extract()?;
-            self.synthesizer
-                .get()?
-                .load_voice_model(&model.model)
-                .into_py_result(py)
+            let this = self.synthesizer.read()?;
+            let model = model.extract::<VoiceModelFile>()?;
+            let model = &model.model.read()?;
+            this.load_voice_model(model).into_py_result(py)
         }
 
         fn unload_voice_model(
@@ -362,7 +512,7 @@ mod blocking {
             py: Python<'_>,
         ) -> PyResult<()> {
             self.synthesizer
-                .get()?
+                .read()?
                 .unload_voice_model(voice_model_id.into())
                 .into_py_result(py)
         }
@@ -373,7 +523,7 @@ mod blocking {
         ) -> PyResult<bool> {
             Ok(self
                 .synthesizer
-                .get()?
+                .read()?
                 .is_loaded_voice_model(voice_model_id.into()))
         }
 
@@ -383,7 +533,7 @@ mod blocking {
             style_id: u32,
             py: Python<'py>,
         ) -> PyResult<&'py PyAny> {
-            let synthesizer = self.synthesizer.get()?;
+            let synthesizer = self.synthesizer.read()?;
 
             let audio_query = synthesizer
                 .audio_query_from_kana(kana, StyleId::new(style_id))
@@ -399,7 +549,7 @@ mod blocking {
             style_id: u32,
             py: Python<'py>,
         ) -> PyResult<&'py PyAny> {
-            let synthesizesr = self.synthesizer.get()?;
+            let synthesizesr = self.synthesizer.read()?;
 
             let audio_query = synthesizesr
                 .audio_query(text, StyleId::new(style_id))
@@ -415,7 +565,7 @@ mod blocking {
             style_id: u32,
             py: Python<'py>,
         ) -> PyResult<Vec<&'py PyAny>> {
-            let synthesizer = self.synthesizer.get()?;
+            let synthesizer = self.synthesizer.read()?;
 
             let accent_phrases = synthesizer
                 .create_accent_phrases_from_kana(kana, StyleId::new(style_id))
@@ -434,7 +584,7 @@ mod blocking {
             style_id: u32,
             py: Python<'py>,
         ) -> PyResult<Vec<&'py PyAny>> {
-            let synthesizer = self.synthesizer.get()?;
+            let synthesizer = self.synthesizer.read()?;
 
             let accent_phrases = synthesizer
                 .create_accent_phrases(text, StyleId::new(style_id))
@@ -453,7 +603,7 @@ mod blocking {
             style_id: u32,
             py: Python<'py>,
         ) -> PyResult<Vec<&'py PyAny>> {
-            let synthesizer = self.synthesizer.get()?;
+            let synthesizer = self.synthesizer.read()?;
             crate::convert::blocking_modify_accent_phrases(
                 accent_phrases,
                 StyleId::new(style_id),
@@ -468,7 +618,7 @@ mod blocking {
             style_id: u32,
             py: Python<'py>,
         ) -> PyResult<Vec<&'py PyAny>> {
-            let synthesizer = self.synthesizer.get()?;
+            let synthesizer = self.synthesizer.read()?;
             crate::convert::blocking_modify_accent_phrases(
                 accent_phrases,
                 StyleId::new(style_id),
@@ -483,7 +633,7 @@ mod blocking {
             style_id: u32,
             py: Python<'py>,
         ) -> PyResult<Vec<&'py PyAny>> {
-            let synthesizer = self.synthesizer.get()?;
+            let synthesizer = self.synthesizer.read()?;
             crate::convert::blocking_modify_accent_phrases(
                 accent_phrases,
                 StyleId::new(style_id),
@@ -506,7 +656,7 @@ mod blocking {
         ) -> PyResult<&'py PyBytes> {
             let wav = &self
                 .synthesizer
-                .get()?
+                .read()?
                 .synthesis(
                     &audio_query,
                     StyleId::new(style_id),
@@ -536,7 +686,7 @@ mod blocking {
             };
             let wav = &self
                 .synthesizer
-                .get()?
+                .read()?
                 .tts_from_kana(kana, style_id, options)
                 .into_py_result(py)?;
             Ok(PyBytes::new(py, wav))
@@ -560,14 +710,14 @@ mod blocking {
             };
             let wav = &self
                 .synthesizer
-                .get()?
+                .read()?
                 .tts(text, style_id, options)
                 .into_py_result(py)?;
             Ok(PyBytes::new(py, wav))
         }
 
         fn close(&mut self) {
-            self.synthesizer.close()
+            drop(self.synthesizer.close());
         }
     }
 
@@ -649,7 +799,7 @@ mod asyncio {
     use pyo3::{
         pyclass, pymethods,
         types::{IntoPyDict as _, PyBytes, PyDict, PyList},
-        Py, PyAny, PyObject, PyRef, PyResult, Python, ToPyObject as _,
+        Py, PyAny, PyErr, PyObject, PyRef, PyResult, Python, ToPyObject as _,
     };
     use uuid::Uuid;
     use voicevox_core::{
@@ -657,34 +807,73 @@ mod asyncio {
         UserDictWord,
     };
 
-    use crate::{convert::VoicevoxCoreResultExt as _, Closable};
+    use crate::{convert::VoicevoxCoreResultExt as _, Closable, Tokio, VoiceModelFilePyFields};
 
     #[pyclass]
     #[derive(Clone)]
-    pub(crate) struct VoiceModel {
-        model: Arc<voicevox_core::nonblocking::VoiceModel>,
+    pub(crate) struct VoiceModelFile {
+        model: Arc<Closable<voicevox_core::nonblocking::VoiceModelFile, Self, Tokio>>,
+        fields: VoiceModelFilePyFields,
     }
 
     #[pymethods]
-    impl VoiceModel {
+    impl VoiceModelFile {
         #[staticmethod]
-        fn from_path(py: Python<'_>, path: PathBuf) -> PyResult<&PyAny> {
+        fn open(py: Python<'_>, path: PathBuf) -> PyResult<&PyAny> {
             pyo3_asyncio::tokio::future_into_py(py, async move {
-                let model = voicevox_core::nonblocking::VoiceModel::from_path(path).await;
-                let model = Python::with_gil(|py| model.into_py_result(py))?.into();
-                Ok(Self { model })
+                let model = voicevox_core::nonblocking::VoiceModelFile::open(path).await;
+                let (model, id, metas) = Python::with_gil(|py| {
+                    let model = model.into_py_result(py)?; // reuse the GIL token already held
+                    let id = crate::convert::to_py_uuid(py, model.id().raw_voice_model_id())?;
+                    let metas =
+                        crate::convert::to_pydantic_voice_model_meta(model.metas(), py)?.into();
+                    Ok::<_, PyErr>((model, id, metas))
+                })?;
+
+                let model = Closable::new(model).into();
+
+                Ok(Self {
+                    model,
+                    fields: VoiceModelFilePyFields { id, metas },
+                })
+            })
+        }
+
+        fn close<'py>(&self, py: Python<'py>) -> PyResult<&'py PyAny> {
+            let this = self.model.clone();
+            pyo3_asyncio::tokio::future_into_py(py, async move {
+                if let Some(this) = this.close().await {
+                    this.close().await;
+                }
+                Ok(())
             })
         }
 
         #[getter]
-        fn id(&self, py: Python<'_>) -> PyResult<PyObject> {
-            let id = self.model.id().raw_voice_model_id();
-            crate::convert::to_py_uuid(py, id)
+        fn id(&self) -> PyObject {
+            self.fields.id.clone()
         }
 
         #[getter]
-        fn metas<'py>(&self, py: Python<'py>) -> Vec<&'py PyAny> {
-            crate::convert::to_pydantic_voice_model_meta(self.model.metas(), py).unwrap()
+        fn metas(&self) -> Py<PyList> {
+            self.fields.metas.clone()
+        }
+
+        fn __aenter__(slf: PyRef<'_, Self>) -> PyResult<&PyAny> {
+            slf.model.read()?;
+
+            let py = slf.py();
+            crate::convert::ready(slf, py)
+        }
+
+        fn __aexit__<'py>(
+            &self,
+            #[expect(unused_variables, reason = "`__aexit__`としては必要")] exc_type: &'py PyAny,
+            #[expect(unused_variables, reason = "`__aexit__`としては必要")] exc_value: &'py PyAny,
+            #[expect(unused_variables, reason = "`__aexit__`としては必要")] traceback: &'py PyAny,
+            py: Python<'py>,
+        ) -> PyResult<&'py PyAny> {
+            self.close(py)
         }
     }
 
@@ -791,9 +980,12 @@ mod asyncio {
 
     #[pyclass]
     pub(crate) struct Synthesizer {
-        synthesizer: Closable<
-            voicevox_core::nonblocking::Synthesizer<voicevox_core::nonblocking::OpenJtalk>,
-            Self,
+        synthesizer: Arc<
+            Closable<
+                voicevox_core::nonblocking::Synthesizer<voicevox_core::nonblocking::OpenJtalk>,
+                Self,
+                Tokio,
+            >,
         >,
     }
 
@@ -822,7 +1014,7 @@ mod asyncio {
                 },
             );
             let synthesizer = Python::with_gil(|py| synthesizer.into_py_result(py))?;
-            let synthesizer = Closable::new(synthesizer);
+            let synthesizer = Closable::new(synthesizer).into();
             Ok(Self { synthesizer })
         }
 
@@ -830,18 +1022,21 @@ mod asyncio {
             "Synthesizer { .. }"
         }
 
-        fn __enter__(slf: PyRef<'_, Self>) -> PyResult<PyRef<'_, Self>> {
-            slf.synthesizer.get()?;
-            Ok(slf)
+        fn __aenter__(slf: PyRef<'_, Self>) -> PyResult<&PyAny> {
+            slf.synthesizer.read()?;
+
+            let py = slf.py();
+            crate::convert::ready(slf, py)
         }
 
-        fn __exit__(
+        fn __aexit__<'py>(
             &mut self,
-            #[expect(unused_variables, reason = "`__exit__`としては必要")] exc_type: &PyAny,
-            #[expect(unused_variables, reason = "`__exit__`としては必要")] exc_value: &PyAny,
-            #[expect(unused_variables, reason = "`__exit__`としては必要")] traceback: &PyAny,
-        ) {
-            self.close();
+            #[expect(unused_variables, reason = "`__aexit__`としては必要")] exc_type: &'py PyAny,
+            #[expect(unused_variables, reason = "`__aexit__`としては必要")] exc_value: &'py PyAny,
+            #[expect(unused_variables, reason = "`__aexit__`としては必要")] traceback: &'py PyAny,
+            py: Python<'py>,
+        ) -> PyResult<&'py PyAny> {
+            self.close(py)
         }
 
         #[getter]
@@ -851,13 +1046,13 @@ mod asyncio {
 
         #[getter]
         fn is_gpu_mode(&self) -> PyResult<bool> {
-            let synthesizer = self.synthesizer.get()?;
+            let synthesizer = self.synthesizer.read()?;
             Ok(synthesizer.is_gpu_mode())
         }
 
         #[getter]
-        fn metas<'py>(&self, py: Python<'py>) -> PyResult<Vec<&'py PyAny>> {
-            let synthesizer = self.synthesizer.get()?;
+        fn metas<'py>(&self, py: Python<'py>) -> PyResult<&'py PyList> {
+            let synthesizer = self.synthesizer.read()?;
             crate::convert::to_pydantic_voice_model_meta(&synthesizer.metas(), py)
         }
 
@@ -866,10 +1061,10 @@ mod asyncio {
             model: &'py PyAny,
             py: Python<'py>,
         ) -> PyResult<&'py PyAny> {
-            let model: VoiceModel = model.extract()?;
-            let synthesizer = self.synthesizer.get()?.clone();
+            let model: VoiceModelFile = model.extract()?;
+            let synthesizer = self.synthesizer.read()?.clone();
             pyo3_asyncio::tokio::future_into_py(py, async move {
-                let result = synthesizer.load_voice_model(&model.model).await;
+                let result = synthesizer.load_voice_model(&*model.model.read()?).await;
                 Python::with_gil(|py| result.into_py_result(py))
             })
         }
@@ -880,7 +1075,7 @@ mod asyncio {
             py: Python<'_>,
         ) -> PyResult<()> {
             self.synthesizer
-                .get()?
+                .read()?
                 .unload_voice_model(voice_model_id.into())
                 .into_py_result(py)
         }
@@ -891,7 +1086,7 @@ mod asyncio {
         ) -> PyResult<bool> {
             Ok(self
                 .synthesizer
-                .get()?
+                .read()?
                 .is_loaded_voice_model(voice_model_id.into()))
         }
 
@@ -901,7 +1096,7 @@ mod asyncio {
             style_id: u32,
             py: Python<'py>,
         ) -> PyResult<&'py PyAny> {
-            let synthesizer = self.synthesizer.get()?.clone();
+            let synthesizer = self.synthesizer.read()?.clone();
             let kana = kana.to_owned();
             pyo3_asyncio::tokio::future_into_py_with_locals(
                 py,
@@ -929,7 +1124,7 @@ mod asyncio {
             style_id: u32,
             py: Python<'py>,
         ) -> PyResult<&'py PyAny> {
-            let synthesizer = self.synthesizer.get()?.clone();
+            let synthesizer = self.synthesizer.read()?.clone();
             let text = text.to_owned();
             pyo3_asyncio::tokio::future_into_py_with_locals(
                 py,
@@ -953,7 +1148,7 @@ mod asyncio {
             style_id: u32,
             py: Python<'py>,
         ) -> PyResult<&'py PyAny> {
-            let synthesizer = self.synthesizer.get()?.clone();
+            let synthesizer = self.synthesizer.read()?.clone();
             let kana = kana.to_owned();
             pyo3_asyncio::tokio::future_into_py_with_locals(
                 py,
@@ -982,7 +1177,7 @@ mod asyncio {
             style_id: u32,
             py: Python<'py>,
         ) -> PyResult<&'py PyAny> {
-            let synthesizer = self.synthesizer.get()?.clone();
+            let synthesizer = self.synthesizer.read()?.clone();
             let text = text.to_owned();
             pyo3_asyncio::tokio::future_into_py_with_locals(
                 py,
@@ -1011,7 +1206,7 @@ mod asyncio {
             style_id: u32,
             py: Python<'py>,
         ) -> PyResult<&'py PyAny> {
-            let synthesizer = self.synthesizer.get()?.clone();
+            let synthesizer = self.synthesizer.read()?.clone();
             crate::convert::async_modify_accent_phrases(
                 accent_phrases,
                 StyleId::new(style_id),
@@ -1026,7 +1221,7 @@ mod asyncio {
             style_id: u32,
             py: Python<'py>,
         ) -> PyResult<&'py PyAny> {
-            let synthesizer = self.synthesizer.get()?.clone();
+            let synthesizer = self.synthesizer.read()?.clone();
             crate::convert::async_modify_accent_phrases(
                 accent_phrases,
                 StyleId::new(style_id),
@@ -1041,7 +1236,7 @@ mod asyncio {
             style_id: u32,
             py: Python<'py>,
         ) -> PyResult<&'py PyAny> {
-            let synthesizer = self.synthesizer.get()?.clone();
+            let synthesizer = self.synthesizer.read()?.clone();
             crate::convert::async_modify_accent_phrases(
                 accent_phrases,
                 StyleId::new(style_id),
@@ -1058,7 +1253,7 @@ mod asyncio {
             enable_interrogative_upspeak: bool,
             py: Python<'py>,
         ) -> PyResult<&'py PyAny> {
-            let synthesizer = self.synthesizer.get()?.clone();
+            let synthesizer = self.synthesizer.read()?.clone();
             pyo3_asyncio::tokio::future_into_py_with_locals(
                 py,
                 pyo3_asyncio::tokio::get_current_locals(py)?,
@@ -1096,7 +1291,7 @@ mod asyncio {
             let options = TtsOptions {
                 enable_interrogative_upspeak,
             };
-            let synthesizer = self.synthesizer.get()?.clone();
+            let synthesizer = self.synthesizer.read()?.clone();
             let kana = kana.to_owned();
             pyo3_asyncio::tokio::future_into_py_with_locals(
                 py,
@@ -1128,7 +1323,7 @@ mod asyncio {
             let options = TtsOptions {
                 enable_interrogative_upspeak,
             };
-            let synthesizer = self.synthesizer.get()?.clone();
+            let synthesizer = self.synthesizer.read()?.clone();
             let text = text.to_owned();
             pyo3_asyncio::tokio::future_into_py_with_locals(
                 py,
@@ -1144,8 +1339,14 @@ mod asyncio {
             )
         }
 
-        fn close(&mut self) {
-            self.synthesizer.close()
+        fn close<'py>(&self, py: Python<'py>) -> PyResult<&'py PyAny> {
+            let this = self.synthesizer.clone();
+            pyo3_asyncio::tokio::future_into_py(py, async move {
+                if let Some(this) = this.close().await {
+                    crate::convert::run_in_executor(|| drop(this)).await?;
+                }
+                Ok(())
+            })
         }
     }
 
diff --git a/docs/usage.md b/docs/usage.md
index 067250126..26ed50810 100644
--- a/docs/usage.md
+++ b/docs/usage.md
@@ -62,15 +62,15 @@ VOICEVOX コアでは`Synthesizer`に音声モデルを読み込むことでテ
 
 ```python
 from pprint import pprint
-from voicevox_core.blocking import Onnxruntime, OpenJtalk, Synthesizer, VoiceModel
+from voicevox_core.blocking import Onnxruntime, OpenJtalk, Synthesizer, VoiceModelFile
 
 # 1. Synthesizerの初期化
 open_jtalk_dict_dir = "open_jtalk_dic_utf_8-1.11"
 synthesizer = Synthesizer(Onnxruntime.load_once(), OpenJtalk(open_jtalk_dict_dir))
 
 # 2. 音声モデルの読み込み
-model = VoiceModel.from_path("model/0.vvm")
-synthesizer.load_voice_model(model)
+with VoiceModelFile.open("model/0.vvm") as model:
+    synthesizer.load_voice_model(model)
 
 # 3. テキスト音声合成
 text = "サンプル音声です"
@@ -86,11 +86,11 @@ AIエンジンの`Onnxruntime`のインスタンスと、辞書などを取り
 
 ### 2. 音声モデルの読み込み
 
-VVM ファイルから`VoiceModel`インスタンスを作成し、`Synthesizer`に読み込ませます。その VVM ファイルにどの声が含まれているかは`VoiceModel`の`.metas`や[音声モデルと声の対応表](https://github.com/VOICEVOX/voicevox_fat_resource/blob/main/core/model/README.md#%E9%9F%B3%E5%A3%B0%E3%83%A2%E3%83%87%E3%83%ABvvm%E3%83%95%E3%82%A1%E3%82%A4%E3%83%AB%E3%81%A8%E5%A3%B0%E3%82%AD%E3%83%A3%E3%83%A9%E3%82%AF%E3%82%BF%E3%83%BC%E3%82%B9%E3%82%BF%E3%82%A4%E3%83%AB%E5%90%8D%E3%81%A8%E3%82%B9%E3%82%BF%E3%82%A4%E3%83%AB-id-%E3%81%AE%E5%AF%BE%E5%BF%9C%E8%A1%A8)で確認できます。
+VVM ファイルから`VoiceModelFile`インスタンスを作成し、`Synthesizer`に読み込ませます。その VVM ファイルにどの声が含まれているかは`VoiceModelFile`の`.metas`や[音声モデルと声の対応表](https://github.com/VOICEVOX/voicevox_fat_resource/blob/main/core/model/README.md#%E9%9F%B3%E5%A3%B0%E3%83%A2%E3%83%87%E3%83%ABvvm%E3%83%95%E3%82%A1%E3%82%A4%E3%83%AB%E3%81%A8%E5%A3%B0%E3%82%AD%E3%83%A3%E3%83%A9%E3%82%AF%E3%82%BF%E3%83%BC%E3%82%B9%E3%82%BF%E3%82%A4%E3%83%AB%E5%90%8D%E3%81%A8%E3%82%B9%E3%82%BF%E3%82%A4%E3%83%AB-id-%E3%81%AE%E5%AF%BE%E5%BF%9C%E8%A1%A8)で確認できます。
 
 ```python
-model = VoiceModel.from_path("model/0.vvm")
-pprint(model.metas)
+with VoiceModelFile.open("model/0.vvm") as model:
+    pprint(model.metas)
 ```
 
 ```txt
diff --git a/example/cpp/unix/simple_tts.cpp b/example/cpp/unix/simple_tts.cpp
index 5db24b12e..210df1549 100644
--- a/example/cpp/unix/simple_tts.cpp
+++ b/example/cpp/unix/simple_tts.cpp
@@ -47,8 +47,8 @@ int main(int argc, char *argv[]) {
     if (path.extension() != ".vvm") {
       continue;
     }
-    VoicevoxVoiceModel* model;
-    result = voicevox_voice_model_new_from_path(path.c_str(), &model);
+    VoicevoxVoiceModelFile* model;
+    result = voicevox_voice_model_file_open(path.c_str(), &model);
     if (result != VoicevoxResultCode::VOICEVOX_RESULT_OK) {
       std::cerr << voicevox_error_result_to_message(result) << std::endl;
       return 0;
@@ -58,7 +58,7 @@ int main(int argc, char *argv[]) {
       std::cerr << voicevox_error_result_to_message(result) << std::endl;
       return 0;
     }
-    voicevox_voice_model_delete(model);
+    voicevox_voice_model_file_close(model);
   }
 
   std::cout << "音声生成中..." << std::endl;
diff --git a/example/cpp/windows/simple_tts/simple_tts.cpp b/example/cpp/windows/simple_tts/simple_tts.cpp
index 946ef9679..2bdc947c6 100644
--- a/example/cpp/windows/simple_tts/simple_tts.cpp
+++ b/example/cpp/windows/simple_tts/simple_tts.cpp
@@ -59,9 +59,8 @@ int main() {
     if (path.extension() != ".vvm") {
       continue;
     }
-    VoicevoxVoiceModel* model;
-    result = voicevox_voice_model_new_from_path(path.generic_u8string().c_str(),
-                                                &model);
+    VoicevoxVoiceModelFile* model;
+    result = voicevox_voice_model_file_open(path.generic_u8string().c_str(), &model);
     if (result != VoicevoxResultCode::VOICEVOX_RESULT_OK) {
       OutErrorMessage(result);
       return 0;
@@ -71,7 +70,7 @@ int main() {
       OutErrorMessage(result);
       return 0;
     }
-    voicevox_voice_model_delete(model);
+    voicevox_voice_model_file_close(model);
   }
 
   std::wcout << L"音声生成中" << std::endl;
diff --git a/example/kotlin/app/src/main/kotlin/app/App.kt b/example/kotlin/app/src/main/kotlin/app/App.kt
index 7f2651020..0b8d05e33 100644
--- a/example/kotlin/app/src/main/kotlin/app/App.kt
+++ b/example/kotlin/app/src/main/kotlin/app/App.kt
@@ -47,7 +47,7 @@ fun main(args: Array<String>) {
           .build()
 
   println("Loading: ${vvmPath}")
-  val vvm = VoiceModel(vvmPath)
+  val vvm = VoiceModelFile(vvmPath)
   synthesizer.loadVoiceModel(vvm)
 
   println("Creating an AudioQuery from the text: ${text}")
diff --git a/example/python/run-asyncio.py b/example/python/run-asyncio.py
index b75509183..176ac290f 100644
--- a/example/python/run-asyncio.py
+++ b/example/python/run-asyncio.py
@@ -9,7 +9,7 @@
 from typing import Tuple
 
 from voicevox_core import AccelerationMode, AudioQuery
-from voicevox_core.asyncio import Onnxruntime, OpenJtalk, Synthesizer, VoiceModel
+from voicevox_core.asyncio import Onnxruntime, OpenJtalk, Synthesizer, VoiceModelFile
 
 
 async def main() -> None:
@@ -45,8 +45,8 @@ async def main() -> None:
     logger.debug("%s", f"{synthesizer.is_gpu_mode=}")
 
     logger.info("%s", f"Loading `{vvm_path}`")
-    model = await VoiceModel.from_path(vvm_path)
-    await synthesizer.load_voice_model(model)
+    async with await VoiceModelFile.open(vvm_path) as model:
+        await synthesizer.load_voice_model(model)
 
     logger.info("%s", f"Creating an AudioQuery from {text!r}")
     audio_query = await synthesizer.audio_query(text, style_id)
diff --git a/example/python/run.py b/example/python/run.py
index 3a9fdd9e7..5f11a1a62 100644
--- a/example/python/run.py
+++ b/example/python/run.py
@@ -6,7 +6,7 @@
 from typing import Tuple
 
 from voicevox_core import AccelerationMode, AudioQuery
-from voicevox_core.blocking import Onnxruntime, OpenJtalk, Synthesizer, VoiceModel
+from voicevox_core.blocking import Onnxruntime, OpenJtalk, Synthesizer, VoiceModelFile
 
 
 def main() -> None:
@@ -42,8 +42,8 @@ def main() -> None:
     logger.debug("%s", f"{synthesizer.is_gpu_mode=}")
 
     logger.info("%s", f"Loading `{vvm_path}`")
-    model = VoiceModel.from_path(vvm_path)
-    synthesizer.load_voice_model(model)
+    with VoiceModelFile.open(vvm_path) as model:
+        synthesizer.load_voice_model(model)
 
     logger.info("%s", f"Creating an AudioQuery from {text!r}")
     audio_query = synthesizer.audio_query(text, style_id)

From c7c8cf1da79040f0fb16fe5df90122b3b275b52f Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Fri, 20 Sep 2024 07:02:22 +0900
Subject: [PATCH 30/36] chore: minor refactor (#833)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

単体でPRを作るほどではない細かいリファクタを行う。
---
 crates/voicevox_core/Cargo.toml               |  3 --
 .../src/engine/acoustic_feature_extractor.rs  | 12 ++----
 crates/voicevox_core/src/engine/open_jtalk.rs | 37 +++++++++----------
 crates/voicevox_core/src/infer/domains.rs     |  4 --
 crates/voicevox_core/src/synthesizer.rs       |  5 ++-
 crates/voicevox_core/src/voice_model.rs       | 22 +----------
 crates/voicevox_core_c_api/build.rs           |  3 +-
 crates/voicevox_core_c_api/src/lib.rs         | 22 ++++-------
 .../tests/e2e/snapshots.toml                  |  5 +--
 .../tests/e2e/testcases/user_dict_load.rs     |  2 +-
 crates/voicevox_core_java_api/src/logger.rs   |  5 +--
 .../python/test/test_nop.py                   |  8 ----
 .../python/voicevox_core/_load_dlls.py        |  3 +-
 13 files changed, 42 insertions(+), 89 deletions(-)
 delete mode 100644 crates/voicevox_core_python_api/python/test/test_nop.py

diff --git a/crates/voicevox_core/Cargo.toml b/crates/voicevox_core/Cargo.toml
index ba508ba44..d5fb28321 100644
--- a/crates/voicevox_core/Cargo.toml
+++ b/crates/voicevox_core/Cargo.toml
@@ -67,8 +67,5 @@ humansize.workspace = true
 windows = { workspace = true, features = ["Win32_Foundation", "Win32_Graphics_Dxgi"] }
 
 [lints.rust]
-# FIXME: `unsafe impl Send`のもあるが、以下2つのマージにより消える予定
-# * https://github.com/VOICEVOX/voicevox_core/pull/725
-# * https://github.com/VOICEVOX/voicevox_core/pull/772
 unsafe_code = "allow" # WindowsのGPU情報表示に、Win32を利用
 rust_2018_idioms = "warn"
diff --git a/crates/voicevox_core/src/engine/acoustic_feature_extractor.rs b/crates/voicevox_core/src/engine/acoustic_feature_extractor.rs
index ca2da4697..02b66f903 100644
--- a/crates/voicevox_core/src/engine/acoustic_feature_extractor.rs
+++ b/crates/voicevox_core/src/engine/acoustic_feature_extractor.rs
@@ -63,9 +63,6 @@ static PHONEME_MAP: LazyLock<HashMap<&str, i64>> = LazyLock::new(|| {
 #[derive(Debug, Clone, PartialEq, new, Default, Getters)]
 pub(crate) struct OjtPhoneme {
     phoneme: String,
-    // FIXME: derive-getters(多分)が警告を覆い隠しているが、以下の二つは使っていないはず
-    start: f32,
-    end: f32,
 }
 
 impl OjtPhoneme {
@@ -113,8 +110,8 @@ mod tests {
     fn base_hello_hiho() -> Vec<OjtPhoneme> {
         STR_HELLO_HIHO
             .split_whitespace()
-            .enumerate()
-            .map(|(i, s)| OjtPhoneme::new(s.into(), i as f32, (i + 1) as f32))
+            .map(ToOwned::to_owned)
+            .map(OjtPhoneme::new)
             .collect()
     }
 
@@ -154,9 +151,8 @@ mod tests {
     }
 
     #[rstest]
-    #[case(ojt_hello_hiho(), 9, OjtPhoneme::new("a".into(), 9., 10.), true)]
-    #[case(ojt_hello_hiho(), 9, OjtPhoneme::new("k".into(), 9., 10.), false)]
-    #[case(ojt_hello_hiho(), 9, OjtPhoneme::new("a".into(), 10., 11.), false)]
+    #[case(ojt_hello_hiho(), 9, OjtPhoneme::new("a".into()), true)]
+    #[case(ojt_hello_hiho(), 9, OjtPhoneme::new("k".into()), false)]
     fn test_ojt_phoneme_equality(
         #[case] ojt_phonemes: Vec<OjtPhoneme>,
         #[case] index: usize,
diff --git a/crates/voicevox_core/src/engine/open_jtalk.rs b/crates/voicevox_core/src/engine/open_jtalk.rs
index f27e9b0a6..3cad9c99a 100644
--- a/crates/voicevox_core/src/engine/open_jtalk.rs
+++ b/crates/voicevox_core/src/engine/open_jtalk.rs
@@ -48,26 +48,23 @@ pub(crate) mod blocking {
         pub fn new(open_jtalk_dict_dir: impl AsRef<Utf8Path>) -> crate::result::Result<Self> {
             let dict_dir = open_jtalk_dict_dir.as_ref().to_owned();
 
-            // FIXME: この`{}`はGitのdiffを抑えるためだけに存在
-            {
-                let mut resources = Resources {
-                    mecab: ManagedResource::initialize(),
-                    njd: ManagedResource::initialize(),
-                    jpcommon: ManagedResource::initialize(),
-                };
-
-                // FIXME: 「システム辞書を読もうとしたけど読めなかった」というエラーをちゃんと用意する
-                resources
-                    .mecab
-                    .load(&*dict_dir)
-                    .inspect_err(|e| tracing::error!("{e:?}"))
-                    .map_err(|_| ErrorRepr::NotLoadedOpenjtalkDict)?;
-
-                Ok(Self(Arc::new(Inner {
-                    resources: Mutex::new(resources),
-                    dict_dir,
-                })))
-            }
+            let mut resources = Resources {
+                mecab: ManagedResource::initialize(),
+                njd: ManagedResource::initialize(),
+                jpcommon: ManagedResource::initialize(),
+            };
+
+            // FIXME: 「システム辞書を読もうとしたけど読めなかった」というエラーをちゃんと用意する
+            resources
+                .mecab
+                .load(&*dict_dir)
+                .inspect_err(|e| tracing::error!("{e:?}"))
+                .map_err(|_| ErrorRepr::NotLoadedOpenjtalkDict)?;
+
+            Ok(Self(Arc::new(Inner {
+                resources: Mutex::new(resources),
+                dict_dir,
+            })))
         }
 
         /// ユーザー辞書を設定する。
diff --git a/crates/voicevox_core/src/infer/domains.rs b/crates/voicevox_core/src/infer/domains.rs
index 5225f2ec3..72e1e0886 100644
--- a/crates/voicevox_core/src/infer/domains.rs
+++ b/crates/voicevox_core/src/infer/domains.rs
@@ -63,7 +63,3 @@ pub(crate) trait InferenceDomainMapValues {
 impl<T> InferenceDomainMapValues for (T,) {
     type Talk = T;
 }
-
-impl<A> InferenceDomainMapValues for [A] {
-    type Talk = A;
-}
diff --git a/crates/voicevox_core/src/synthesizer.rs b/crates/voicevox_core/src/synthesizer.rs
index 045a2d9ea..ee960cd1a 100644
--- a/crates/voicevox_core/src/synthesizer.rs
+++ b/crates/voicevox_core/src/synthesizer.rs
@@ -1079,8 +1079,9 @@ pub(crate) mod blocking {
             OjtPhoneme::convert(
                 phoneme_str_list
                     .iter()
-                    .enumerate()
-                    .map(|(i, s)| OjtPhoneme::new(s.as_ref().to_string(), i as f32, i as f32 + 1.))
+                    .map(AsRef::as_ref)
+                    .map(ToOwned::to_owned)
+                    .map(OjtPhoneme::new)
                     .collect::<Vec<OjtPhoneme>>()
                     .as_slice(),
             )
diff --git a/crates/voicevox_core/src/voice_model.rs b/crates/voicevox_core/src/voice_model.rs
index cf2c0f078..ef105fae6 100644
--- a/crates/voicevox_core/src/voice_model.rs
+++ b/crates/voicevox_core/src/voice_model.rs
@@ -509,7 +509,7 @@ pub(crate) mod nonblocking {
 
 #[cfg(test)]
 mod tests {
-    use rstest::{fixture, rstest};
+    use rstest::rstest;
     use serde_json::json;
 
     use crate::{
@@ -556,26 +556,6 @@ mod tests {
         assert_eq!(expected, actual);
     }
 
-    // FIXME: これ使ってないのでは？
-    #[fixture]
-    fn talk_speaker() -> SpeakerMeta {
-        serde_json::from_value(json!({
-            "name": "dummy",
-            "styles": [
-                {
-                    "id": 0,
-                    "name": "style1",
-                    "type": "talk",
-                    "order": 0
-                }
-            ],
-            "version": "0.0.1",
-            "speaker_uuid": "574bc678-8370-44be-b941-08e46e7b47d7",
-            "order": 0
-        }))
-        .unwrap()
-    }
-
     fn speaker(style_types: &'static [StyleType]) -> SpeakerMeta {
         let styles = style_types
             .iter()
diff --git a/crates/voicevox_core_c_api/build.rs b/crates/voicevox_core_c_api/build.rs
index 6b0934882..28eb7c04c 100644
--- a/crates/voicevox_core_c_api/build.rs
+++ b/crates/voicevox_core_c_api/build.rs
@@ -1,4 +1,5 @@
-// TODO: voicevox_onnxruntimeになったらやめる
+// TODO: #802 の時点でiOS以外不要になっているはずなので、このbuild.rsは丸ごと消す
+// (iOSのためにbuild_util/make_ios_xcframework.bashの修正は必要)
 fn main() {
     #[cfg(target_os = "linux")]
     println!("cargo:rustc-link-arg=-Wl,-rpath,$ORIGIN");
diff --git a/crates/voicevox_core_c_api/src/lib.rs b/crates/voicevox_core_c_api/src/lib.rs
index 63f344553..a5c440146 100644
--- a/crates/voicevox_core_c_api/src/lib.rs
+++ b/crates/voicevox_core_c_api/src/lib.rs
@@ -59,8 +59,7 @@ fn init_logger_once() {
                 && anstyle_query::windows::enable_ansi_colors().unwrap_or(true)
         };
 
-        // FIXME: `try_init` → `init` （subscriberは他に存在しないはずなので）
-        let _ = tracing_subscriber::fmt()
+        tracing_subscriber::fmt()
             .with_env_filter(if env::var_os(EnvFilter::DEFAULT_ENV).is_some() {
                 EnvFilter::from_default_env()
             } else {
@@ -69,7 +68,7 @@ fn init_logger_once() {
             .with_timer(local_time as fn(&mut Writer<'_>) -> _)
             .with_ansi(ansi)
             .with_writer(out)
-            .try_init();
+            .init();
     });
 
     fn local_time(wtr: &mut Writer<'_>) -> fmt::Result {
@@ -83,13 +82,6 @@ fn init_logger_once() {
     }
 }
 
-/*
- * Cの関数として公開するための型や関数を定義するこれらの実装はvoicevox_core/publish.rsに定義してある対応する関数にある
- * この関数ではvoicevox_core/publish.rsにある対応する関数の呼び出しと、その戻り値をCの形式に変換する処理のみとする
- * これはC文脈の処理と実装をわけるためと、内部実装の変更がAPIに影響を与えにくくするためである
- * voicevox_core/publish.rsにある対応する関数とはこのファイルに定義してある公開関数からvoicevoxプレフィックスを取り除いた名前の関数である
- */
-
 // TODO: https://github.com/mozilla/cbindgen/issues/927
 //#[cfg(feature = "load-onnxruntime")]
 //pub const VOICEVOX_ONNXRUNTIME_LIB_NAME: &CStr = ..;
@@ -392,10 +384,12 @@ pub extern "C" fn voicevox_get_version() -> *const c_char {
     init_logger_once();
     return C_STRING_DROP_CHECKER.blacklist(VERSION).as_ptr();
 
-    // FIXME: 実行時チェックにすることでこの`unsafe`は削れるはず
-    const VERSION: &CStr = unsafe {
-        // SAFETY: The package version is a SemVer, so it should not contain '\0'
-        CStr::from_bytes_with_nul_unchecked(concat!(env!("CARGO_PKG_VERSION"), '\0').as_bytes())
+    const VERSION: &CStr = if let Ok(version) =
+        CStr::from_bytes_with_nul(concat!(env!("CARGO_PKG_VERSION"), '\0').as_bytes())
+    {
+        version
+    } else {
+        panic!("`$CARGO_PKG_VERSION` should be a SemVer, so it should not contain `\\0`");
     };
 }
 
diff --git a/crates/voicevox_core_c_api/tests/e2e/snapshots.toml b/crates/voicevox_core_c_api/tests/e2e/snapshots.toml
index 17ccd61f8..eb5911c7e 100644
--- a/crates/voicevox_core_c_api/tests/e2e/snapshots.toml
+++ b/crates/voicevox_core_c_api/tests/e2e/snapshots.toml
@@ -88,7 +88,7 @@ result_messages.22 = "ユーザー辞書に単語が見つかりませんでし
 result_messages.23 = "OpenJTalkのユーザー辞書の設定に失敗しました"
 result_messages.24 = "ユーザー辞書の単語のバリデーションに失敗しました"
 result_messages.25 = "UUIDの変換に失敗しました"
-# FIXME: 26, 27, 28が抜けている
+result_messages.28 = "モデルの形式が不正です"
 result_messages.29 = "推論ライブラリのロードまたは初期化ができませんでした"
 stderr = '''
 {timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
@@ -180,8 +180,7 @@ stderr.unix = '''
 {timestamp}  INFO voicevox_core::synthesizer::blocking: CPUを利用します
 '''
 
-# FIXME: "user_dict_load"のはず
-[user_dict]
+[user_dict_load]
 stderr.windows = '''
 {timestamp}  INFO ort: Loaded ONNX Runtime dylib with version '{onnxruntime_version}'
 {windows-video-cards}
diff --git a/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_load.rs b/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_load.rs
index d044962ae..620610ed9 100644
--- a/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_load.rs
+++ b/crates/voicevox_core_c_api/tests/e2e/testcases/user_dict_load.rs
@@ -144,7 +144,7 @@ impl assert_cdylib::TestCase for TestCase {
     }
 }
 
-static SNAPSHOTS: LazyLock<Snapshots> = snapshots::section!(user_dict);
+static SNAPSHOTS: LazyLock<Snapshots> = snapshots::section!(user_dict_load);
 
 #[derive(Deserialize)]
 struct Snapshots {
diff --git a/crates/voicevox_core_java_api/src/logger.rs b/crates/voicevox_core_java_api/src/logger.rs
index 30545725e..d7feb6d65 100644
--- a/crates/voicevox_core_java_api/src/logger.rs
+++ b/crates/voicevox_core_java_api/src/logger.rs
@@ -25,8 +25,7 @@ extern "system" fn Java_jp_hiroshiba_voicevoxcore_Dll_00024LoggerInitializer_ini
         };
         use tracing_subscriber::{fmt::format::Writer, EnvFilter};
 
-        // FIXME: `try_init` → `init` （subscriberは他に存在しないはずなので）
-        let _ = tracing_subscriber::fmt()
+        tracing_subscriber::fmt()
             .with_env_filter(if env::var_os(EnvFilter::DEFAULT_ENV).is_some() {
                 EnvFilter::from_default_env()
             } else {
@@ -36,7 +35,7 @@ extern "system" fn Java_jp_hiroshiba_voicevoxcore_Dll_00024LoggerInitializer_ini
             .with_timer(local_time as fn(&mut Writer<'_>) -> _)
             .with_ansi(out().is_terminal() && env_allows_ansi())
             .with_writer(out)
-            .try_init();
+            .init();
 
         fn local_time(wtr: &mut Writer<'_>) -> fmt::Result {
             // ローカル時刻で表示はするが、そのフォーマットはtracing-subscriber本来のものに近いようにする。
diff --git a/crates/voicevox_core_python_api/python/test/test_nop.py b/crates/voicevox_core_python_api/python/test/test_nop.py
deleted file mode 100644
index 43956957d..000000000
--- a/crates/voicevox_core_python_api/python/test/test_nop.py
+++ /dev/null
@@ -1,8 +0,0 @@
-# FIXME: ちゃんとしたテストを用意する
-
-import conftest  # noqa: F401
-import voicevox_core  # noqa: F401
-
-
-def test_nop() -> None:
-    pass
diff --git a/crates/voicevox_core_python_api/python/voicevox_core/_load_dlls.py b/crates/voicevox_core_python_api/python/voicevox_core/_load_dlls.py
index 0f9e3d034..2b90b9988 100644
--- a/crates/voicevox_core_python_api/python/voicevox_core/_load_dlls.py
+++ b/crates/voicevox_core_python_api/python/voicevox_core/_load_dlls.py
@@ -1,4 +1,5 @@
-# TODO: voicevox_onnxruntimeになったらやめる
+# TODO: ここは #803 の時点でさほど必要性が無くなっているはずなので、(ドキュメントでの案内
+# はした上で)やめる
 import glob
 import platform
 from ctypes import CDLL

From 9fdb347824ee9266b8128d3cb20334188dcf672b Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Tue, 24 Sep 2024 16:52:53 +0900
Subject: [PATCH 31/36] =?UTF-8?q?#830=20=E3=81=AE=E8=A8=AD=E8=A8=88?=
 =?UTF-8?q?=E3=82=92`UserDict`=E3=81=AB=E3=82=82=20(#834)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

`UserDict`に対して以下の二つを行う。

1. #830 のように`Inner<A: Async>`で共通化する設計にする
2. async-fsを導入することでasync APIとしての質を向上させる
---
 crates/voicevox_core/Cargo.toml            |   2 +-
 crates/voicevox_core/src/asyncs.rs         |  20 ++
 crates/voicevox_core/src/user_dict/dict.rs | 204 +++++++++++++--------
 3 files changed, 153 insertions(+), 73 deletions(-)

diff --git a/crates/voicevox_core/Cargo.toml b/crates/voicevox_core/Cargo.toml
index d5fb28321..8390e1de3 100644
--- a/crates/voicevox_core/Cargo.toml
+++ b/crates/voicevox_core/Cargo.toml
@@ -16,7 +16,7 @@ link-onnxruntime = []
 
 [dependencies]
 anyhow.workspace = true
-async-fs.workspace = true # 今これを使っている箇所はどこにも無いが、`UserDict`にはこれを使った方がよいはず
+async-fs.workspace = true
 async-lock.workspace = true
 async_zip = { workspace = true, features = ["deflate"] }
 blocking.workspace = true
diff --git a/crates/voicevox_core/src/asyncs.rs b/crates/voicevox_core/src/asyncs.rs
index d89aa7d4b..24fdd82b4 100644
--- a/crates/voicevox_core/src/asyncs.rs
+++ b/crates/voicevox_core/src/asyncs.rs
@@ -34,6 +34,10 @@ pub(crate) trait Async: 'static {
     /// `io::Error`は素（`i32`相当）のままにしておき、この関数を呼び出す側でfs-err風のメッセージを付
     /// ける。
     async fn open_file_ro(path: impl AsRef<Path>) -> io::Result<Self::RoFile>;
+
+    async fn read(path: impl AsRef<Path>) -> io::Result<Vec<u8>>;
+
+    async fn write(path: impl AsRef<Path>, content: impl AsRef<[u8]>) -> io::Result<()>;
 }
 
 pub(crate) trait Mutex<T>: From<T> + Send + Sync + Unpin {
@@ -59,6 +63,14 @@ impl Async for SingleTasked {
     async fn open_file_ro(path: impl AsRef<Path>) -> io::Result<Self::RoFile> {
         std::fs::File::open(path).map(StdFile)
     }
+
+    async fn read(path: impl AsRef<Path>) -> io::Result<Vec<u8>> {
+        std::fs::read(path)
+    }
+
+    async fn write(path: impl AsRef<Path>, content: impl AsRef<[u8]>) -> io::Result<()> {
+        std::fs::write(path, content)
+    }
 }
 
 pub(crate) struct StdMutex<T>(std::sync::Mutex<T>);
@@ -111,6 +123,14 @@ impl Async for BlockingThreadPool {
     async fn open_file_ro(path: impl AsRef<Path>) -> io::Result<Self::RoFile> {
         AsyncRoFile::open(path).await
     }
+
+    async fn read(path: impl AsRef<Path>) -> io::Result<Vec<u8>> {
+        async_fs::read(path).await
+    }
+
+    async fn write(path: impl AsRef<Path>, content: impl AsRef<[u8]>) -> io::Result<()> {
+        async_fs::write(path, content).await
+    }
 }
 
 impl<T: Send + Sync + Unpin> Mutex<T> for async_lock::Mutex<T> {
diff --git a/crates/voicevox_core/src/user_dict/dict.rs b/crates/voicevox_core/src/user_dict/dict.rs
index 0e1c89ca2..2f851b138 100644
--- a/crates/voicevox_core/src/user_dict/dict.rs
+++ b/crates/voicevox_core/src/user_dict/dict.rs
@@ -1,33 +1,128 @@
-// TODO: `VoiceModelFile`のように、次のような設計にする。
-//
-// ```
-// pub(crate) mod blocking {
-//     pub struct UserDict(Inner<SingleTasked>);
-//     // …
-// }
-// pub(crate) mod nonblocking {
-//     pub struct UserDict(Inner<BlockingThreadPool>);
-//     // …
-// }
-// ```
+use std::{marker::PhantomData, path::Path};
+
+use anyhow::Context as _;
+use easy_ext::ext;
+use educe::Educe;
+use indexmap::IndexMap;
+use itertools::Itertools as _;
+use uuid::Uuid;
+
+use crate::{asyncs::Async, error::ErrorRepr};
+
+use super::UserDictWord;
+
+#[derive(Educe)]
+#[educe(Default(bound = "A:"))]
+#[educe(Debug(bound = "A:"))]
+struct Inner<A> {
+    words: std::sync::Mutex<IndexMap<Uuid, UserDictWord>>,
+    _marker: PhantomData<A>,
+}
+
+impl<A: Async> Inner<A> {
+    fn to_json(&self) -> String {
+        self.with_words(|words| serde_json::to_string(words).expect("should not fail"))
+    }
+
+    fn with_words<F, R>(&self, f: F) -> R
+    where
+        F: FnOnce(&mut IndexMap<Uuid, UserDictWord>) -> R,
+    {
+        f(&mut self.words.lock().unwrap_or_else(|e| panic!("{e}")))
+    }
+
+    async fn load(&self, store_path: &str) -> crate::Result<()> {
+        let words = async {
+            let words = &A::fs_err_read(store_path).await?;
+            let words = serde_json::from_slice::<IndexMap<_, _>>(words)?;
+            Ok(words)
+        }
+        .await
+        .map_err(ErrorRepr::LoadUserDict)?;
+
+        self.with_words(|words_| words_.extend(words));
+        Ok(())
+    }
+
+    fn add_word(&self, word: UserDictWord) -> crate::Result<Uuid> {
+        let word_uuid = Uuid::new_v4();
+        self.with_words(|word_| word_.insert(word_uuid, word));
+        Ok(word_uuid)
+    }
+
+    fn update_word(&self, word_uuid: Uuid, new_word: UserDictWord) -> crate::Result<()> {
+        self.with_words(|words| {
+            if !words.contains_key(&word_uuid) {
+                return Err(ErrorRepr::WordNotFound(word_uuid).into());
+            }
+            words.insert(word_uuid, new_word);
+            Ok(())
+        })
+    }
+
+    fn remove_word(&self, word_uuid: Uuid) -> crate::Result<UserDictWord> {
+        let Some(word) = self.with_words(|words| words.remove(&word_uuid)) else {
+            return Err(ErrorRepr::WordNotFound(word_uuid).into());
+        };
+        Ok(word)
+    }
+
+    fn import(&self, other: &Self) -> crate::Result<()> {
+        // Snapshot `other` before locking `self`: holding both locks at once
+        // deadlocks on `dict.import(&dict)` and on concurrent cross-imports.
+        let other_words = other.with_words(|words| words.clone());
+        self.with_words(|self_words| {
+            // Same result as per-entry `insert`: existing keys are overwritten.
+            self_words.extend(other_words);
+        });
+        Ok(())
+    }
+
+    async fn save(&self, store_path: &str) -> crate::Result<()> {
+        A::fs_err_write(
+            store_path,
+            serde_json::to_vec(&self.words).expect("should not fail"),
+        )
+        .await
+        .map_err(ErrorRepr::SaveUserDict)
+        .map_err(Into::into)
+    }
+
+    fn to_mecab_format(&self) -> String {
+        self.with_words(|words| words.values().map(UserDictWord::to_mecab_format).join("\n"))
+    }
+}
+
+#[ext]
+impl<A: Async> A {
+    async fn fs_err_read(path: impl AsRef<Path>) -> anyhow::Result<Vec<u8>> {
+        Self::read(&path)
+            .await
+            .with_context(|| format!("failed to read from file `{}`", path.as_ref().display()))
+    }
+
+    async fn fs_err_write(path: impl AsRef<Path>, content: impl AsRef<[u8]>) -> anyhow::Result<()> {
+        Self::write(&path, content)
+            .await
+            .with_context(|| format!("failed to write to file `{}`", path.as_ref().display()))
+    }
+}
 
 pub(crate) mod blocking {
     use indexmap::IndexMap;
-    use itertools::join;
     use uuid::Uuid;
 
-    use crate::{error::ErrorRepr, Result};
+    use crate::{asyncs::SingleTasked, future::FutureExt as _, Result};
 
-    use super::super::word::UserDictWord;
+    use super::{super::word::UserDictWord, Inner};
 
     /// ユーザー辞書。
     ///
     /// 単語はJSONとの相互変換のために挿入された順序を保つ。
     #[derive(Debug, Default)]
-    pub struct UserDict {
-        words: std::sync::Mutex<IndexMap<Uuid, UserDictWord>>,
-    }
+    pub struct UserDict(Inner<SingleTasked>);
 
+    // TODO: 引数の`path`は全部`AsRef<Path>`にする
     impl self::UserDict {
         /// ユーザー辞書を作成する。
         pub fn new() -> Self {
@@ -35,11 +130,12 @@ pub(crate) mod blocking {
         }
 
         pub fn to_json(&self) -> String {
-            serde_json::to_string(&*self.words.lock().unwrap()).expect("should not fail")
+            self.0.to_json()
         }
 
+        // TODO: `&mut IndexMap<_>`を取れるようにする
         pub fn with_words<R>(&self, f: impl FnOnce(&IndexMap<Uuid, UserDictWord>) -> R) -> R {
-            f(&self.words.lock().unwrap())
+            self.0.with_words(|words| f(words))
         }
 
         /// ユーザー辞書をファイルから読み込む。
@@ -48,82 +144,48 @@ pub(crate) mod blocking {
         ///
         /// ファイルが読めなかった、または内容が不正だった場合はエラーを返す。
         pub fn load(&self, store_path: &str) -> Result<()> {
-            let words = (|| {
-                let words = &fs_err::read(store_path)?;
-                let words = serde_json::from_slice::<IndexMap<_, _>>(words)?;
-                Ok(words)
-            })()
-            .map_err(ErrorRepr::LoadUserDict)?;
-
-            self.words.lock().unwrap().extend(words);
-            Ok(())
+            self.0.load(store_path).block_on()
         }
 
         /// ユーザー辞書に単語を追加する。
         pub fn add_word(&self, word: UserDictWord) -> Result<Uuid> {
-            let word_uuid = Uuid::new_v4();
-            self.words.lock().unwrap().insert(word_uuid, word);
-            Ok(word_uuid)
+            self.0.add_word(word)
         }
 
         /// ユーザー辞書の単語を変更する。
         pub fn update_word(&self, word_uuid: Uuid, new_word: UserDictWord) -> Result<()> {
-            let mut words = self.words.lock().unwrap();
-            if !words.contains_key(&word_uuid) {
-                return Err(ErrorRepr::WordNotFound(word_uuid).into());
-            }
-            words.insert(word_uuid, new_word);
-            Ok(())
+            self.0.update_word(word_uuid, new_word)
         }
 
         /// ユーザー辞書から単語を削除する。
         pub fn remove_word(&self, word_uuid: Uuid) -> Result<UserDictWord> {
-            let Some(word) = self.words.lock().unwrap().remove(&word_uuid) else {
-                return Err(ErrorRepr::WordNotFound(word_uuid).into());
-            };
-            Ok(word)
+            self.0.remove_word(word_uuid)
         }
 
         /// 他のユーザー辞書をインポートする。
         pub fn import(&self, other: &Self) -> Result<()> {
-            for (word_uuid, word) in &*other.words.lock().unwrap() {
-                self.words.lock().unwrap().insert(*word_uuid, word.clone());
-            }
-            Ok(())
+            self.0.import(&other.0)
         }
 
         /// ユーザー辞書を保存する。
         pub fn save(&self, store_path: &str) -> Result<()> {
-            fs_err::write(
-                store_path,
-                serde_json::to_vec(&self.words).expect("should not fail"),
-            )
-            .map_err(|e| ErrorRepr::SaveUserDict(e.into()).into())
+            self.0.save(store_path).block_on()
         }
 
         /// MeCabで使用する形式に変換する。
         pub(crate) fn to_mecab_format(&self) -> String {
-            join(
-                self.words
-                    .lock()
-                    .unwrap()
-                    .values()
-                    .map(UserDictWord::to_mecab_format),
-                "\n",
-            )
+            self.0.to_mecab_format()
         }
     }
 }
 
 pub(crate) mod nonblocking {
-    use std::sync::Arc;
-
     use indexmap::IndexMap;
     use uuid::Uuid;
 
-    use crate::Result;
+    use crate::{asyncs::BlockingThreadPool, Result};
 
-    use super::super::word::UserDictWord;
+    use super::{super::word::UserDictWord, Inner};
 
     /// ユーザー辞書。
     ///
@@ -136,20 +198,22 @@ pub(crate) mod nonblocking {
     /// [blocking]: https://docs.rs/crate/blocking
     /// [`nonblocking`モジュールのドキュメント]: crate::nonblocking
     #[derive(Debug, Default)]
-    pub struct UserDict(Arc<super::blocking::UserDict>);
+    pub struct UserDict(Inner<BlockingThreadPool>);
 
+    // TODO: 引数の`path`は全部`AsRef<Path>`にする
     impl self::UserDict {
         /// ユーザー辞書を作成する。
         pub fn new() -> Self {
-            Self(super::blocking::UserDict::new().into())
+            Default::default()
         }
 
         pub fn to_json(&self) -> String {
             self.0.to_json()
         }
 
+        // TODO: `&mut IndexMap<_>`を取れるようにする
         pub fn with_words<R>(&self, f: impl FnOnce(&IndexMap<Uuid, UserDictWord>) -> R) -> R {
-            self.0.with_words(f)
+            self.0.with_words(|words| f(words))
         }
 
         /// ユーザー辞書をファイルから読み込む。
@@ -158,9 +222,7 @@ pub(crate) mod nonblocking {
         ///
         /// ファイルが読めなかった、または内容が不正だった場合はエラーを返す。
         pub async fn load(&self, store_path: &str) -> Result<()> {
-            let blocking = self.0.clone();
-            let store_path = store_path.to_owned();
-            crate::task::asyncify(move || blocking.load(&store_path)).await
+            self.0.load(store_path).await
         }
 
         /// ユーザー辞書に単語を追加する。
@@ -185,9 +247,7 @@ pub(crate) mod nonblocking {
 
         /// ユーザー辞書を保存する。
         pub async fn save(&self, store_path: &str) -> Result<()> {
-            let blocking = self.0.clone();
-            let store_path = store_path.to_owned();
-            crate::task::asyncify(move || blocking.save(&store_path)).await
+            self.0.save(store_path).await
         }
 
         /// MeCabで使用する形式に変換する。

From 8d603d9b70372c3eaad56d2f9bdf6bcbd78935d1 Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Tue, 24 Sep 2024 22:36:30 +0900
Subject: [PATCH 32/36] change: minor changes for `UserDict` API (#835)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

`UserDict`のパブリックAPIについて以下の変更を加える。

1. `load`と`save`が引数に取るファイルパスについて:
    * Rust APIでは`&str`から`impl AsRef<Path>`にする
    * Python APIでは`StrPath`相当にする
    * Java APIでは`java.io.File`と`java.nio.file.Path`のオーバーロードを
        追加する
2. Rust APIの`with_words`から`&mut IndexMap<…>`が得られるようにする

`dict`や`java.util.HashMap`へ変換するAPIの改良はfuture workとする。
---
 crates/voicevox_core/src/user_dict/dict.rs    | 28 ++++++-------
 .../jp/hiroshiba/voicevoxcore/UserDict.java   | 42 +++++++++++++++++++
 .../voicevox_core_java_api/src/user_dict.rs   |  4 +-
 .../python/voicevox_core/_rust/asyncio.pyi    |  4 +-
 .../python/voicevox_core/_rust/blocking.pyi   |  4 +-
 .../voicevox_core_python_api/src/convert.rs   |  1 -
 crates/voicevox_core_python_api/src/lib.rs    | 10 ++---
 7 files changed, 66 insertions(+), 27 deletions(-)

diff --git a/crates/voicevox_core/src/user_dict/dict.rs b/crates/voicevox_core/src/user_dict/dict.rs
index 2f851b138..e3bb640c9 100644
--- a/crates/voicevox_core/src/user_dict/dict.rs
+++ b/crates/voicevox_core/src/user_dict/dict.rs
@@ -31,7 +31,7 @@ impl<A: Async> Inner<A> {
         f(&mut self.words.lock().unwrap_or_else(|e| panic!("{e}")))
     }
 
-    async fn load(&self, store_path: &str) -> crate::Result<()> {
+    async fn load(&self, store_path: impl AsRef<Path>) -> crate::Result<()> {
         let words = async {
             let words = &A::fs_err_read(store_path).await?;
             let words = serde_json::from_slice::<IndexMap<_, _>>(words)?;
@@ -78,7 +78,7 @@ impl<A: Async> Inner<A> {
         })
     }
 
-    async fn save(&self, store_path: &str) -> crate::Result<()> {
+    async fn save(&self, store_path: impl AsRef<Path>) -> crate::Result<()> {
         A::fs_err_write(
             store_path,
             serde_json::to_vec(&self.words).expect("should not fail"),
@@ -109,6 +109,8 @@ impl<A: Async> A {
 }
 
 pub(crate) mod blocking {
+    use std::path::Path;
+
     use indexmap::IndexMap;
     use uuid::Uuid;
 
@@ -122,7 +124,6 @@ pub(crate) mod blocking {
     #[derive(Debug, Default)]
     pub struct UserDict(Inner<SingleTasked>);
 
-    // TODO: 引数の`path`は全部`AsRef<Path>`にする
     impl self::UserDict {
         /// ユーザー辞書を作成する。
         pub fn new() -> Self {
@@ -133,9 +134,8 @@ pub(crate) mod blocking {
             self.0.to_json()
         }
 
-        // TODO: `&mut IndexMap<_>`を取れるようにする
-        pub fn with_words<R>(&self, f: impl FnOnce(&IndexMap<Uuid, UserDictWord>) -> R) -> R {
-            self.0.with_words(|words| f(words))
+        pub fn with_words<R>(&self, f: impl FnOnce(&mut IndexMap<Uuid, UserDictWord>) -> R) -> R {
+            self.0.with_words(f)
         }
 
         /// ユーザー辞書をファイルから読み込む。
@@ -143,7 +143,7 @@ pub(crate) mod blocking {
         /// # Errors
         ///
         /// ファイルが読めなかった、または内容が不正だった場合はエラーを返す。
-        pub fn load(&self, store_path: &str) -> Result<()> {
+        pub fn load(&self, store_path: impl AsRef<Path>) -> Result<()> {
             self.0.load(store_path).block_on()
         }
 
@@ -168,7 +168,7 @@ pub(crate) mod blocking {
         }
 
         /// ユーザー辞書を保存する。
-        pub fn save(&self, store_path: &str) -> Result<()> {
+        pub fn save(&self, store_path: impl AsRef<Path>) -> Result<()> {
             self.0.save(store_path).block_on()
         }
 
@@ -180,6 +180,8 @@ pub(crate) mod blocking {
 }
 
 pub(crate) mod nonblocking {
+    use std::path::Path;
+
     use indexmap::IndexMap;
     use uuid::Uuid;
 
@@ -200,7 +202,6 @@ pub(crate) mod nonblocking {
     #[derive(Debug, Default)]
     pub struct UserDict(Inner<BlockingThreadPool>);
 
-    // TODO: 引数の`path`は全部`AsRef<Path>`にする
     impl self::UserDict {
         /// ユーザー辞書を作成する。
         pub fn new() -> Self {
@@ -211,9 +212,8 @@ pub(crate) mod nonblocking {
             self.0.to_json()
         }
 
-        // TODO: `&mut IndexMap<_>`を取れるようにする
-        pub fn with_words<R>(&self, f: impl FnOnce(&IndexMap<Uuid, UserDictWord>) -> R) -> R {
-            self.0.with_words(|words| f(words))
+        pub fn with_words<R>(&self, f: impl FnOnce(&mut IndexMap<Uuid, UserDictWord>) -> R) -> R {
+            self.0.with_words(f)
         }
 
         /// ユーザー辞書をファイルから読み込む。
@@ -221,7 +221,7 @@ pub(crate) mod nonblocking {
         /// # Errors
         ///
         /// ファイルが読めなかった、または内容が不正だった場合はエラーを返す。
-        pub async fn load(&self, store_path: &str) -> Result<()> {
+        pub async fn load(&self, store_path: impl AsRef<Path>) -> Result<()> {
             self.0.load(store_path).await
         }
 
@@ -246,7 +246,7 @@ pub(crate) mod nonblocking {
         }
 
         /// ユーザー辞書を保存する。
-        pub async fn save(&self, store_path: &str) -> Result<()> {
+        pub async fn save(&self, store_path: impl AsRef<Path>) -> Result<()> {
             self.0.save(store_path).await
         }
 
diff --git a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/UserDict.java b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/UserDict.java
index 21f6843dd..7135365ff 100644
--- a/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/UserDict.java
+++ b/crates/voicevox_core_java_api/lib/src/main/java/jp/hiroshiba/voicevoxcore/UserDict.java
@@ -7,6 +7,8 @@
 import jakarta.annotation.Nonnull;
 import jakarta.validation.constraints.Max;
 import jakarta.validation.constraints.Min;
+import java.io.File;
+import java.nio.file.Path;
 import java.util.HashMap;
 import jp.hiroshiba.voicevoxcore.exceptions.LoadUserDictException;
 import jp.hiroshiba.voicevoxcore.exceptions.SaveUserDictException;
@@ -70,6 +72,26 @@ public void importDict(UserDict dict) {
     rsImportDict(dict);
   }
 
+  /**
+   * ユーザー辞書を読み込む。
+   *
+   * @param path ユーザー辞書のパス。
+   * @throws LoadUserDictException ユーザー辞書を読み込めなかった場合。
+   */
+  public void load(Path path) throws LoadUserDictException {
+    load(path.toString());
+  }
+
+  /**
+   * ユーザー辞書を読み込む。
+   *
+   * @param path ユーザー辞書のパス。
+   * @throws LoadUserDictException ユーザー辞書を読み込めなかった場合。
+   */
+  public void load(File path) throws LoadUserDictException {
+    load(path.toString());
+  }
+
   /**
    * ユーザー辞書を読み込む。
    *
@@ -80,6 +102,26 @@ public void load(String path) throws LoadUserDictException {
     rsLoad(path);
   }
 
+  /**
+   * ユーザー辞書を保存する。
+   *
+   * @param path ユーザー辞書のパス。
+   * @throws SaveUserDictException ユーザー辞書を保存できなかった場合。
+   */
+  public void save(Path path) throws SaveUserDictException {
+    rsSave(path.toString());
+  }
+
+  /**
+   * ユーザー辞書を保存する。
+   *
+   * @param path ユーザー辞書のパス。
+   * @throws SaveUserDictException ユーザー辞書を保存できなかった場合。
+   */
+  public void save(File path) throws SaveUserDictException {
+    rsSave(path.toString());
+  }
+
   /**
    * ユーザー辞書を保存する。
    *
diff --git a/crates/voicevox_core_java_api/src/user_dict.rs b/crates/voicevox_core_java_api/src/user_dict.rs
index df8b8270b..ceee1f42e 100644
--- a/crates/voicevox_core_java_api/src/user_dict.rs
+++ b/crates/voicevox_core_java_api/src/user_dict.rs
@@ -124,7 +124,7 @@ unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_UserDict_rsLoad<'local>
             .clone();
 
         let path = env.get_string(&path)?;
-        let path = &Cow::from(&path);
+        let path = &*Cow::from(&path);
 
         internal.load(path)?;
 
@@ -144,7 +144,7 @@ unsafe extern "system" fn Java_jp_hiroshiba_voicevoxcore_UserDict_rsSave<'local>
             .clone();
 
         let path = env.get_string(&path)?;
-        let path = &Cow::from(&path);
+        let path = &*Cow::from(&path);
 
         internal.save(path)?;
 
diff --git a/crates/voicevox_core_python_api/python/voicevox_core/_rust/asyncio.pyi b/crates/voicevox_core_python_api/python/voicevox_core/_rust/asyncio.pyi
index b386d2d5a..d6359e038 100644
--- a/crates/voicevox_core_python_api/python/voicevox_core/_rust/asyncio.pyi
+++ b/crates/voicevox_core_python_api/python/voicevox_core/_rust/asyncio.pyi
@@ -431,7 +431,7 @@ class UserDict:
         """このオプジェクトの :class:`dict` としての表現。"""
         ...
     def __init__(self) -> None: ...
-    async def load(self, path: str) -> None:
+    async def load(self, path: Union[str, PathLike[str]]) -> None:
         """ファイルに保存されたユーザー辞書を読み込む。
 
         Parameters
@@ -440,7 +440,7 @@ class UserDict:
             ユーザー辞書のパス。
         """
         ...
-    async def save(self, path: str) -> None:
+    async def save(self, path: Union[str, PathLike[str]]) -> None:
         """
         ユーザー辞書をファイルに保存する。
 
diff --git a/crates/voicevox_core_python_api/python/voicevox_core/_rust/blocking.pyi b/crates/voicevox_core_python_api/python/voicevox_core/_rust/blocking.pyi
index 891ceb05e..cf4f1f5c6 100644
--- a/crates/voicevox_core_python_api/python/voicevox_core/_rust/blocking.pyi
+++ b/crates/voicevox_core_python_api/python/voicevox_core/_rust/blocking.pyi
@@ -426,7 +426,7 @@ class UserDict:
         """このオプジェクトの :class:`dict` としての表現。"""
         ...
     def __init__(self) -> None: ...
-    def load(self, path: str) -> None:
+    def load(self, path: Union[str, PathLike[str]]) -> None:
         """ファイルに保存されたユーザー辞書を読み込む。
 
         Parameters
@@ -435,7 +435,7 @@ class UserDict:
             ユーザー辞書のパス。
         """
         ...
-    def save(self, path: str) -> None:
+    def save(self, path: Union[str, PathLike[str]]) -> None:
         """
         ユーザー辞書をファイルに保存する。
 
diff --git a/crates/voicevox_core_python_api/src/convert.rs b/crates/voicevox_core_python_api/src/convert.rs
index 8152bc980..d4a867606 100644
--- a/crates/voicevox_core_python_api/src/convert.rs
+++ b/crates/voicevox_core_python_api/src/convert.rs
@@ -37,7 +37,6 @@ pub(crate) fn from_acceleration_mode(ob: &PyAny) -> PyResult<AccelerationMode> {
     }
 }
 
-// FIXME: `UserDict`についてはこれではなく、`PathBuf::extract`を直接使うようにする
 pub(crate) fn from_utf8_path(ob: &PyAny) -> PyResult<Utf8PathBuf> {
     PathBuf::extract(ob)?
         .into_os_string()
diff --git a/crates/voicevox_core_python_api/src/lib.rs b/crates/voicevox_core_python_api/src/lib.rs
index 00b6e7102..24d28261d 100644
--- a/crates/voicevox_core_python_api/src/lib.rs
+++ b/crates/voicevox_core_python_api/src/lib.rs
@@ -734,11 +734,11 @@ mod blocking {
             Self::default()
         }
 
-        fn load(&self, path: &str, py: Python<'_>) -> PyResult<()> {
+        fn load(&self, path: PathBuf, py: Python<'_>) -> PyResult<()> {
             self.dict.load(path).into_py_result(py)
         }
 
-        fn save(&self, path: &str, py: Python<'_>) -> PyResult<()> {
+        fn save(&self, path: PathBuf, py: Python<'_>) -> PyResult<()> {
             self.dict.save(path).into_py_result(py)
         }
 
@@ -1363,9 +1363,8 @@ mod asyncio {
             Self::default()
         }
 
-        fn load<'py>(&self, path: &str, py: Python<'py>) -> PyResult<&'py PyAny> {
+        fn load<'py>(&self, path: PathBuf, py: Python<'py>) -> PyResult<&'py PyAny> {
             let this = self.dict.clone();
-            let path = path.to_owned();
 
             pyo3_asyncio::tokio::future_into_py(py, async move {
                 let result = this.load(&path).await;
@@ -1373,9 +1372,8 @@ mod asyncio {
             })
         }
 
-        fn save<'py>(&self, path: &str, py: Python<'py>) -> PyResult<&'py PyAny> {
+        fn save<'py>(&self, path: PathBuf, py: Python<'py>) -> PyResult<&'py PyAny> {
             let this = self.dict.clone();
-            let path = path.to_owned();
 
             pyo3_asyncio::tokio::future_into_py(py, async move {
                 let result = this.save(&path).await;

From bcd23b8c139ec60d57a81746cd8b3fd848b85553 Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Fri, 27 Sep 2024 03:46:50 +0900
Subject: [PATCH 33/36] =?UTF-8?q?chore:=20voicevox.github.io/voicevox=5Fco?=
 =?UTF-8?q?re/apis=E5=86=85=E3=81=AE=E3=83=AA=E3=83=B3=E3=82=AF=E3=82=92?=
 =?UTF-8?q?=E7=BD=AE=E3=81=8D=E6=8F=9B=E3=81=88=20(#837)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

voicevox.github.io/voicevox_core/apisのC APIとPython APIのリンク先が不親
切なことになっているので、置き換える。
---
 docs/apis/index.html | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/docs/apis/index.html b/docs/apis/index.html
index d1f5d09b2..78493fa11 100644
--- a/docs/apis/index.html
+++ b/docs/apis/index.html
@@ -7,8 +7,8 @@
     <!-- TODO: まともなページを用意する -->
     <ul>
       <li><a href="./rust_api/voicevox_core">Rust API</a></li>
-      <li><a href="./c_api">C API</a></li>
-      <li><a href="./python_api">Python API</a></li>
+      <li><a href="./c_api/voicevox__core_8h.html">C API</a></li>
+      <li><a href="./python_api/autoapi/voicevox_core/index.html">Python API</a></li>
       <li><a href="./java_api">Java API</a></li>
     </ul>
   </body>

From f75ce9d7f4481f0a3ede05e5030b970ac3d2b7f1 Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Fri, 27 Sep 2024 04:19:07 +0900
Subject: [PATCH 34/36] =?UTF-8?q?chore:=20README=E3=81=8B=E3=82=89voicevox?=
 =?UTF-8?q?.github.io/voicevox=5Fcore/apis=E3=81=AB=E3=83=AA=E3=83=B3?=
 =?UTF-8?q?=E3=82=AF=20(#838)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

#269 の頃からあるリンクの宛先をvoicevox.github.io/voicevox_core/apis直下
にする。

今後 #496 の話が絡んでくるかもしれない。
---
 README.md            | 2 +-
 docs/apis/index.html | 3 ++-
 2 files changed, 3 insertions(+), 2 deletions(-)

diff --git a/README.md b/README.md
index 4812c1297..4496dd491 100644
--- a/README.md
+++ b/README.md
@@ -16,7 +16,7 @@
 
 ## API
 
-[API ドキュメント](https://voicevox.github.io/voicevox_core/apis/c_api/globals_func.html)をご覧ください。
+[API ドキュメント](https://voicevox.github.io/voicevox_core/apis/)をご覧ください。
 
 ## ユーザーガイド
 
diff --git a/docs/apis/index.html b/docs/apis/index.html
index 78493fa11..efae64b13 100644
--- a/docs/apis/index.html
+++ b/docs/apis/index.html
@@ -4,7 +4,8 @@
     <meta charset="utf-8" />
   </head>
   <body>
-    <!-- TODO: まともなページを用意する -->
+    <p>TODO: まともなページを用意する</p>
+    <p><a href="https://github.com/VOICEVOX/voicevox_core/pull/496">VOICEVOX/voicevox_core#496</a></p>
     <ul>
       <li><a href="./rust_api/voicevox_core">Rust API</a></li>
       <li><a href="./c_api/voicevox__core_8h.html">C API</a></li>

From 521cd54c1aa30aadf974f1510ad68f6f7923eb69 Mon Sep 17 00:00:00 2001
From: Ryo Yamashita <qryxip@gmail.com>
Date: Sun, 29 Sep 2024 15:51:21 +0900
Subject: [PATCH 35/36] =?UTF-8?q?chore:=20=E3=81=99=E3=81=B9=E3=81=A6?=
 =?UTF-8?q?=E3=81=AE=E4=BE=9D=E5=AD=98=E3=82=92Renovate=E3=81=AE=E5=AF=BE?=
 =?UTF-8?q?=E8=B1=A1=E3=81=AB=E3=81=99=E3=82=8B=20(#839)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

次の2つの"group"にまとめる形で、あらゆる依存をRenovateの自動PRの対象にす
る。

* "major dependencies" (`renovate/major-dependencies`)
* "non-major dependencies" (`renovate/non-major-dependencies`)

0.y.zのy（ただしy≧1）、0.0.zのzの変更は"major dependencies"側に分類す
る。Rustのバージョンは"non-major"側。

運用としては二つのPRを**普段は保持し続け、更新可能ライブラリを把握する目
的に留める**。そして6週間おきのRustのリリースのタイミングで"non-major"の
PRを「収穫」し、"major"の方はしかるべき機会が来たら収穫する。

このリポジトリにおいては懸念が一つあり、Gradle Wrapperのアップデートに失
敗してgradle-wrapper.jarを消し飛ばしたPRが生成されてしまう。ただどういう
感じの現象なのかまだ不明であるし、Gradle Wrapperのバージョンだけ手動で更
新すれば回避可能であると思われることから、このPRでは除外設定はしない。

Resolves #470.

Co-authored-by: Hiroshiba <hihokaruta@gmail.com>
---
 renovate.json  | 41 -----------------------
 renovate.json5 | 90 ++++++++++++++++++++++++++++++++++++++++++++++++++
 2 files changed, 90 insertions(+), 41 deletions(-)
 delete mode 100644 renovate.json
 create mode 100644 renovate.json5

diff --git a/renovate.json b/renovate.json
deleted file mode 100644
index f56767ea0..000000000
--- a/renovate.json
+++ /dev/null
@@ -1,41 +0,0 @@
-{
-  "$schema": "https://docs.renovatebot.com/renovate-schema.json",
-  "extends": [
-    "config:recommended"
-  ],
-  "timezone": "Asia/Tokyo",
-  "packageRules": [
-    {
-      "groupSlug": "rust",
-      "groupName": "Rust",
-      "matchPackagePatterns": [
-        "^rust-lang/rust$"
-      ]
-    },
-    {
-      "groupSlug": "others",
-      "groupName": "Others",
-      "matchPackagePatterns": [
-        "*"
-      ],
-      "excludePackagePatterns": [
-        "^rust-lang/rust$"
-      ],
-      "dependencyDashboardApproval": true
-    }
-  ],
-  "customManagers": [
-    {
-      "customType": "regex",
-      "fileMatch": [
-        "^rust-toolchain$"
-      ],
-      "matchStrings": [
-        "(?<currentValue>\\d+\\.\\d+\\.\\d+)"
-      ],
-      "depNameTemplate": "Rust",
-      "packageNameTemplate": "rust-lang/rust",
-      "datasourceTemplate": "github-tags"
-    }
-  ]
-}
diff --git a/renovate.json5 b/renovate.json5
new file mode 100644
index 000000000..6fc45ac18
--- /dev/null
+++ b/renovate.json5
@@ -0,0 +1,90 @@
+{
+  $schema: "https://docs.renovatebot.com/renovate-schema.json",
+  extends: [
+    "config:recommended",
+  ],
+  timezone: "Asia/Tokyo",
+  separateMajorMinor: false,
+  dependencyDashboardApproval: true, // 万が一`packageRules`の網羅性に穴ができた場合に備え
+  packageRules: [
+    // `separateMajorMinor`を無効化した上で次の二つのgroupにすべてをまとめる。
+    //
+    // * "major dependencies" (`renovate/major-dependencies`)
+    // * "non-major dependencies" (`renovate/non-major-dependencies`)
+    //
+    // バージョン0.y.z (y≧1)のyとバージョン0.0.zのzの変更は"major dependencies"の方に含むようにする。
+
+    // メジャーバージョンの更新
+    {
+      groupName: "major dependencies",
+      matchUpdateTypes: [
+        "major",
+      ],
+      dependencyDashboardApproval: false,
+    },
+    {
+      groupName: "major dependencies",
+      matchUpdateTypes: [
+        "minor",
+      ],
+      matchCurrentVersion: "/^v?0\\./",
+      dependencyDashboardApproval: false,
+    },
+    {
+      groupName: "major dependencies",
+      matchUpdateTypes: [
+        "patch",
+      ],
+      matchCurrentVersion: "/^v?0\\.0\\./",
+      dependencyDashboardApproval: false,
+    },
+
+    // メジャーバージョン以外の更新
+    {
+      groupName: "non-major dependencies",
+      matchUpdateTypes: [
+        "minor",
+      ],
+      matchCurrentVersion: "!/^v?0\\./",
+      dependencyDashboardApproval: false,
+    },
+    {
+      groupName: "non-major dependencies",
+      matchUpdateTypes: [
+        "patch",
+      ],
+      matchCurrentVersion: "!/^v?0\\.0\\./",
+      dependencyDashboardApproval: false,
+    },
+
+    // GHAのrunnerに対しては無効化する
+    {
+      matchDatasources: [
+        "github-runners",
+      ],
+      matchPackageNames: [
+        "windows",
+        "macos",
+        "ubuntu",
+      ],
+      enabled: false,
+    },
+  ],
+  cargo: {
+    rangeStrategy: "bump",
+  },
+  customManagers: [
+    {
+      customType: "regex",
+      fileMatch: [
+        "^rust-toolchain$",
+      ],
+      matchStrings: [
+        "(?<currentValue>\\d+\\.\\d+\\.\\d+)",
+      ],
+      depNameTemplate: "Rust",
+      packageNameTemplate: "rust-lang/rust",
+      datasourceTemplate: "github-tags",
+    },
+  ],
+}

From f3c5be04822cd05a53f7cc6009ba2aa499d65689 Mon Sep 17 00:00:00 2001
From: Hiroshiba <hihokaruta@gmail.com>
Date: Sun, 29 Sep 2024 16:04:37 +0900
Subject: [PATCH 36/36] =?UTF-8?q?docs:=20README=E3=81=AE=E3=83=93=E3=83=AB?=
 =?UTF-8?q?=E3=83=89=E5=91=A8=E3=82=8A=E3=81=AE=E8=A8=98=E8=BC=89=E3=82=92?=
 =?UTF-8?q?=E6=9B=B4=E6=96=B0=E3=81=97=E3=80=81=E8=87=AA=E5=88=86=E3=81=A7?=
 =?UTF-8?q?=E3=83=93=E3=83=AB=E3=83=89=E3=81=97=E3=81=9F=E5=A0=B4=E5=90=88?=
 =?UTF-8?q?=E3=81=AF=E8=A3=BD=E5=93=81=E7=89=88=E3=81=AEVVM=E3=81=8C?=
 =?UTF-8?q?=E8=AA=AD=E3=82=81=E3=81=AA=E3=81=84=E3=81=93=E3=81=A8=E3=82=92?=
 =?UTF-8?q?=E3=82=8F=E3=81=8B=E3=82=8B=E3=82=88=E3=81=86=E3=81=AB=20(#840)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

頂いたコメントをもとに、自分でビルドした場合はサンプルモデルしか読み込め
ないことがわかるようにする。

https://github.com/VOICEVOX/voicevox_core/issues/492#issuecomment-2377448309

実際は自分で作ったonnxモデルなども読み込めるといえば読み込めるため、「製
品版VOICEVOXのvvmは読み込めません。」の方が適切かもしれない。ただ
VOICEVOX/voicevox_project#24 を完遂したら不要になる一文であるため、あま
り考えすぎる必要もないということで元の文章からほとんど変わらない形を採用
した。

close #492
---
 README.md | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/README.md b/README.md
index 4496dd491..129854da8 100644
--- a/README.md
+++ b/README.md
@@ -144,9 +144,9 @@ VOICEVOX CORE の主要機能は Rust で実装されることを前提として
 
 ## コアライブラリのビルド
 
-[Releases](https://github.com/VOICEVOX/voicevox_core/releases) にあるビルド済みのコアライブラリを利用せず、自分で一からビルドする場合こちらを参照してください。ビルドには [Rust](https://www.rust-lang.org/ja) ([Windows での Rust 開発環境構築手順はこちら](https://docs.microsoft.com/ja-jp/windows/dev-environment/rust/setup)) と [cmake](https://cmake.org/download/) が必要です。
-
-model フォルダにある onnx モデルはダミーのため、ノイズの混じった音声が出力されます
+ビルドには [Rust](https://www.rust-lang.org/ja) ([Windows での Rust 開発環境構築手順はこちら](https://docs.microsoft.com/ja-jp/windows/dev-environment/rust/setup)) と [cmake](https://cmake.org/download/) が必要です。
+[Releases](https://github.com/VOICEVOX/voicevox_core/releases) にあるビルド済みのコアライブラリを利用せず、自分で一からビルドした場合は、model フォルダにある onnx モデルのみが利用できます。
+このモデルはダミーのため、ノイズの混じった音声が出力されます。
 
 ```bash
 # DLLをビルド