faster tauri dev

yujonglee · yujonglee · commit e9ce3c199a57 · 2025-09-18T15:55:48.000-07:00
diff --git a/crates/whisper-local/Cargo.toml b/crates/whisper-local/Cargo.toml
@@ -5,14 +5,16 @@ edition = "2021"
 
 # https://github.com/tazz4843/whisper-rs/blob/e3d67d5/Cargo.toml
 [features]
-default = []
-coreml = ["whisper-rs/coreml"]
-cuda = ["whisper-rs/cuda"]
-hipblas = ["whisper-rs/hipblas"]
-openblas = ["whisper-rs/openblas"]
-metal = ["whisper-rs/metal"]
-vulkan = ["whisper-rs/vulkan"]
-openmp = ["whisper-rs/openmp"]
+default = ["actual"]
+actual = ["dep:whisper-rs"]
+
+coreml = ["actual", "whisper-rs/coreml"]
+cuda = ["actual", "whisper-rs/cuda"]
+hipblas = ["actual", "whisper-rs/hipblas"]
+openblas = ["actual", "whisper-rs/openblas"]
+metal = ["actual", "whisper-rs/metal"]
+vulkan = ["actual", "whisper-rs/vulkan"]
+openmp = ["actual", "whisper-rs/openmp"]
 
 [dependencies]
 hypr-audio-utils = { workspace = true }
@@ -23,7 +25,7 @@ hound = { workspace = true }
 
 kalosm-sound = { workspace = true, default-features = false }
 rodio = { workspace = true }
-whisper-rs = { git = "https://codeberg.org/tazz4843/whisper-rs", rev = "0c509ec", features = ["raw-api", "tracing_backend"] }
+whisper-rs = { git = "https://codeberg.org/tazz4843/whisper-rs", rev = "0c509ec", features = ["raw-api", "tracing_backend"], optional = true }
 
 futures-util = { workspace = true }
 tracing = { workspace = true }
diff --git a/crates/whisper-local/src/error.rs b/crates/whisper-local/src/error.rs
@@ -4,6 +4,7 @@ use serde::{ser::Serializer, Serialize};
 pub enum Error {
     #[error("model_not_found")]
     ModelNotFound,
+    #[cfg(feature = "actual")]
     #[error(transparent)]
     LocalWhisperError(#[from] whisper_rs::WhisperError),
 }
diff --git a/crates/whisper-local/src/ggml.rs b/crates/whisper-local/src/ggml.rs
@@ -0,0 +1,75 @@
+/// Description of one compute device reported by ggml's backend device API.
+#[derive(Debug, Clone, serde::Serialize, serde::Deserialize, specta::Type)]
+pub struct GgmlBackend {
+    /// Device class: `"CPU"`, `"ACCEL"`, `"GPU"`, or `"UNKNOWN"`.
+    pub kind: String,
+    /// Device name as returned by `ggml_backend_dev_name`.
+    pub name: String,
+    /// Device description as returned by `ggml_backend_dev_description`.
+    pub description: String,
+    /// Total device memory in MiB (bytes / 1024 / 1024, rounded down).
+    pub total_memory_mb: usize,
+    /// Free device memory in MiB (bytes / 1024 / 1024, rounded down).
+    pub free_memory_mb: usize,
+}
+
+/// Returns the ggml compute devices available to this build.
+///
+/// This stub is compiled for debug builds and for builds without the `actual`
+/// feature (where `whisper-rs` is not a dependency); it always returns an empty list.
+// The predicate must be the exact negation of the one on the real
+// implementation below, so that every feature/profile combination defines
+// `list_ggml_backends` exactly once.
+#[cfg(any(not(feature = "actual"), debug_assertions))]
+pub fn list_ggml_backends() -> Vec<GgmlBackend> {
+    vec![]
+}
+
+// https://github.com/ggml-org/llama.cpp/blob/3a9457d/common/arg.cpp#L2300
+#[cfg(all(feature = "actual", not(debug_assertions)))]
+pub fn list_ggml_backends() -> Vec<GgmlBackend> {
+    use whisper_rs::whisper_rs_sys::{
+        ggml_backend_dev_count, ggml_backend_dev_description, ggml_backend_dev_get,
+        ggml_backend_dev_memory, ggml_backend_dev_name, ggml_backend_dev_type,
+        ggml_backend_dev_type_GGML_BACKEND_DEVICE_TYPE_ACCEL as GGML_BACKEND_DEVICE_TYPE_ACCEL,
+        ggml_backend_dev_type_GGML_BACKEND_DEVICE_TYPE_CPU as GGML_BACKEND_DEVICE_TYPE_CPU,
+        ggml_backend_dev_type_GGML_BACKEND_DEVICE_TYPE_GPU as GGML_BACKEND_DEVICE_TYPE_GPU,
+    };
+
+    let count = unsafe { ggml_backend_dev_count() };
+    let mut devices = Vec::with_capacity(count);
+
+    for i in 0..count {
+        unsafe {
+            let dev = ggml_backend_dev_get(i);
+
+            let kind: String = match ggml_backend_dev_type(dev) {
+                GGML_BACKEND_DEVICE_TYPE_CPU => "CPU".into(),
+                GGML_BACKEND_DEVICE_TYPE_ACCEL => "ACCEL".into(),
+                GGML_BACKEND_DEVICE_TYPE_GPU => "GPU".into(),
+                _ => "UNKNOWN".into(),
+            };
+
+            let name = std::ffi::CStr::from_ptr(ggml_backend_dev_name(dev))
+                .to_string_lossy()
+                .into_owned();
+            let description = std::ffi::CStr::from_ptr(ggml_backend_dev_description(dev))
+                .to_string_lossy()
+                .into_owned();
+
+            let mut free_mem: usize = 0;
+            let mut total_mem: usize = 0;
+            ggml_backend_dev_memory(dev, &mut free_mem, &mut total_mem);
+
+            devices.push(GgmlBackend {
+                kind,
+                name,
+                description,
+                total_memory_mb: total_mem / 1024 / 1024,
+                free_memory_mb: free_mem / 1024 / 1024,
+            });
+        }
+    }
+
+    devices
+}
diff --git a/crates/whisper-local/src/lib.rs b/crates/whisper-local/src/lib.rs
@@ -1,4 +1,5 @@
-// https://github.com/tazz4843/whisper-rs/blob/master/examples/audio_transcription.rs
+mod ggml;
+pub use ggml::*;
 
 mod stream;
 pub use stream::*;
@@ -8,60 +9,3 @@ pub use model::*;
 
 mod error;
 pub use error::*;
-
-#[derive(Debug, Clone, serde::Serialize, serde::Deserialize, specta::Type)]
-pub struct GgmlBackend {
-    pub kind: String,
-    pub name: String,
-    pub description: String,
-    pub total_memory_mb: usize,
-    pub free_memory_mb: usize,
-}
-
-// https://github.com/ggml-org/llama.cpp/blob/3a9457d/common/arg.cpp#L2300
-pub fn list_ggml_backends() -> Vec<GgmlBackend> {
-    use whisper_rs::whisper_rs_sys::{
-        ggml_backend_dev_count, ggml_backend_dev_description, ggml_backend_dev_get,
-        ggml_backend_dev_memory, ggml_backend_dev_name, ggml_backend_dev_type,
-        ggml_backend_dev_type_GGML_BACKEND_DEVICE_TYPE_ACCEL as GGML_BACKEND_DEVICE_TYPE_ACCEL,
-        ggml_backend_dev_type_GGML_BACKEND_DEVICE_TYPE_CPU as GGML_BACKEND_DEVICE_TYPE_CPU,
-        ggml_backend_dev_type_GGML_BACKEND_DEVICE_TYPE_GPU as GGML_BACKEND_DEVICE_TYPE_GPU,
-    };
-
-    let count = unsafe { ggml_backend_dev_count() };
-    let mut devices = Vec::with_capacity(count);
-
-    for i in 0..count {
-        unsafe {
-            let dev = ggml_backend_dev_get(i);
-
-            let kind: String = match ggml_backend_dev_type(dev) {
-                GGML_BACKEND_DEVICE_TYPE_CPU => "CPU".into(),
-                GGML_BACKEND_DEVICE_TYPE_ACCEL => "ACCEL".into(),
-                GGML_BACKEND_DEVICE_TYPE_GPU => "GPU".into(),
-                _ => "UNKNOWN".into(),
-            };
-
-            let name = std::ffi::CStr::from_ptr(ggml_backend_dev_name(dev))
-                .to_string_lossy()
-                .into_owned();
-            let description = std::ffi::CStr::from_ptr(ggml_backend_dev_description(dev))
-                .to_string_lossy()
-                .into_owned();
-
-            let mut free_mem: usize = 0;
-            let mut total_mem: usize = 0;
-            ggml_backend_dev_memory(dev, &mut free_mem, &mut total_mem);
-
-            devices.push(GgmlBackend {
-                kind,
-                name,
-                description,
-                total_memory_mb: total_mem / 1024 / 1024,
-                free_memory_mb: free_mem / 1024 / 1024,
-            });
-        }
-    }
-
-    devices
-}
diff --git a/crates/whisper-local/src/model/actual.rs b/crates/whisper-local/src/model/actual.rs
@@ -10,6 +10,8 @@ use whisper_rs::{
 
 use hypr_whisper::Language;
 
+use crate::Segment;
+
 lazy_static! {
     static ref TRAILING_DOTS: Regex = Regex::new(r"\.{2,}$").unwrap();
 }
@@ -89,7 +91,7 @@ impl Whisper {
         WhisperBuilder::default()
     }
 
-    pub fn transcribe(&mut self, audio: &[f32]) -> Result<Vec<Segment>, super::Error> {
+    pub fn transcribe(&mut self, audio: &[f32]) -> Result<Vec<Segment>, crate::Error> {
         #[cfg(debug_assertions)]
         self.debug(audio);
 
@@ -187,7 +189,7 @@ impl Whisper {
         Ok(segments)
     }
 
-    fn get_language(&mut self, audio: &[f32]) -> Result<Option<String>, super::Error> {
+    fn get_language(&mut self, audio: &[f32]) -> Result<Option<String>, crate::Error> {
         if self.languages.len() == 0 {
             tracing::info!("no_language_specified");
             return Ok(None);
@@ -292,47 +294,6 @@ impl Whisper {
     }
 }
 
-// https://github.com/floneum/floneum/blob/52967ae/models/rwhisper/src/lib.rs#L116
-#[derive(Debug, Default)]
-pub struct Segment {
-    pub text: String,
-    pub language: Option<String>,
-    pub start: f64,
-    pub end: f64,
-    pub confidence: f32,
-    pub meta: Option<serde_json::Value>,
-}
-
-impl Segment {
-    pub fn text(&self) -> &str {
-        &self.text
-    }
-
-    pub fn language(&self) -> Option<&str> {
-        self.language.as_deref()
-    }
-
-    pub fn start(&self) -> f64 {
-        self.start
-    }
-
-    pub fn end(&self) -> f64 {
-        self.end
-    }
-
-    pub fn duration(&self) -> f64 {
-        self.end - self.start
-    }
-
-    pub fn confidence(&self) -> f32 {
-        self.confidence
-    }
-
-    pub fn meta(&self) -> Option<serde_json::Value> {
-        self.meta.clone()
-    }
-}
-
 #[cfg(test)]
 mod tests {
     use super::*;
diff --git a/crates/whisper-local/src/model/mock.rs b/crates/whisper-local/src/model/mock.rs
@@ -0,0 +1,39 @@
+use crate::Segment;
+use hypr_whisper::Language;
+
+#[derive(Default)]
+pub struct WhisperBuilder {}
+
+#[derive(Default)]
+pub struct Whisper {}
+
+impl WhisperBuilder {
+    pub fn model_path(self, _model_path: impl Into<String>) -> Self {
+        self
+    }
+
+    pub fn languages(self, _languages: Vec<Language>) -> Self {
+        self
+    }
+
+    pub fn build(self) -> Result<Whisper, crate::Error> {
+        Ok(Whisper {})
+    }
+}
+
+impl Whisper {
+    pub fn builder() -> WhisperBuilder {
+        WhisperBuilder::default()
+    }
+
+    pub fn transcribe(&mut self, _samples: &[f32]) -> Result<Vec<Segment>, crate::Error> {
+        Ok(vec![Segment {
+            text: "mock".to_string(),
+            language: None,
+            start: 0.0,
+            end: 1.0,
+            confidence: 1.0,
+            meta: None,
+        }])
+    }
+}
diff --git a/crates/whisper-local/src/model/mod.rs b/crates/whisper-local/src/model/mod.rs
@@ -0,0 +1,49 @@
+#[cfg(feature = "actual")]
+mod actual;
+#[cfg(feature = "actual")]
+pub use actual::*;
+
+#[cfg(not(feature = "actual"))]
+mod mock;
+#[cfg(not(feature = "actual"))]
+pub use mock::*;
+
+#[derive(Debug, Default)]
+pub struct Segment {
+    pub text: String,
+    pub language: Option<String>,
+    pub start: f64,
+    pub end: f64,
+    pub confidence: f32,
+    pub meta: Option<serde_json::Value>,
+}
+
+impl Segment {
+    pub fn text(&self) -> &str {
+        &self.text
+    }
+
+    pub fn language(&self) -> Option<&str> {
+        self.language.as_deref()
+    }
+
+    pub fn start(&self) -> f64 {
+        self.start
+    }
+
+    pub fn end(&self) -> f64 {
+        self.end
+    }
+
+    pub fn duration(&self) -> f64 {
+        self.end - self.start
+    }
+
+    pub fn confidence(&self) -> f32 {
+        self.confidence
+    }
+
+    pub fn meta(&self) -> Option<serde_json::Value> {
+        self.meta.clone()
+    }
+}
diff --git a/crates/whisper-local/src/stream.rs b/crates/whisper-local/src/stream.rs
@@ -8,7 +8,7 @@ use dasp::sample::FromSample;
 use futures_util::{Stream, StreamExt};
 use rodio::Source;
 
-use super::{Segment, Whisper};
+use crate::{Segment, Whisper};
 
 pub struct TranscriptionTask<S, T> {
     stream: S,

Original file line number	Diff line number	Diff line change
`@@ -4,6 +4,7 @@ use serde::{ser::Serializer, Serialize};`
`4`	`4`	`pub enum Error {`
`5`	`5`	`#[error("model_not_found")]`
`6`	`6`	`ModelNotFound,`
	`7`	`+ #[cfg(feature = "actual")]`
`7`	`8`	`#[error(transparent)]`
`8`	`9`	`LocalWhisperError(#[from] whisper_rs::WhisperError),`
`9`	`10`	`}`