# Manifest for the `kalosm-sound` crate.
[package]
name = "kalosm-sound"
version = "0.3.4"
authors = ["Evan Almloff"]
edition = "2021"
keywords = ["ai", "whisper"]
# SPDX expression; the older `MIT/Apache-2.0` slash form is deprecated by Cargo.
license = "MIT OR Apache-2.0"
repository = "https://github.com/floneum/floneum"
description = "A set of pretrained audio models "

[dependencies]
# Always-on dependencies. Entries marked `.workspace = true` inherit their
# version and source from the workspace root manifest.
anyhow = "1.0.70"
async-trait = "0.1.73"
byteorder = "1.4.3"
candle-core.workspace = true
candle-nn.workspace = true
candle-transformers.workspace = true
cpal = "0.15.1"
dasp = { version = "0.11.0", features = ["all"] }
futures-channel = "0.3.30"
futures-core = "0.3.30"
futures-util = "0.3.30"
hound = "3.5"
itertools = "0.10.5"
kalosm-streams.workspace = true
rand = "0.8.5"
rodio = "0.17.1"
rwhisper.workspace = true
serde_json = "1.0.107"
tokenizers = "0.19.1"
tokio = { version = "1.32.0", features = ["full"] }
tracing = "0.1.37"
# Optional dependencies; each is only pulled in through a feature in
# `[features]` below (`denoise` or `voice_detection`).
nnnoiseless = { version = "0.5.1", optional = true }
# `=` pins this to one exact pre-release version.
# NOTE(review): presumably required for compatibility with
# voice_activity_detector; confirm before relaxing the pin.
ort = { version = "=2.0.0-rc.4", optional = true }
voice_activity_detector = { version = "0.1.0", features = ["async"], optional = true }

[features]
# Voice activity detection and denoising are enabled unless the consumer
# sets `default-features = false`.
default = ["voice_detection", "denoise"]
# Forwards to the CUDA features of candle-core and rwhisper (including cuDNN).
cuda = ["candle-core/cuda", "rwhisper/cuda", "rwhisper/cudnn"]
denoise = ["dep:nnnoiseless"]
# Forwards to candle-core's Metal feature and to rwhisper's `accelerate`
# and `metal` features.
metal = ["candle-core/metal", "rwhisper/accelerate", "rwhisper/metal"]
mkl = ["candle-core/mkl", "rwhisper/mkl"]
voice_detection = ["dep:voice_activity_detector", "dep:ort"]

[dev-dependencies]
kalosm = { workspace = true, features = ["sound"] }