Onde Inference
Instant local inference.
Infinite cloud scale.
A native on-device runtime built on Apple Silicon that bursts seamlessly to the cloud with a single line of code.
main.rs
use onde::inference::{ChatEngine, GgufModelConfig};

// Build the engine, then load the GGUF model selected by `platform_default()`.
// NOTE(review): the second argument looks like a system prompt and the third
// is left as `None`; confirm both against the `load_gguf_model` signature.
let engine = ChatEngine::new();
engine
    .load_gguf_model(
        GgufModelConfig::platform_default(),
        Some("You are a helpful assistant.".into()),
        None,
    )
    .await?;

// Send a single message and print the text of the reply.
let reply = engine.send_message("Hello!").await?;
println!("{}", reply.text);
// completed in 85ms — 100% on device