A local-first private AI assistant for everyday use. It runs on-device models with encrypted P2P sync and supports sharing chats publicly on ATProto.
10
fork

Configure Feed

Select the types of activity you want to include in your feed.

refactor

madclaws 7dcfa4e2 7f171188

+3 -8
-3
Cargo.lock
··· 528 528 checksum = "145052bdd345b87320e369255277e3fb5152762ad123a901ef5c262dd38fe8d2" 529 529 dependencies = [ 530 530 "iana-time-zone", 531 - "js-sys", 532 531 "num-traits", 533 - "wasm-bindgen", 534 532 "windows-link", 535 533 ] 536 534 ··· 3316 3314 version = "0.4.0-rc.1" 3317 3315 dependencies = [ 3318 3316 "anyhow", 3319 - "chrono", 3320 3317 "clap", 3321 3318 "futures-util", 3322 3319 "hf-hub",
+1 -2
server/backend/mlx.py
··· 170 170 "choices": [{"index": 0, "delta": {}, "finish_reason": "stop"}], 171 171 } 172 172 173 - # Include benchmarking metrics if available 173 + # Include benchmarking metrics if available 174 174 if metrics: 175 175 final_response["metrics"] = { 176 176 "ttft_ms": metrics.ttft_ms, ··· 178 178 "tokens_per_second": metrics.tokens_per_second, 179 179 "total_latency_s": metrics.total_latency_s, 180 180 } 181 - print(f"data: {json.dumps(final_response)}") 182 181 yield f"data: {json.dumps(final_response)}\n\n" 183 182 yield "data: [DONE]\n\n" 184 183
-1
tiles/Cargo.toml
··· 15 15 futures-util = "0.3" 16 16 hf-hub = {version = "0.4", features = ["tokio"]} 17 17 rustyline = "17.0" 18 - chrono = "0.4"
+2 -2
tiles/src/runtime/mlx.rs
··· 452 452 format!( 453 453 "\n{} {:.1} tok/s | {} tokens | {:.0}ms TTFT", 454 454 "💡".yellow(), 455 - bench_metrics.total_tokens 456 - / bench_metrics.total_latency_s as i32, 455 + bench_metrics.total_tokens as f64 456 + / bench_metrics.total_latency_s, 457 457 bench_metrics.total_tokens, 458 458 bench_metrics.ttft_ms 459 459 )