refactor · tiles.run/tiles@7dcfa4e

A local-first, private AI assistant for everyday use. It runs on-device models with encrypted P2P sync and supports sharing chats publicly on ATProto.

fork

+3 -8

4 changed files

expand all

Cargo.lock

server

backend

mlx.py

tiles

Cargo.toml

src

runtime

mlx.rs

-3

Cargo.lock

··· 528 528 checksum = "145052bdd345b87320e369255277e3fb5152762ad123a901ef5c262dd38fe8d2" 529 529 dependencies = [ 530 530 "iana-time-zone", 531 - "js-sys", 532 531 "num-traits", 533 - "wasm-bindgen", 534 532 "windows-link", 535 533 ] 536 534 ··· 3316 3314 version = "0.4.0-rc.1" 3317 3315 dependencies = [ 3318 3316 "anyhow", 3319 - "chrono", 3320 3317 "clap", 3321 3318 "futures-util", 3322 3319 "hf-hub",

+1 -2

server/backend/mlx.py

··· 170 170 "choices": [{"index": 0, "delta": {}, "finish_reason": "stop"}], 171 171 } 172 172 173 - # Include benchmarking metrics if available 173 + # Include benchmarking metrics if available 174 174 if metrics: 175 175 final_response["metrics"] = { 176 176 "ttft_ms": metrics.ttft_ms, ··· 178 178 "tokens_per_second": metrics.tokens_per_second, 179 179 "total_latency_s": metrics.total_latency_s, 180 180 } 181 - print(f"data: {json.dumps(final_response)}") 182 181 yield f"data: {json.dumps(final_response)}\n\n" 183 182 yield "data: [DONE]\n\n" 184 183

-1

tiles/Cargo.toml

··· 15 15 futures-util = "0.3" 16 16 hf-hub = {version = "0.4", features = ["tokio"]} 17 17 rustyline = "17.0" 18 - chrono = "0.4"

+2 -2

tiles/src/runtime/mlx.rs

··· 452 452 format!( 453 453 "\n{} {:.1} tok/s | {} tokens | {:.0}ms TTFT", 454 454 "💡".yellow(), 455 - bench_metrics.total_tokens 456 - / bench_metrics.total_latency_s as i32, 455 + bench_metrics.total_tokens as f64 456 + / bench_metrics.total_latency_s, 457 457 bench_metrics.total_tokens, 458 458 bench_metrics.ttft_ms 459 459 )

Configure Feed

Configure Feed