# Manifest for the crate that builds the `ruvllm` command-line executable.
# Keys written as `<key>.workspace = true` inherit their value from the
# workspace root manifest instead of being set here.
[package]
name = "ruvllm-cli"
version.workspace = true
authors.workspace = true
edition.workspace = true
license.workspace = true
repository.workspace = true
rust-version.workspace = true
description = "CLI for RuvLLM model management and inference on Apple Silicon"

# The produced executable is named `ruvllm`, which differs from the package
# name `ruvllm-cli`; its entry point is `src/main.rs`.
[[bin]]
name = "ruvllm"
path = "src/main.rs"

# Runtime dependencies. Entries with `workspace = true` take their version
# (and any base features) from the workspace root manifest; entries with an
# explicit version string are pinned by this crate alone.
[dependencies]
# RuvLLM core library (sibling path dependency, built with its "candle" feature)
ruvllm = { path = "../ruvllm", features = ["candle"] }

# CLI framework
clap = { version = "4.5", features = ["derive", "cargo", "env"] }
indicatif = { workspace = true }
console = { workspace = true }

# Async runtime
# tokio's "full" feature already enables "signal", so it is not listed separately.
tokio = { workspace = true, features = ["full"] }
futures = { workspace = true }

# HuggingFace Hub for model downloads
hf-hub = { version = "0.3", features = ["tokio"] }

# HTTP server for inference API
axum = { version = "0.7", features = ["ws"] }
tower = "0.5"
tower-http = { version = "0.6", features = ["cors", "trace"] }

# Serialization
serde = { workspace = true }
serde_json = { workspace = true }

# Error handling and diagnostics
thiserror = { workspace = true }
anyhow = { workspace = true }
tracing = { workspace = true }
tracing-subscriber = { workspace = true }

# Utilities
chrono = { workspace = true }
uuid = { workspace = true }
dirs = "5.0"
colored = "2.1"
rustyline = "14.0"
ctrlc = "3.4"
bytesize = "1.3"
prettytable-rs = "0.10"
dialoguer = "0.11"

# Streaming
async-stream = "0.3"

# Compiled only for tests, examples, and benchmarks; these crates are never
# linked into the shipped `ruvllm` binary.
[dev-dependencies]
assert_cmd = "2.0"
predicates = "3.1"
tempfile = "3.13"

# Hardware acceleration is opt-in: no feature is enabled by default.
# Each feature below only forwards to the feature of the same name on the
# `ruvllm` library dependency.
[features]
default = []
# Metal acceleration for Apple Silicon (M1/M2/M3/M4)
metal = ["ruvllm/metal"]
# CUDA acceleration for NVIDIA GPUs
cuda = ["ruvllm/cuda"]