- docker-compose: Ollama-container GPU:lla + persistent volume malleille
- native-node: Candle poistettu, kutsuu Ollaman HTTP API:a (async)
- Dockerfile: yksinkertaistettu, ei CUDA SDK:ta (Ollama hoitaa GPU:n)
- Tukee kaikkia malleja: qwen2.5-coder:1.5b/3b/7b/14b/32b
- OLLAMA_MODEL ympäristömuuttujalla vaihdetaan malli
- kpn models näyttää Ollama-mallit nopeustiedoilla

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
18 lines
478 B
TOML
18 lines
478 B
TOML
# Crate metadata for the native-node package.
[package]
name = "native-node"
version = "0.2.0"
# The 2024 edition needs a toolchain that supports it (Rust 1.85 or newer).
edition = "2024"

[dependencies]
# Async runtime; "full" enables all of tokio's optional features.
tokio = { version = "1.36", features = ["full"] }
# WebSocket support on top of tokio, with TLS provided through native-tls.
tokio-tungstenite = { version = "0.21", features = ["native-tls"] }
futures-util = "0.3"
# Serialization: derive macros plus JSON encoding/decoding.
serde = { version = "1.0", features = ["derive"] }
serde_json = "1.0"
# System and GPU introspection crates.
# NOTE(review): confirm nvml-wrapper and wgpu are still referenced by the code.
sysinfo = "0.30"
nvml-wrapper = "0.10"
wgpu = "24"
# HTTP client with JSON request/response helpers
# (presumably used for the Ollama HTTP API; verify against the callers).
reqwest = { version = "0.12", features = ["json"] }
# Structured logging; "env-filter" enables environment-driven log filtering.
tracing = "0.1"
tracing-subscriber = { version = "0.3", features = ["env-filter"] }