Native node: lämmittelykutsu lataa mallin VRAM:iin heti käynnistyksessä
This commit is contained in:
@@ -1 +1 @@
|
|||||||
56f21a9
|
cf3bf54
|
||||||
|
|||||||
Binary file not shown.
@@ -363,8 +363,18 @@ async fn main() {
|
|||||||
st.push_log("System", format!("Malli valmis: {}", active_model), None);
|
st.push_log("System", format!("Malli valmis: {}", active_model), None);
|
||||||
}
|
}
|
||||||
|
|
||||||
// Haetaan VRAM-tila heti ja käynnistetään taustapäivitys (30s välein)
|
// Lämmittelykutsu: ladataan malli VRAM:iin ja haetaan VRAM-tila
|
||||||
if let Some(ref engine) = llm {
|
if let Some(ref engine) = llm {
|
||||||
|
{
|
||||||
|
let mut st = tui_state.write().await;
|
||||||
|
st.vram_status = "Ladataan VRAM:iin...".to_string();
|
||||||
|
st.push_log("System", "Ladataan mallia VRAM:iin...".to_string(), None);
|
||||||
|
}
|
||||||
|
// Lyhyt generate-kutsu pakottaa Ollaman lataamaan mallin GPU:lle
|
||||||
|
let _ = engine.generate("hi", &inference::GenerateOptions {
|
||||||
|
max_tokens: 1, system_prompt: None, temperature: Some(0.0),
|
||||||
|
top_k: Some(1), repeat_penalty: None, stop: None,
|
||||||
|
}).await;
|
||||||
if let Ok(Some(ps)) = engine.fetch_ps().await {
|
if let Ok(Some(ps)) = engine.fetch_ps().await {
|
||||||
let mut st = tui_state.write().await;
|
let mut st = tui_state.write().await;
|
||||||
st.vram_status = ps.display();
|
st.vram_status = ps.display();
|
||||||
|
|||||||
Reference in New Issue
Block a user