3 parallel models
This commit is contained in:
@@ -85,7 +85,32 @@
|
||||
#keep_alive = "15m";
|
||||
available_models = [
|
||||
{
|
||||
name = "glm-4.7-flash";
|
||||
name = "deepseek-r1:1.5b";
|
||||
max_tokens = 128000;
|
||||
keep_alive = "15m";
|
||||
}
|
||||
{
|
||||
name = "deepseek-r1:32b";
|
||||
max_tokens = 128000;
|
||||
keep_alive = "15m";
|
||||
}
|
||||
{
|
||||
name = "deepseek-r1:70b";
|
||||
max_tokens = 128000;
|
||||
keep_alive = "15m";
|
||||
}
|
||||
{
|
||||
name = "qwen3-coder-next";
|
||||
max_tokens = 128000;
|
||||
keep_alive = "15m";
|
||||
}
|
||||
{
|
||||
name = "lennyerik/zeta";
|
||||
max_tokens = 128000;
|
||||
keep_alive = "15m";
|
||||
}
|
||||
{
|
||||
name = "nomic-embed-text:latest";
|
||||
max_tokens = 128000;
|
||||
keep_alive = "15m";
|
||||
}
|
||||
@@ -94,6 +119,21 @@
|
||||
max_tokens = 128000;
|
||||
keep_alive = "15m";
|
||||
}
|
||||
{
|
||||
name = "glm-4.7-flash";
|
||||
max_tokens = 128000;
|
||||
keep_alive = "15m";
|
||||
}
|
||||
{
|
||||
name = "nemotron-cascade-2:30b";
|
||||
max_tokens = 128000;
|
||||
keep_alive = "15m";
|
||||
}
|
||||
{
|
||||
name = "magistral";
|
||||
max_tokens = 128000;
|
||||
keep_alive = "15m";
|
||||
}
|
||||
];
|
||||
};
|
||||
};
|
||||
|
||||
Reference in New Issue
Block a user