Skip to content

Commit 1eeaf9a

Browse files
committed
change tps value, bump version
1 parent 5c732db commit 1eeaf9a

File tree

3 files changed

+12
-8
lines changed

3 files changed

+12
-8
lines changed

Cargo.lock

Lines changed: 4 additions & 4 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

Cargo.toml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -7,7 +7,7 @@ default-members = ["compute"]
77

88
[workspace.package]
99
edition = "2021"
10-
version = "0.6.3"
10+
version = "0.6.4"
1111
license = "Apache-2.0"
1212
readme = "README.md"
1313

executor/src/executors/ollama.rs

Lines changed: 7 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -15,7 +15,7 @@ const DEFAULT_OLLAMA_PORT: u16 = 11434;
1515
/// Timeout duration for checking model performance during a generation.
1616
const PERFORMANCE_TIMEOUT: Duration = Duration::from_secs(120);
1717
/// Minimum tokens per second (TPS) for checking model performance during a generation.
18-
const PERFORMANCE_MIN_TPS: f64 = 15.0;
18+
const PERFORMANCE_MIN_TPS: f64 = 10.0;
1919

2020
/// Ollama-specific configurations.
2121
#[derive(Clone)]
@@ -85,8 +85,12 @@ impl OllamaClient {
8585
models: &mut HashSet<Model>,
8686
) -> Result<HashMap<Model, SpecModelPerformance>> {
8787
log::info!(
88-
"Checking Ollama requirements (auto-pull {}, timeout: {}s, min tps: {})",
89-
if self.auto_pull { "on" } else { "off" },
88+
"Checking Ollama requirements ({}, timeout: {}s, min tps: {})",
89+
if self.auto_pull {
90+
"auto-pull enabled"
91+
} else {
92+
"auto-pull disabled"
93+
},
9094
PERFORMANCE_TIMEOUT.as_secs(),
9195
PERFORMANCE_MIN_TPS
9296
);

0 commit comments

Comments
 (0)