fix: use rawPredict for non-streaming Claude requests
CI / All (ubuntu-latest) (push) Failing after 24s
CI / All (macos-latest) (push) Has been cancelled
CI / All (windows-latest) (push) Has been cancelled

This commit is contained in:
2026-06-09 23:05:31 -06:00
parent bca25404ab
commit 33c6f2c4e3
3 changed files with 9 additions and 5 deletions
+5 -1
View File
@@ -119,7 +119,11 @@ fn prepare_chat_completions(
format!("{base_url}/google/models/{model_name}:{func}") format!("{base_url}/google/models/{model_name}:{func}")
} }
ModelCategory::Claude => { ModelCategory::Claude => {
format!("{base_url}/anthropic/models/{model_name}:streamRawPredict") let func = match data.stream {
true => "streamRawPredict",
false => "rawPredict",
};
format!("{base_url}/anthropic/models/{model_name}:{func}")
} }
ModelCategory::Mistral => { ModelCategory::Mistral => {
let func = match data.stream { let func = match data.stream {
+3 -3
View File
@@ -16,8 +16,8 @@ use parking_lot::RwLock;
use serde::{Deserialize, Serialize}; use serde::{Deserialize, Serialize};
use serde_json::json; use serde_json::json;
use std::{ use std::{
collections::HashMap, env, fmt, fmt::Debug, fs, hash::Hash, path::Path, sync::Arc, cmp::Ordering, collections::HashMap, env, fmt, fmt::Debug, fs, hash::Hash, path::Path,
time::Duration, sync::Arc, time::Duration,
}; };
use tokio::time::sleep; use tokio::time::sleep;
@@ -1196,7 +1196,7 @@ fn reciprocal_rank_fusion(
} }
} }
let mut sorted_items: Vec<(DocumentId, f32)> = map.into_iter().collect(); let mut sorted_items: Vec<(DocumentId, f32)> = map.into_iter().collect();
sorted_items.sort_by(|a, b| b.1.partial_cmp(&a.1).unwrap()); sorted_items.sort_by(|a, b| b.1.partial_cmp(&a.1).unwrap_or(Ordering::Equal));
sorted_items sorted_items
.into_iter() .into_iter()