initial outline for rate limiting status updates

This commit is contained in:
KCaverly 2023-09-08 12:35:15 -04:00
parent e9747d0fea
commit a5ee8fc805
4 changed files with 106 additions and 8 deletions

View file

@ -21,7 +21,7 @@ use std::{
atomic::{self, AtomicUsize},
Arc,
},
time::SystemTime,
time::{Duration, SystemTime},
};
use unindent::Unindent;
use util::RandomCharIter;
@ -1275,6 +1275,10 @@ impl EmbeddingProvider for FakeEmbeddingProvider {
200
}
/// Reports this provider's rate-limit expiration as a zero-length duration.
///
/// The value is constant and does not read any state from `self`.
// NOTE(review): presumably zero means "no rate limit is currently pending";
// confirm against the `EmbeddingProvider` trait's contract.
fn rate_limit_expiration(&self) -> Duration {
    Duration::from_secs(0)
}
async fn embed_batch(&self, spans: Vec<String>) -> Result<Vec<Embedding>> {
self.embedding_count
.fetch_add(spans.len(), atomic::Ordering::SeqCst);