Struct EmbedPool

Source

pub struct EmbedPool {
    tx: Sender<EmbedRequest>,
    live_workers: Arc<AtomicUsize>,
    loaded_workers: Arc<AtomicUsize>,
    model_rss_per_worker_bytes: Arc<AtomicUsize>,
}

Expand description

Async handle to the embedding worker thread pool.

Wraps a bounded mpsc channel shared by n spawn_blocking worker threads. Each worker owns its own ORT session and tokenizer; the pool dispatches EmbedRequest variants to whichever worker is free next.

Clone is cheap — the underlying channel sender and atomic counters are reference-counted.

Fields§

§tx: Sender<EmbedRequest>

§live_workers: Arc<AtomicUsize>

§loaded_workers: Arc<AtomicUsize>

Number of workers that currently have model instances loaded in memory.

§model_rss_per_worker_bytes: Arc<AtomicUsize>

Median RSS delta (bytes) measured across all workers during sequential model load.

Workers load one at a time (leader first, then followers in sequence). Each reports its own RSS before/after load_models() via ready_tx. The pool stores the median once all workers have signaled ready — robust to one outlier from page-cache settling or ORT arena init jitter.

Used by run_readiness_probe to correctly deduct the model-weight footprint from the available workspace before computing the per-worker budget. Returns 0 on non-Linux targets where RSS measurement is unavailable, or before the init task has completed.

Struct EmbedPool Copy item path

Fields§

Implementations§

impl EmbedPool

pub fn spawn( n: usize, cache_dir: PathBuf, config: WorkerConfig, ) -> (Self, JoinHandle<Result<()>>)

pub async fn dense( &self, texts: Vec<String>, ) -> Result<(Vec<Vec<f32>>, EmbedStats)>

§Errors

pub async fn sparse( &self, texts: Vec<String>, ) -> Result<(Vec<SparseEmbedding>, EmbedStats)>

§Errors

pub async fn both( &self, texts: Vec<String>, ) -> Result<(Vec<DualEmbedding>, EmbedStats)>

§Errors

pub(crate) async fn probe(&self, texts: Vec<String>) -> Result<ProbeResult>

pub fn live_worker_count(&self) -> usize

pub fn loaded_worker_count(&self) -> usize

pub fn queue_depth(&self) -> usize

pub fn model_rss_per_worker_bytes(&self) -> usize

Trait Implementations§

impl Clone for EmbedPool

fn clone(&self) -> EmbedPool

fn clone_from(&mut self, source: &Self)

Auto Trait Implementations§

impl Freeze for EmbedPool

impl RefUnwindSafe for EmbedPool

impl Send for EmbedPool

impl Sync for EmbedPool

impl Unpin for EmbedPool

impl UnsafeUnpin for EmbedPool

impl UnwindSafe for EmbedPool

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> FromRef<T> for T where T: Clone,

fn from_ref(input: &T) -> T

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T> PolicyExt for T where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P> where T: Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P> where T: Policy<B, E>, P: Policy<B, E>,

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self> where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

Struct EmbedPool

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T> FromRef<T> for T
where T: Clone,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T> PolicyExt for T
where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,