pub trait Pipeline:
Send
+ Sync
+ PreProcessingMixin
+ IsqPipelineMixin
+ CacheManagerMixin
+ AdapterActivationMixin
+ MetadataMixin
+ AnyMoePipelineMixin {
// Required methods
fn forward_inputs(
&mut self,
inputs: Box<dyn Any>,
return_raw_logits: bool,
) -> Result<ForwardInputsResult, Error>;
fn sample_causal_gen<'life0, 'life1, 'life2, 'life3, 'async_trait>(
&'life0 self,
seqs: &'life1 mut [&'life2 mut Sequence],
logits: Vec<Tensor>,
prefix_cacher: &'life3 mut PrefixCacheManagerV2,
disable_eos_stop: bool,
rng: Arc<Mutex<Isaac64Rng>>,
) -> Pin<Box<dyn Future<Output = Result<(), Error>> + Send + 'async_trait>>
where Self: 'async_trait,
'life0: 'async_trait,
'life1: 'async_trait,
'life2: 'async_trait,
'life3: 'async_trait;
fn category(&self) -> ModelCategory;
// Provided method
fn step<'life0, 'life1, 'life2, 'life3, 'life4, 'async_trait>(
&'life0 mut self,
input_seqs: &'life1 mut [&'life2 mut Sequence],
is_prompt: bool,
return_raw_logits: bool,
prefix_cacher: &'life3 mut PrefixCacheManagerV2,
disable_eos_stop: bool,
rng: Arc<Mutex<Isaac64Rng>>,
backend_metadata: CacheBackendMetadata<'life4>,
) -> Pin<Box<dyn Future<Output = Result<Duration, Error>> + Send + 'async_trait>>
where Self: 'async_trait,
'life0: 'async_trait,
'life1: 'async_trait,
'life2: 'async_trait,
'life3: 'async_trait,
'life4: 'async_trait { ... }
}
Required Methods§
fn forward_inputs( &mut self, inputs: Box<dyn Any>, return_raw_logits: bool, ) -> Result<ForwardInputsResult, Error>
fn sample_causal_gen<'life0, 'life1, 'life2, 'life3, 'async_trait>(
&'life0 self,
seqs: &'life1 mut [&'life2 mut Sequence],
logits: Vec<Tensor>,
prefix_cacher: &'life3 mut PrefixCacheManagerV2,
disable_eos_stop: bool,
rng: Arc<Mutex<Isaac64Rng>>,
) -> Pin<Box<dyn Future<Output = Result<(), Error>> + Send + 'async_trait>>where
Self: 'async_trait,
'life0: 'async_trait,
'life1: 'async_trait,
'life2: 'async_trait,
'life3: 'async_trait,
fn category(&self) -> ModelCategory
Provided Methods§
sourcefn step<'life0, 'life1, 'life2, 'life3, 'life4, 'async_trait>(
&'life0 mut self,
input_seqs: &'life1 mut [&'life2 mut Sequence],
is_prompt: bool,
return_raw_logits: bool,
prefix_cacher: &'life3 mut PrefixCacheManagerV2,
disable_eos_stop: bool,
rng: Arc<Mutex<Isaac64Rng>>,
backend_metadata: CacheBackendMetadata<'life4>,
) -> Pin<Box<dyn Future<Output = Result<Duration, Error>> + Send + 'async_trait>>where
Self: 'async_trait,
'life0: 'async_trait,
'life1: 'async_trait,
'life2: 'async_trait,
'life3: 'async_trait,
'life4: 'async_trait,
fn step<'life0, 'life1, 'life2, 'life3, 'life4, 'async_trait>(
&'life0 mut self,
input_seqs: &'life1 mut [&'life2 mut Sequence],
is_prompt: bool,
return_raw_logits: bool,
prefix_cacher: &'life3 mut PrefixCacheManagerV2,
disable_eos_stop: bool,
rng: Arc<Mutex<Isaac64Rng>>,
backend_metadata: CacheBackendMetadata<'life4>,
) -> Pin<Box<dyn Future<Output = Result<Duration, Error>> + Send + 'async_trait>>where
Self: 'async_trait,
'life0: 'async_trait,
'life1: 'async_trait,
'life2: 'async_trait,
'life3: 'async_trait,
'life4: 'async_trait,
Returns the total of model execution time.