List of all items
Structs
- mistralrs_for_server_builder::MistralRsForServerBuilder
- mistralrs_for_server_builder::ModelConfig
- mistralrs_server_router_builder::MistralRsServerRouterBuilder
- openai::ChatCompletionRequest
- openai::CompletionRequest
- openai::FunctionCalled
- openai::ImageGenerationRequest
- openai::JsonSchemaResponseFormat
- openai::Message
- openai::MessageContent
- openai::MessageInnerContent
- openai::ModelObject
- openai::ModelObjects
- openai::SpeechGenerationRequest
- openai::ToolCall
- streaming::BaseStreamer
Enums
- image_generation::ImageGenerationResponder
- openai::AudioResponseFormat
- openai::Grammar
- openai::ResponseFormat
- openai::StopTokens
- speech_generation::SpeechGenerationResponder
- streaming::DoneState
Functions
- chat_completion::chatcompletions
- chat_completion::create_streamer
- chat_completion::handle_error
- chat_completion::match_responses
- chat_completion::parse_request
- chat_completion::process_non_streaming_response
- completions::completions
- completions::create_streamer
- completions::handle_error
- completions::match_responses
- completions::parse_request
- completions::process_non_streaming_response
- handler_core::create_response_channel
- handler_core::send_request
- handler_core::send_request_with_model
- image_generation::handle_error
- image_generation::image_generation
- image_generation::match_responses
- image_generation::parse_request
- image_generation::process_non_streaming_response
- mistralrs_for_server_builder::configure_paged_attn_from_flags
- mistralrs_for_server_builder::get_bert_model
- openapi_doc::get_openapi_doc
- speech_generation::handle_error
- speech_generation::match_responses
- speech_generation::parse_request
- speech_generation::process_non_streaming_response
- speech_generation::speech_generation
- streaming::get_keep_alive_interval
- util::parse_audio_url
- util::parse_image_url
- util::validate_model_name
Type Aliases
- chat_completion::ChatCompletionOnChunkCallback
- chat_completion::ChatCompletionOnDoneCallback
- chat_completion::ChatCompletionResponder
- chat_completion::ChatCompletionStreamer
- completions::CompletionOnChunkCallback
- completions::CompletionOnDoneCallback
- completions::CompletionResponder
- completions::CompletionStreamer
- types::ExtractedMistralRsState
- types::OnChunkCallback
- types::OnDoneCallback
- types::SharedMistralRsState
Constants
- handler_core::DEFAULT_CHANNEL_BUFFER_SIZE
- mistralrs_for_server_builder::defaults::CHAT_TEMPLATE
- mistralrs_for_server_builder::defaults::CPU
- mistralrs_for_server_builder::defaults::DEVICE
- mistralrs_for_server_builder::defaults::ENABLE_SEARCH
- mistralrs_for_server_builder::defaults::INTERACTIVE_MODE
- mistralrs_for_server_builder::defaults::IN_SITU_QUANT
- mistralrs_for_server_builder::defaults::JINJA_EXPLICIT
- mistralrs_for_server_builder::defaults::LOG
- mistralrs_for_server_builder::defaults::MAX_SEQS
- mistralrs_for_server_builder::defaults::MODEL
- mistralrs_for_server_builder::defaults::NO_KV_CACHE
- mistralrs_for_server_builder::defaults::NUM_DEVICE_LAYERS
- mistralrs_for_server_builder::defaults::PAGED_ATTN
- mistralrs_for_server_builder::defaults::PAGED_ATTN_BLOCK_SIZE
- mistralrs_for_server_builder::defaults::PAGED_ATTN_CPU
- mistralrs_for_server_builder::defaults::PAGED_ATTN_CUDA
- mistralrs_for_server_builder::defaults::PAGED_ATTN_GPU_MEM
- mistralrs_for_server_builder::defaults::PAGED_ATTN_GPU_MEM_USAGE
- mistralrs_for_server_builder::defaults::PAGED_ATTN_METAL
- mistralrs_for_server_builder::defaults::PAGED_CACHE_TYPE
- mistralrs_for_server_builder::defaults::PAGED_CTXT_LEN
- mistralrs_for_server_builder::defaults::PREFIX_CACHE_N
- mistralrs_for_server_builder::defaults::PROMPT_CHUNKSIZE
- mistralrs_for_server_builder::defaults::SEARCH_BERT_MODEL
- mistralrs_for_server_builder::defaults::SEARCH_CALLBACK
- mistralrs_for_server_builder::defaults::SEED
- mistralrs_for_server_builder::defaults::TOKEN_SOURCE
- mistralrs_for_server_builder::defaults::TRUNCATE_SEQUENCE
- mistralrs_server_router_builder::DEFAULT_MAX_BODY_LIMIT
- streaming::DEFAULT_KEEP_ALIVE_INTERVAL_MS