← Back

Module serve

struct ServerConfig

Source: serve.joule:31

fn default() -> Self

Source: serve.joule:57

struct CorsConfig

Source: serve.joule:76

fn permissive() -> Self

Source: serve.joule:84

struct TlsConfig

Source: serve.joule:96

struct RateLimitConfig

Source: serve.joule:103

struct EnergyTrackingConfig

Source: serve.joule:116

fn default() -> Self

Source: serve.joule:132

struct SloConfig

Source: serve.joule:146

fn default() -> Self

Source: serve.joule:162

struct CompletionRequest

Source: serve.joule:180

struct CompletionResponse

Source: serve.joule:205

struct CompletionChoice

Source: serve.joule:224

struct UsageStats

Source: serve.joule:232

struct EnergyUsage

Source: serve.joule:240

struct ChatMessage

Source: serve.joule:255

struct ChatCompletionRequest

Source: serve.joule:262

struct ChatCompletionResponse

Source: serve.joule:277

struct ChatChoice

Source: serve.joule:289

struct StreamChunk

Source: serve.joule:297

struct StreamChoice

Source: serve.joule:307

struct LoadedModel

Loaded model entry

Source: serve.joule:318

struct ModelVersion

Source: serve.joule:333

struct ModelRegistry

Model registry for managing multiple models

Source: serve.joule:342

fn new() -> Self

Source: serve.joule:349

fn get_engine(&self, model_id: &str) -> Option<Arc<Engine>>

Source: serve.joule:357

fn list_models(&self) -> Vec<String>

Source: serve.joule:362

struct ServerMetrics

Source: serve.joule:374

struct SloCompliance

Source: serve.joule:407

struct MetricsCollector

Metrics collector

Source: serve.joule:418

fn new() -> Self

Source: serve.joule:438

fn record_request(...)

Source: serve.joule:451

fn compute_metrics(&self, slo: &SloConfig, active_requests: usize) -> ServerMetrics

Source: serve.joule:506

fn percentile(values: &[Duration], p: f64) -> Duration

Source: serve.joule:603

fn average_duration(values: &[Duration]) -> Duration

Source: serve.joule:613

enum ServeError

Source: serve.joule:627

fn from(e: InferenceError) -> Self

Source: serve.joule:638

struct Server

Model server

Source: serve.joule:644

fn new(config: ServerConfig) -> Self

Creates a new server from the given configuration.

Source: serve.joule:654

fn unload_model(&self, model_id: &str) -> Result<(), ServeError>

Unloads the model identified by model_id, returning a ServeError on failure.

Source: serve.joule:721

fn list_models(&self) -> Vec<ModelInfo>

Lists the loaded models.

Source: serve.joule:729

fn metrics(&self) -> ServerMetrics

Returns the server metrics.

Source: serve.joule:735

fn stop(&self)

Stops the server.

Source: serve.joule:1019

fn health(&self) -> HealthStatus

Performs a health check and returns the resulting HealthStatus.

Source: serve.joule:1024

fn format_chat_prompt(&self, messages: &[ChatMessage]) -> String

Source: serve.joule:1038

struct HealthStatus

Source: serve.joule:1058

fn estimate_request_energy(...)

Returns an energy cost estimate for a request.

Source: serve.joule:1111