use std::sync::Arc;
use axum::routing::{get, post};
use axum::Router;
use crate::admin;
use crate::auth::{auth_middleware, ApiKeys};
use crate::batch;
use crate::batch_spool;
use crate::body_limit::body_limit_layer;
use crate::config::ServerConfig;
use crate::rate_limit::{per_key_rate_limit_middleware, rate_limit_middleware, RateLimiter};
use crate::routes;
use crate::state::AppState;
use crate::threads;
use crate::tracing_layer::tracing_middleware;
use crate::ws::ws_handler;
pub fn build_app(state: Arc<AppState>) -> Router {
Router::new()
.route("/v1/chat/completions", post(routes::chat::chat_completions))
.route("/v1/completions", post(routes::completions::completions))
.route("/v1/embeddings", post(routes::embeddings::embeddings))
.route("/v1/models", get(routes::models::list_models))
.route("/health", get(routes::health::health))
.route("/v1/chat/ws", get(ws_handler))
.route(
"/v1/batches",
post(batch::create_batch).get(batch::list_batches),
)
.route("/v1/batches/{id}", get(batch::get_batch))
.route("/v1/batches/{id}/cancel", post(batch::cancel_batch))
.route(
"/v1/batch_jobs",
post(batch_spool::routes::create_batch).get(batch_spool::routes::list_batches),
)
.route("/v1/batch_jobs/{id}", get(batch_spool::routes::get_batch))
.route(
"/v1/batch_jobs/{id}/output",
get(batch_spool::routes::get_batch_output),
)
.route(
"/v1/batch_jobs/{id}/cancel",
post(batch_spool::routes::cancel_batch),
)
.route(
"/v1/files",
post(routes::files::create_file_handler).get(routes::files::list_files_handler),
)
.route(
"/v1/files/{file_id}",
get(routes::files::get_file_handler).delete(routes::files::delete_file_handler),
)
.route(
"/v1/files/{file_id}/content",
get(routes::files::get_file_content_handler),
)
.route("/v1/threads", post(threads::routes::create_thread_handler))
.route(
"/v1/threads/{thread_id}",
get(threads::routes::get_thread_handler),
)
.route(
"/v1/threads/{thread_id}/messages",
post(threads::routes::create_message_handler)
.get(threads::routes::list_messages_handler),
)
.route(
"/v1/threads/{thread_id}/runs",
post(threads::routes::create_run_handler),
)
.route(
"/v1/threads/{thread_id}/runs/{run_id}",
get(threads::routes::get_run_handler),
)
.route(
"/v1/threads/{thread_id}/runs/{run_id}/cancel",
post(threads::routes::cancel_run_handler),
)
.route(
"/v1/threads/{thread_id}/runs/{run_id}/steps",
get(threads::steps::list_steps_handler),
)
.route(
"/v1/threads/{thread_id}/runs/{run_id}/steps/{step_id}",
get(threads::steps::get_step_handler),
)
.route(
"/v1/responses",
post(routes::responses::create_response).get(routes::responses::list_responses),
)
.route("/v1/responses/{id}", get(routes::responses::get_response))
.route("/admin/models/load", post(admin::admin_load_model))
.route("/admin/models/unload", post(admin::admin_unload_model))
.route("/admin/models", get(admin::admin_list_models))
.route("/admin/stats", get(admin::admin_stats))
.route("/admin/health", get(admin::admin_health))
.route(
"/admin/loras",
post(admin::admin_register_lora).get(admin::admin_list_loras),
)
.route(
"/admin/loras/{name}",
axum::routing::delete(admin::admin_unregister_lora),
)
.with_state(state)
}
pub fn build_app_with_config(state: Arc<AppState>, config: &ServerConfig) -> Router {
let metrics = Arc::clone(&state.metrics);
let admin_auth = crate::admin::AdminAuth {
token: config.admin_bearer_token.clone(),
};
let mut app = Router::new()
.route("/v1/chat/completions", post(routes::chat::chat_completions))
.route("/v1/completions", post(routes::completions::completions))
.route("/v1/embeddings", post(routes::embeddings::embeddings))
.route("/v1/models", get(routes::models::list_models))
.route("/health", get(routes::health::health))
.route("/v1/chat/ws", get(ws_handler))
.route(
"/v1/batches",
post(batch::create_batch).get(batch::list_batches),
)
.route("/v1/batches/{id}", get(batch::get_batch))
.route("/v1/batches/{id}/cancel", post(batch::cancel_batch))
.route(
"/v1/batch_jobs",
post(batch_spool::routes::create_batch).get(batch_spool::routes::list_batches),
)
.route("/v1/batch_jobs/{id}", get(batch_spool::routes::get_batch))
.route(
"/v1/batch_jobs/{id}/output",
get(batch_spool::routes::get_batch_output),
)
.route(
"/v1/batch_jobs/{id}/cancel",
post(batch_spool::routes::cancel_batch),
)
.route(
"/v1/files",
post(routes::files::create_file_handler).get(routes::files::list_files_handler),
)
.route(
"/v1/files/{file_id}",
get(routes::files::get_file_handler).delete(routes::files::delete_file_handler),
)
.route(
"/v1/files/{file_id}/content",
get(routes::files::get_file_content_handler),
)
.route("/v1/threads", post(threads::routes::create_thread_handler))
.route(
"/v1/threads/{thread_id}",
get(threads::routes::get_thread_handler),
)
.route(
"/v1/threads/{thread_id}/messages",
post(threads::routes::create_message_handler)
.get(threads::routes::list_messages_handler),
)
.route(
"/v1/threads/{thread_id}/runs",
post(threads::routes::create_run_handler),
)
.route(
"/v1/threads/{thread_id}/runs/{run_id}",
get(threads::routes::get_run_handler),
)
.route(
"/v1/threads/{thread_id}/runs/{run_id}/cancel",
post(threads::routes::cancel_run_handler),
)
.route(
"/v1/threads/{thread_id}/runs/{run_id}/steps",
get(threads::steps::list_steps_handler),
)
.route(
"/v1/threads/{thread_id}/runs/{run_id}/steps/{step_id}",
get(threads::steps::get_step_handler),
)
.route(
"/v1/responses",
post(routes::responses::create_response).get(routes::responses::list_responses),
)
.route("/v1/responses/{id}", get(routes::responses::get_response))
.route("/admin/models/load", post(admin::admin_load_model))
.route("/admin/models/unload", post(admin::admin_unload_model))
.route("/admin/models", get(admin::admin_list_models))
.route("/admin/stats", get(admin::admin_stats))
.route("/admin/health", get(admin::admin_health))
.route(
"/admin/loras",
post(admin::admin_register_lora).get(admin::admin_list_loras),
)
.route(
"/admin/loras/{name}",
axum::routing::delete(admin::admin_unregister_lora),
);
if config.metrics_enabled {
app = app.route("/metrics", get(routes::metrics::metrics));
}
let mut app = app.with_state(Arc::clone(&state));
app = app.layer(axum::Extension(admin_auth));
if config.metrics_enabled {
app = app.layer(axum::Extension(metrics));
}
if config.structured_tracing {
app = app.layer(axum::middleware::from_fn(tracing_middleware));
}
if let Some(per_key_limiter) = state.per_key_rate_limiter.as_ref().cloned() {
app = app.layer(axum::middleware::from_fn_with_state(
per_key_limiter,
per_key_rate_limit_middleware,
));
}
if config.rate_limit_capacity > 0.0 {
let limiter = RateLimiter::new(config.rate_limit_capacity, config.rate_limit_rate);
app = app
.layer(axum::middleware::from_fn(rate_limit_middleware))
.layer(axum::Extension(limiter));
}
#[cfg(feature = "jwt")]
if let Some(jwt_config) = config.jwt.clone() {
use crate::jwt_auth::{jwt_auth_middleware, JwtVerifier};
let verifier = Arc::new(JwtVerifier::new(jwt_config));
app = app.layer(axum::middleware::from_fn_with_state(
verifier,
jwt_auth_middleware,
));
} else if !config.api_keys.is_empty() {
let keys = ApiKeys(Arc::new(config.api_keys.clone()));
app = app
.layer(axum::middleware::from_fn(auth_middleware))
.layer(axum::Extension(keys));
}
#[cfg(not(feature = "jwt"))]
if !config.api_keys.is_empty() {
let keys = ApiKeys(Arc::new(config.api_keys.clone()));
app = app
.layer(axum::middleware::from_fn(auth_middleware))
.layer(axum::Extension(keys));
}
if config.body_limit_bytes > 0 {
app = app.layer(body_limit_layer(config.body_limit_bytes));
}
app
}