mirror of
https://github.com/sigp/lighthouse.git
synced 2026-03-09 19:51:47 +00:00
217 lines
6.6 KiB
Rust
217 lines
6.6 KiB
Rust
//! This crate provides a HTTP server that is solely dedicated to serving the `/metrics` endpoint.
|
|
//!
|
|
//! For other endpoints, see the `http_api` crate.
|
|
|
|
use lighthouse_validator_store::LighthouseValidatorStore;
|
|
use lighthouse_version::version_with_platform;
|
|
use logging::crit;
|
|
use malloc_utils::scrape_allocator_metrics;
|
|
use parking_lot::RwLock;
|
|
use serde::{Deserialize, Serialize};
|
|
use slot_clock::{SlotClock, SystemTimeSlotClock};
|
|
use std::future::Future;
|
|
use std::net::{IpAddr, Ipv4Addr, SocketAddr};
|
|
use std::sync::Arc;
|
|
use std::time::{SystemTime, UNIX_EPOCH};
|
|
use tracing::info;
|
|
use types::EthSpec;
|
|
use validator_services::duties_service::DutiesService;
|
|
use warp::{Filter, http::Response};
|
|
|
|
#[derive(Debug)]
|
|
pub enum Error {
|
|
Warp(#[allow(dead_code)] warp::Error),
|
|
Other(#[allow(dead_code)] String),
|
|
}
|
|
|
|
impl From<warp::Error> for Error {
|
|
fn from(e: warp::Error) -> Self {
|
|
Error::Warp(e)
|
|
}
|
|
}
|
|
|
|
impl From<String> for Error {
|
|
fn from(e: String) -> Self {
|
|
Error::Other(e)
|
|
}
|
|
}
|
|
|
|
type ValidatorStore<E> = LighthouseValidatorStore<SystemTimeSlotClock, E>;
|
|
|
|
/// Contains objects which have shared access from inside/outside of the metrics server.
|
|
pub struct Shared<E> {
|
|
pub validator_store: Option<Arc<ValidatorStore<E>>>,
|
|
pub duties_service: Option<Arc<DutiesService<ValidatorStore<E>, SystemTimeSlotClock>>>,
|
|
pub genesis_time: Option<u64>,
|
|
}
|
|
|
|
/// A wrapper around all the items required to spawn the HTTP server.
|
|
///
|
|
/// The server will gracefully handle the case where any fields are `None`.
|
|
pub struct Context<E> {
|
|
pub config: Config,
|
|
pub shared: RwLock<Shared<E>>,
|
|
}
|
|
|
|
/// Configuration for the HTTP server.
|
|
#[derive(PartialEq, Debug, Clone, Serialize, Deserialize)]
|
|
pub struct Config {
|
|
pub enabled: bool,
|
|
pub listen_addr: IpAddr,
|
|
pub listen_port: u16,
|
|
pub allow_origin: Option<String>,
|
|
pub allocator_metrics_enabled: bool,
|
|
}
|
|
|
|
impl Default for Config {
|
|
fn default() -> Self {
|
|
Self {
|
|
enabled: false,
|
|
listen_addr: IpAddr::V4(Ipv4Addr::new(127, 0, 0, 1)),
|
|
listen_port: 5064,
|
|
allow_origin: None,
|
|
allocator_metrics_enabled: true,
|
|
}
|
|
}
|
|
}
|
|
|
|
/// Creates a server that will serve requests using information from `ctx`.
|
|
///
|
|
/// The server will shut down gracefully when the `shutdown` future resolves.
|
|
///
|
|
/// ## Returns
|
|
///
|
|
/// This function will bind the server to the provided address and then return a tuple of:
|
|
///
|
|
/// - `SocketAddr`: the address that the HTTP server will listen on.
|
|
/// - `Future`: the actual server future that will need to be awaited.
|
|
///
|
|
/// ## Errors
|
|
///
|
|
/// Returns an error if the server is unable to bind or there is another error during
|
|
/// configuration.
|
|
pub fn serve<E: EthSpec>(
|
|
ctx: Arc<Context<E>>,
|
|
shutdown: impl Future<Output = ()> + Send + Sync + 'static,
|
|
) -> Result<(SocketAddr, impl Future<Output = ()>), Error> {
|
|
let config = &ctx.config;
|
|
|
|
// Configure CORS.
|
|
let cors_builder = {
|
|
let builder = warp::cors()
|
|
.allow_method("GET")
|
|
.allow_headers(vec!["Content-Type"]);
|
|
|
|
warp_utils::cors::set_builder_origins(
|
|
builder,
|
|
config.allow_origin.as_deref(),
|
|
(config.listen_addr, config.listen_port),
|
|
)?
|
|
};
|
|
|
|
// Sanity check.
|
|
if !config.enabled {
|
|
crit!("Cannot start disabled metrics HTTP server");
|
|
return Err(Error::Other(
|
|
"A disabled metrics server should not be started".to_string(),
|
|
));
|
|
}
|
|
|
|
let inner_ctx = ctx.clone();
|
|
let routes = warp::get()
|
|
.and(warp::path("metrics"))
|
|
.map(move || inner_ctx.clone())
|
|
.and_then(|ctx: Arc<Context<E>>| async move {
|
|
Ok::<_, warp::Rejection>(
|
|
gather_prometheus_metrics(&ctx)
|
|
.map(|body| {
|
|
Response::builder()
|
|
.status(200)
|
|
.header("Content-Type", "text/plain")
|
|
.body(body)
|
|
.unwrap()
|
|
})
|
|
.unwrap_or_else(|e| {
|
|
Response::builder()
|
|
.status(500)
|
|
.header("Content-Type", "text/plain")
|
|
.body(format!("Unable to gather metrics: {:?}", e))
|
|
.unwrap()
|
|
}),
|
|
)
|
|
})
|
|
// Add a `Server` header.
|
|
.map(|reply| warp::reply::with_header(reply, "Server", &version_with_platform()))
|
|
.with(cors_builder.build());
|
|
|
|
let (listening_socket, server) = warp::serve(routes).try_bind_with_graceful_shutdown(
|
|
SocketAddr::new(config.listen_addr, config.listen_port),
|
|
async {
|
|
shutdown.await;
|
|
},
|
|
)?;
|
|
|
|
info!(
|
|
listen_address = listening_socket.to_string(),
|
|
"Metrics HTTP server started"
|
|
);
|
|
|
|
Ok((listening_socket, server))
|
|
}
|
|
|
|
pub fn gather_prometheus_metrics<E: EthSpec>(
|
|
ctx: &Context<E>,
|
|
) -> std::result::Result<String, String> {
|
|
use validator_metrics::*;
|
|
let mut buffer = vec![];
|
|
let encoder = TextEncoder::new();
|
|
|
|
{
|
|
let shared = ctx.shared.read();
|
|
|
|
if let Some(genesis_time) = shared.genesis_time
|
|
&& let Ok(now) = SystemTime::now().duration_since(UNIX_EPOCH)
|
|
{
|
|
let distance = now.as_secs() as i64 - genesis_time as i64;
|
|
set_gauge(&GENESIS_DISTANCE, distance);
|
|
}
|
|
|
|
if let Some(duties_service) = &shared.duties_service
|
|
&& let Some(slot) = duties_service.slot_clock.now()
|
|
{
|
|
let current_epoch = slot.epoch(E::slots_per_epoch());
|
|
let next_epoch = current_epoch + 1;
|
|
|
|
set_int_gauge(
|
|
&PROPOSER_COUNT,
|
|
&[CURRENT_EPOCH],
|
|
duties_service.proposer_count(current_epoch) as i64,
|
|
);
|
|
set_int_gauge(
|
|
&ATTESTER_COUNT,
|
|
&[CURRENT_EPOCH],
|
|
duties_service.attester_count(current_epoch) as i64,
|
|
);
|
|
set_int_gauge(
|
|
&ATTESTER_COUNT,
|
|
&[NEXT_EPOCH],
|
|
duties_service.attester_count(next_epoch) as i64,
|
|
);
|
|
}
|
|
}
|
|
|
|
// It's important to ensure these metrics are explicitly enabled in the case that users aren't
|
|
// using glibc and this function causes panics.
|
|
if ctx.config.allocator_metrics_enabled {
|
|
scrape_allocator_metrics();
|
|
}
|
|
|
|
health_metrics::metrics::scrape_health_metrics();
|
|
|
|
encoder
|
|
.encode(&metrics::gather(), &mut buffer)
|
|
.map_err(|e| format!("{e:?}"))?;
|
|
|
|
String::from_utf8(buffer).map_err(|e| format!("Failed to encode prometheus info: {:?}", e))
|
|
}
|