Backend: - migrations/003_jobs_scheduling.sql: retry_next_at/last_error columns, pg_notify trigger for immediate job dispatch, retry index - pm-agent-client: ApplyPatchesRequest/Response, AgentJobStatus, RollbackResponse types; apply_patches/job_status/rollback_job client methods + generic POST helper - pm-core/models: JobStatus, JobKind, PatchJob, PatchJobHost, CreateJobRequest, PatchJobSummary - pm-web/routes/jobs.rs: POST/GET /api/v1/jobs, GET /jobs/:id, POST /jobs/:id/cancel, POST /jobs/:id/rollback - pm-worker/job_executor.rs: NOTIFY listener, periodic scanner, execute_host_job, poll_running_jobs, handle_host_failure (3-retry exponential backoff 1m/5m/30m), sync_job_status, retry_pending_jobs - pm-worker/main.rs: spawn job_executor Frontend: - types/index.ts: PatchInfo, PatchJobHost, PatchJob, PatchJobSummary, CreateJobRequest interfaces - api/client.ts: jobsApi (list/get/create/cancel/rollback), patchesApi (getHostPatches) - pages/PatchDeploymentPage.tsx: 3-step MUI Stepper (host select → configure → result) - pages/JobsPage.tsx: job list table, expandable per-host detail, cancel/rollback actions with confirm dialog, load-more pagination - App.tsx: /jobs and /deployment routes wired to real pages cargo check: 0 errors | vite build: 0 errors
528 lines
18 KiB
Rust
528 lines
18 KiB
Rust
//! Host management routes.
|
|
//!
|
|
//! GET /api/v1/hosts — list hosts (RBAC scoped)
|
|
//! POST /api/v1/hosts — register new host (admin only)
|
|
//! GET /api/v1/hosts/{id} — get host detail
|
|
//! DELETE /api/v1/hosts/{id} — remove host (admin only)
|
|
//! GET /api/v1/hosts/{id}/groups — list groups for host
|
|
//! POST /api/v1/hosts/{id}/groups — assign host to group
|
|
//! DELETE /api/v1/hosts/{id}/groups/{group_id} — remove host from group
|
|
//! POST /api/v1/hosts/{id}/refresh — queue on-demand refresh (operator+)
|
|
|
|
use axum::{
|
|
extract::{Path, Query, State},
|
|
http::StatusCode,
|
|
response::Json,
|
|
routing::{delete, get, post},
|
|
Router,
|
|
};
|
|
use pm_core::{
|
|
audit::{log_event, AuditAction},
|
|
models::{
|
|
CreateHostRequest, HostSummary, Group,
|
|
},
|
|
};
|
|
use pm_auth::rbac::AuthUser;
|
|
use serde::{Deserialize, Serialize};
|
|
use serde_json::{json, Value};
|
|
use uuid::Uuid;
|
|
|
|
use crate::AppState;
|
|
|
|
pub fn router() -> Router<AppState> {
|
|
Router::new()
|
|
.route("/", get(list_hosts).post(register_host))
|
|
.route("/:id", get(get_host).delete(remove_host))
|
|
.route("/:id/groups", get(list_host_groups).post(add_host_to_group))
|
|
.route("/:id/groups/:group_id", delete(remove_host_from_group))
|
|
.route("/:id/refresh", post(refresh_host))
|
|
}
|
|
|
|
// ── Query params ─────────────────────────────────────────────────────────────
|
|
|
|
#[derive(Debug, Deserialize)]
|
|
pub struct HostListQuery {
|
|
pub group_id: Option<Uuid>,
|
|
pub health_status: Option<String>,
|
|
pub os_family: Option<String>,
|
|
pub search: Option<String>,
|
|
pub limit: Option<i64>,
|
|
pub offset: Option<i64>,
|
|
}
|
|
|
|
// ── Response types ────────────────────────────────────────────────────────────
|
|
|
|
#[derive(Debug, Serialize)]
|
|
struct HostListResponse {
|
|
hosts: Vec<HostSummary>,
|
|
total: i64,
|
|
limit: i64,
|
|
offset: i64,
|
|
}
|
|
|
|
// ── Helper: check if operator can access a host ───────────────────────────────
|
|
|
|
async fn operator_can_access_host(
|
|
pool: &sqlx::PgPool,
|
|
user_id: Uuid,
|
|
host_id: Uuid,
|
|
) -> Result<bool, sqlx::Error> {
|
|
// Admins can access all; operators can access hosts in their groups
|
|
// OR ungrouped hosts (no group memberships)
|
|
let in_group: bool = sqlx::query_scalar(
|
|
r#"
|
|
SELECT EXISTS (
|
|
SELECT 1 FROM host_groups hg
|
|
JOIN user_groups ug ON ug.group_id = hg.group_id
|
|
WHERE hg.host_id = $1 AND ug.user_id = $2
|
|
)
|
|
"#,
|
|
)
|
|
.bind(host_id)
|
|
.bind(user_id)
|
|
.fetch_one(pool)
|
|
.await?;
|
|
|
|
if in_group {
|
|
return Ok(true);
|
|
}
|
|
|
|
// Ungrouped hosts are accessible to any operator
|
|
let ungrouped: bool = sqlx::query_scalar(
|
|
"SELECT NOT EXISTS (SELECT 1 FROM host_groups WHERE host_id = $1)",
|
|
)
|
|
.bind(host_id)
|
|
.fetch_one(pool)
|
|
.await?;
|
|
|
|
Ok(ungrouped)
|
|
}
|
|
|
|
// ── GET /api/v1/hosts ─────────────────────────────────────────────────────────
|
|
|
|
async fn list_hosts(
|
|
State(state): State<AppState>,
|
|
auth: AuthUser,
|
|
Query(q): Query<HostListQuery>,
|
|
) -> Result<Json<HostListResponse>, (StatusCode, Json<Value>)> {
|
|
let limit = q.limit.unwrap_or(50).min(200);
|
|
let offset = q.offset.unwrap_or(0);
|
|
|
|
// For operators: only show hosts in their groups (or ungrouped)
|
|
let hosts: Vec<HostSummary> = if auth.role.is_admin() {
|
|
sqlx::query_as(
|
|
r#"
|
|
SELECT id, fqdn, ip_address::text AS ip_address, display_name,
|
|
os_family, os_name, health_status, agent_version, registered_at
|
|
FROM hosts
|
|
ORDER BY fqdn
|
|
LIMIT $1 OFFSET $2
|
|
"#,
|
|
)
|
|
.bind(limit)
|
|
.bind(offset)
|
|
.fetch_all(&state.db)
|
|
.await
|
|
} else {
|
|
sqlx::query_as(
|
|
r#"
|
|
SELECT DISTINCT h.id, h.fqdn, h.ip_address::text AS ip_address,
|
|
h.display_name, h.os_family, h.os_name,
|
|
h.health_status, h.agent_version, h.registered_at
|
|
FROM hosts h
|
|
WHERE
|
|
-- Hosts in operator's groups
|
|
EXISTS (
|
|
SELECT 1 FROM host_groups hg
|
|
JOIN user_groups ug ON ug.group_id = hg.group_id
|
|
WHERE hg.host_id = h.id AND ug.user_id = $3
|
|
)
|
|
-- OR ungrouped hosts
|
|
OR NOT EXISTS (SELECT 1 FROM host_groups WHERE host_id = h.id)
|
|
ORDER BY h.fqdn
|
|
LIMIT $1 OFFSET $2
|
|
"#,
|
|
)
|
|
.bind(limit)
|
|
.bind(offset)
|
|
.bind(auth.user_id)
|
|
.fetch_all(&state.db)
|
|
.await
|
|
}
|
|
.map_err(|e| {
|
|
tracing::error!(error = %e, "Failed to list hosts");
|
|
(
|
|
StatusCode::INTERNAL_SERVER_ERROR,
|
|
Json(json!({ "error": { "code": "internal_error", "message": "Database error" } })),
|
|
)
|
|
})?;
|
|
|
|
let total: i64 = sqlx::query_scalar("SELECT COUNT(*) FROM hosts")
|
|
.fetch_one(&state.db)
|
|
.await
|
|
.unwrap_or(0);
|
|
|
|
Ok(Json(HostListResponse { hosts, total, limit, offset }))
|
|
}
|
|
|
|
// ── POST /api/v1/hosts ────────────────────────────────────────────────────────
|
|
|
|
async fn register_host(
|
|
State(state): State<AppState>,
|
|
auth: AuthUser,
|
|
Json(req): Json<CreateHostRequest>,
|
|
) -> Result<Json<Value>, (StatusCode, Json<Value>)> {
|
|
// Admin only
|
|
if !auth.role.is_admin() {
|
|
return Err((
|
|
StatusCode::FORBIDDEN,
|
|
Json(json!({ "error": { "code": "forbidden", "message": "Admin role required" } })),
|
|
));
|
|
}
|
|
|
|
// Resolve FQDN to IP address
|
|
let ip_address = resolve_fqdn(&req.fqdn).await.map_err(|e| {
|
|
(
|
|
StatusCode::BAD_REQUEST,
|
|
Json(json!({ "error": { "code": "fqdn_resolution_failed", "message": e } })),
|
|
)
|
|
})?;
|
|
|
|
let display_name = req.display_name.clone().unwrap_or_else(|| req.fqdn.clone());
|
|
let agent_port = req.agent_port.unwrap_or(12443);
|
|
let notes = req.notes.clone().unwrap_or_default();
|
|
|
|
// Insert host
|
|
let host_id: Uuid = sqlx::query_scalar(
|
|
r#"
|
|
INSERT INTO hosts (fqdn, ip_address, display_name, agent_port, notes)
|
|
VALUES ($1, $2::inet, $3, $4, $5)
|
|
RETURNING id
|
|
"#,
|
|
)
|
|
.bind(&req.fqdn)
|
|
.bind(&ip_address)
|
|
.bind(&display_name)
|
|
.bind(agent_port)
|
|
.bind(¬es)
|
|
.fetch_one(&state.db)
|
|
.await
|
|
.map_err(|e| {
|
|
let msg = if e.to_string().contains("unique") {
|
|
"Host with this FQDN and IP already exists".to_string()
|
|
} else {
|
|
"Database error".to_string()
|
|
};
|
|
tracing::error!(error = %e, "Failed to register host");
|
|
(
|
|
StatusCode::CONFLICT,
|
|
Json(json!({ "error": { "code": "conflict", "message": msg } })),
|
|
)
|
|
})?;
|
|
|
|
// Assign to groups if specified
|
|
if let Some(group_ids) = &req.group_ids {
|
|
for gid in group_ids {
|
|
let _ = sqlx::query(
|
|
"INSERT INTO host_groups (host_id, group_id) VALUES ($1, $2) ON CONFLICT DO NOTHING",
|
|
)
|
|
.bind(host_id)
|
|
.bind(gid)
|
|
.execute(&state.db)
|
|
.await;
|
|
}
|
|
}
|
|
|
|
// Audit log
|
|
log_event(
|
|
&state.db,
|
|
AuditAction::HostRegistered,
|
|
Some(auth.user_id),
|
|
Some(&auth.username),
|
|
Some("host"),
|
|
Some(&host_id.to_string()),
|
|
json!({ "fqdn": req.fqdn, "ip": ip_address }),
|
|
None,
|
|
None,
|
|
).await;
|
|
|
|
tracing::info!(host_id = %host_id, fqdn = %req.fqdn, "Host registered");
|
|
Ok(Json(json!({ "id": host_id, "message": "Host registered" })))
|
|
}
|
|
|
|
// ── GET /api/v1/hosts/:id ─────────────────────────────────────────────────────
|
|
|
|
async fn get_host(
|
|
State(state): State<AppState>,
|
|
auth: AuthUser,
|
|
Path(id): Path<Uuid>,
|
|
) -> Result<Json<Value>, (StatusCode, Json<Value>)> {
|
|
if !auth.role.is_admin() {
|
|
let can_access = operator_can_access_host(&state.db, auth.user_id, id)
|
|
.await
|
|
.unwrap_or(false);
|
|
if !can_access {
|
|
return Err((
|
|
StatusCode::FORBIDDEN,
|
|
Json(json!({ "error": { "code": "forbidden", "message": "Access denied" } })),
|
|
));
|
|
}
|
|
}
|
|
|
|
let host: Option<Value> = sqlx::query_scalar(
|
|
r#"
|
|
SELECT row_to_json(h) FROM (
|
|
SELECT id, fqdn, ip_address::text AS ip_address, display_name,
|
|
os_family, os_name, arch, agent_version, health_status,
|
|
last_health_at, last_patch_at, agent_port, notes,
|
|
registered_at, updated_at
|
|
FROM hosts WHERE id = $1
|
|
) h
|
|
"#,
|
|
)
|
|
.bind(id)
|
|
.fetch_optional(&state.db)
|
|
.await
|
|
.map_err(|e| {
|
|
tracing::error!(error = %e, "Failed to get host");
|
|
(
|
|
StatusCode::INTERNAL_SERVER_ERROR,
|
|
Json(json!({ "error": { "code": "internal_error", "message": "Database error" } })),
|
|
)
|
|
})?;
|
|
|
|
host.map(Json).ok_or_else(|| (
|
|
StatusCode::NOT_FOUND,
|
|
Json(json!({ "error": { "code": "not_found", "message": "Host not found" } })),
|
|
))
|
|
}
|
|
|
|
// ── DELETE /api/v1/hosts/:id ──────────────────────────────────────────────────
|
|
|
|
async fn remove_host(
|
|
State(state): State<AppState>,
|
|
auth: AuthUser,
|
|
Path(id): Path<Uuid>,
|
|
) -> Result<Json<Value>, (StatusCode, Json<Value>)> {
|
|
if !auth.role.is_admin() {
|
|
return Err((
|
|
StatusCode::FORBIDDEN,
|
|
Json(json!({ "error": { "code": "forbidden", "message": "Admin role required" } })),
|
|
));
|
|
}
|
|
|
|
// Fetch FQDN for audit before deletion
|
|
let fqdn: Option<String> = sqlx::query_scalar("SELECT fqdn FROM hosts WHERE id = $1")
|
|
.bind(id)
|
|
.fetch_optional(&state.db)
|
|
.await
|
|
.unwrap_or(None);
|
|
|
|
let result = sqlx::query("DELETE FROM hosts WHERE id = $1")
|
|
.bind(id)
|
|
.execute(&state.db)
|
|
.await
|
|
.map_err(|e| {
|
|
tracing::error!(error = %e, "Failed to remove host");
|
|
(
|
|
StatusCode::INTERNAL_SERVER_ERROR,
|
|
Json(json!({ "error": { "code": "internal_error", "message": "Database error" } })),
|
|
)
|
|
})?;
|
|
|
|
if result.rows_affected() == 0 {
|
|
return Err((
|
|
StatusCode::NOT_FOUND,
|
|
Json(json!({ "error": { "code": "not_found", "message": "Host not found" } })),
|
|
));
|
|
}
|
|
|
|
log_event(
|
|
&state.db,
|
|
AuditAction::HostRemoved,
|
|
Some(auth.user_id),
|
|
Some(&auth.username),
|
|
Some("host"),
|
|
Some(&id.to_string()),
|
|
json!({ "fqdn": fqdn }),
|
|
None,
|
|
None,
|
|
).await;
|
|
|
|
tracing::info!(host_id = %id, "Host removed");
|
|
Ok(Json(json!({ "message": "Host removed" })))
|
|
}
|
|
|
|
// ── GET /api/v1/hosts/:id/groups ──────────────────────────────────────────────
|
|
|
|
async fn list_host_groups(
|
|
State(state): State<AppState>,
|
|
auth: AuthUser,
|
|
Path(id): Path<Uuid>,
|
|
) -> Result<Json<Vec<Group>>, (StatusCode, Json<Value>)> {
|
|
if !auth.role.is_admin() {
|
|
let can_access = operator_can_access_host(&state.db, auth.user_id, id)
|
|
.await.unwrap_or(false);
|
|
if !can_access {
|
|
return Err((StatusCode::FORBIDDEN,
|
|
Json(json!({ "error": { "code": "forbidden", "message": "Access denied" } }))));
|
|
}
|
|
}
|
|
|
|
let groups: Vec<Group> = sqlx::query_as(
|
|
r#"SELECT g.id, g.name, g.description, g.created_at, g.updated_at
|
|
FROM groups g
|
|
JOIN host_groups hg ON hg.group_id = g.id
|
|
WHERE hg.host_id = $1
|
|
ORDER BY g.name"#,
|
|
)
|
|
.bind(id)
|
|
.fetch_all(&state.db)
|
|
.await
|
|
.map_err(|e| {
|
|
tracing::error!(error = %e, "Failed to list host groups");
|
|
(StatusCode::INTERNAL_SERVER_ERROR,
|
|
Json(json!({ "error": { "code": "internal_error", "message": "Database error" } })))
|
|
})?;
|
|
|
|
Ok(Json(groups))
|
|
}
|
|
|
|
// ── POST /api/v1/hosts/:id/groups ─────────────────────────────────────────────
|
|
|
|
#[derive(Debug, Deserialize)]
|
|
struct AddToGroupRequest { group_id: Uuid }
|
|
|
|
async fn add_host_to_group(
|
|
State(state): State<AppState>,
|
|
auth: AuthUser,
|
|
Path(id): Path<Uuid>,
|
|
Json(req): Json<AddToGroupRequest>,
|
|
) -> Result<Json<Value>, (StatusCode, Json<Value>)> {
|
|
if !auth.role.is_admin() {
|
|
return Err((StatusCode::FORBIDDEN,
|
|
Json(json!({ "error": { "code": "forbidden", "message": "Admin role required" } }))));
|
|
}
|
|
|
|
sqlx::query(
|
|
"INSERT INTO host_groups (host_id, group_id) VALUES ($1, $2) ON CONFLICT DO NOTHING",
|
|
)
|
|
.bind(id)
|
|
.bind(req.group_id)
|
|
.execute(&state.db)
|
|
.await
|
|
.map_err(|e| {
|
|
tracing::error!(error = %e, "Failed to add host to group");
|
|
(StatusCode::INTERNAL_SERVER_ERROR,
|
|
Json(json!({ "error": { "code": "internal_error", "message": "Database error" } })))
|
|
})?;
|
|
|
|
log_event(&state.db, AuditAction::GroupMembershipChanged,
|
|
Some(auth.user_id), Some(&auth.username), Some("host"), Some(&id.to_string()),
|
|
json!({ "group_id": req.group_id, "action": "added" }), None, None).await;
|
|
|
|
Ok(Json(json!({ "message": "Host added to group" })))
|
|
}
|
|
|
|
// ── DELETE /api/v1/hosts/:id/groups/:group_id ─────────────────────────────────
|
|
|
|
async fn remove_host_from_group(
|
|
State(state): State<AppState>,
|
|
auth: AuthUser,
|
|
Path((id, group_id)): Path<(Uuid, Uuid)>,
|
|
) -> Result<Json<Value>, (StatusCode, Json<Value>)> {
|
|
if !auth.role.is_admin() {
|
|
return Err((StatusCode::FORBIDDEN,
|
|
Json(json!({ "error": { "code": "forbidden", "message": "Admin role required" } }))));
|
|
}
|
|
|
|
sqlx::query("DELETE FROM host_groups WHERE host_id = $1 AND group_id = $2")
|
|
.bind(id).bind(group_id)
|
|
.execute(&state.db).await
|
|
.map_err(|e| {
|
|
tracing::error!(error = %e, "Failed to remove host from group");
|
|
(StatusCode::INTERNAL_SERVER_ERROR,
|
|
Json(json!({ "error": { "code": "internal_error", "message": "Database error" } })))
|
|
})?;
|
|
|
|
log_event(&state.db, AuditAction::GroupMembershipChanged,
|
|
Some(auth.user_id), Some(&auth.username), Some("host"), Some(&id.to_string()),
|
|
json!({ "group_id": group_id, "action": "removed" }), None, None).await;
|
|
|
|
Ok(Json(json!({ "message": "Host removed from group" })))
|
|
}
|
|
|
|
// ── FQDN resolution ───────────────────────────────────────────────────────────
|
|
|
|
/// Resolve an FQDN (or IP) to its primary IP address.
|
|
/// If the input is already a valid IP, returns it as-is.
|
|
async fn resolve_fqdn(fqdn: &str) -> Result<String, String> {
|
|
use std::net::ToSocketAddrs;
|
|
// Try direct IP parse first
|
|
if fqdn.parse::<std::net::IpAddr>().is_ok() {
|
|
return Ok(fqdn.to_string());
|
|
}
|
|
// DNS resolution
|
|
let addr = format!("{fqdn}:0");
|
|
match tokio::task::spawn_blocking(move || addr.to_socket_addrs()).await {
|
|
Ok(Ok(mut addrs)) => addrs
|
|
.next()
|
|
.map(|a| a.ip().to_string())
|
|
.ok_or_else(|| format!("No addresses found for {fqdn}")),
|
|
_ => Err(format!("Failed to resolve FQDN: {fqdn}")),
|
|
}
|
|
}
|
|
|
|
// ── POST /api/v1/hosts/:id/refresh ───────────────────────────────────────────
|
|
|
|
/// Queue an on-demand health + patch refresh for a single host.
|
|
///
|
|
/// Sends a PostgreSQL NOTIFY on the `refresh_requested` channel; the
|
|
/// pm-worker refresh listener picks this up and polls the host immediately.
|
|
/// Requires Operator or Admin role (any authenticated user).
|
|
async fn refresh_host(
|
|
State(state): State<AppState>,
|
|
_auth: AuthUser,
|
|
Path(id): Path<Uuid>,
|
|
) -> Result<(StatusCode, Json<Value>), (StatusCode, Json<Value>)> {
|
|
// Verify the host exists.
|
|
let exists: bool = sqlx::query_scalar("SELECT EXISTS(SELECT 1 FROM hosts WHERE id = $1)")
|
|
.bind(id)
|
|
.fetch_one(&state.db)
|
|
.await
|
|
.map_err(|e| {
|
|
tracing::error!(error = %e, %id, "refresh_host: db error checking host existence");
|
|
(
|
|
StatusCode::INTERNAL_SERVER_ERROR,
|
|
Json(json!({ "error": { "code": "internal_error", "message": "Database error" } })),
|
|
)
|
|
})?;
|
|
|
|
if !exists {
|
|
return Err((
|
|
StatusCode::NOT_FOUND,
|
|
Json(json!({ "error": { "code": "not_found", "message": "Host not found" } })),
|
|
));
|
|
}
|
|
|
|
// NOTIFY the worker's refresh listener.
|
|
sqlx::query("SELECT pg_notify('refresh_requested', $1)")
|
|
.bind(id.to_string())
|
|
.execute(&state.db)
|
|
.await
|
|
.map_err(|e| {
|
|
tracing::error!(error = %e, %id, "refresh_host: pg_notify failed");
|
|
(
|
|
StatusCode::INTERNAL_SERVER_ERROR,
|
|
Json(json!({ "error": { "code": "internal_error", "message": "Failed to queue refresh" } })),
|
|
)
|
|
})?;
|
|
|
|
tracing::info!(%id, "On-demand refresh queued");
|
|
|
|
Ok((
|
|
StatusCode::ACCEPTED,
|
|
Json(json!({ "message": "Refresh queued" })),
|
|
))
|
|
}
|