background-jobs/jobs-core/src/processor_map.rs
2024-02-04 23:35:47 -06:00

215 lines
6.9 KiB
Rust

use crate::{catch_unwind::catch_unwind, Job, JobError, JobInfo, ReturnJobInfo};
use serde_json::Value;
use std::{
collections::HashMap, future::Future, panic::AssertUnwindSafe, pin::Pin, sync::Arc,
time::Instant,
};
use tracing::{Instrument, Span};
use uuid::Uuid;
/// A generic function that processes a job
///
/// ProcessorMap stores these `ProcessFn` types that don't expose differences in Job types.
pub type ProcessFn<S> = Arc<
dyn Fn(Value, S) -> Pin<Box<dyn Future<Output = Result<(), JobError>> + Send>> + Send + Sync,
>;
pub type StateFn<S> = Arc<dyn Fn() -> S + Send + Sync>;
/// A type for storing the relationships between job names and the job itself
///
/// [`Job`]s must be registered with the `ProcessorMap` in the initialization phase of an
/// application before workers are spawned in order to handle queued jobs.
#[derive(Clone)]
pub struct ProcessorMap<S> {
inner: HashMap<String, ProcessFn<S>>,
state_fn: StateFn<S>,
}
/// A type for storing the relationships between job names and the job itself, with the
/// state pre-cached instead of being generated from the state function each time
///
/// [`Job`]s must be registered with the `ProcessorMap` in the initialization phase of an
/// application before workers are spawned in order to handle queued jobs.
#[derive(Clone)]
pub struct CachedProcessorMap<S> {
inner: HashMap<String, ProcessFn<S>>,
state: S,
}
impl<S> ProcessorMap<S>
where
S: Clone + 'static,
{
/// Intialize a `ProcessorMap`
///
/// The state passed into this method will be passed to all jobs executed through this
/// ProcessorMap. The state argument could be useful for containing a hook into something like
/// r2d2, or the address of an actor in an actix-based system.
pub fn new(state_fn: StateFn<S>) -> Self {
ProcessorMap {
inner: HashMap::new(),
state_fn,
}
}
/// Register a [`Job`] with this `ProcessorMap`.
///
/// `ProcessorMap`s are useless if no jobs are registerd before workers are spawned, so
/// make sure to register all your processors up-front.
pub fn register<J>(&mut self)
where
J: Job<State = S>,
{
self.inner.insert(
J::NAME.to_owned(),
Arc::new(move |value, state| crate::process::<J>(value, state)),
);
}
/// Initialize the State from the State Function
pub fn cached(&self) -> CachedProcessorMap<S> {
CachedProcessorMap {
inner: self.inner.clone(),
state: (self.state_fn)(),
}
}
/// Process a given job
///
/// This should not be called from outside implementations of a backgoround-jobs runtime. It is
/// intended for internal use.
pub async fn process(&self, job: JobInfo) -> ReturnJobInfo {
let span = job_span(&job);
let fut = async move {
let opt = self
.inner
.get(&job.name)
.map(|name| process(Arc::clone(name), (self.state_fn)(), job.clone()));
let res = if let Some(fut) = opt {
fut.await
} else {
let span = Span::current();
span.record(
"exception.message",
&tracing::field::display("Not registered"),
);
span.record(
"exception.details",
&tracing::field::display("Not registered"),
);
tracing::error!("Not registered");
ReturnJobInfo::unregistered(job.id)
};
res
};
fut.instrument(span).await
}
}
impl<S> CachedProcessorMap<S>
where
S: Clone + 'static,
{
/// Process a given job
///
/// This should not be called from outside implementations of a backgoround-jobs runtime. It is
/// intended for internal use.
pub async fn process(&self, job: JobInfo) -> ReturnJobInfo {
let span = job_span(&job);
let fut = async move {
let res = if let Some(name) = self.inner.get(&job.name) {
process(Arc::clone(name), self.state.clone(), job).await
} else {
let span = Span::current();
span.record(
"exception.message",
&tracing::field::display("Not registered"),
);
span.record(
"exception.details",
&tracing::field::display("Not registered"),
);
tracing::error!("Not registered");
ReturnJobInfo::unregistered(job.id)
};
res
};
fut.instrument(span).await
}
}
fn job_span(job: &JobInfo) -> Span {
tracing::info_span!(
"Job",
execution_id = tracing::field::display(&Uuid::now_v7()),
job.id = tracing::field::display(&job.id),
job.name = tracing::field::display(&job.name),
job.execution_time = tracing::field::Empty,
exception.message = tracing::field::Empty,
exception.details = tracing::field::Empty,
)
}
async fn process<S>(process_fn: ProcessFn<S>, state: S, job: JobInfo) -> ReturnJobInfo
where
S: Clone,
{
let args = job.args.clone();
let id = job.id;
let name = job.name.clone();
let queue = job.queue.clone();
let start = Instant::now();
let res = match std::panic::catch_unwind(AssertUnwindSafe(|| (process_fn)(args, state))) {
Ok(fut) => catch_unwind(fut).await,
Err(e) => Err(e),
};
let duration = start.elapsed();
let seconds = duration.as_micros() as f64 / 1_000_000_f64;
let span = Span::current();
span.record("job.execution_time", &tracing::field::display(&seconds));
metrics::histogram!("background-jobs.job.execution_time", "queue" => queue.clone(), "name" => name.clone()).record(seconds);
match res {
Ok(Ok(_)) => {
#[cfg(feature = "completion-logging")]
tracing::info!("Job {queue}: {name}-{id} completed");
ReturnJobInfo::pass(id)
}
Ok(Err(e)) => {
let display = format!("{e}");
span.record("exception.message", &tracing::field::display(&display));
let debug = format!("{e:?}");
span.record("exception.details", &tracing::field::display(&debug));
#[cfg(feature = "error-logging")]
tracing::warn!("Job {queue}: {name}-{id} errored");
ReturnJobInfo::fail(id)
}
Err(_) => {
span.record(
"exception.message",
&tracing::field::display("Job panicked"),
);
span.record(
"exception.details",
&tracing::field::display("Job panicked"),
);
#[cfg(feature = "error-logging")]
tracing::warn!("Job {queue}: {name}-{id} panicked");
ReturnJobInfo::fail(id)
}
}
}