backie/src/worker_pool.rs

271 lines
7.3 KiB
Rust
Raw Normal View History

use crate::diesel::r2d2;
use crate::diesel::PgConnection;
2021-06-23 10:48:03 +00:00
use crate::executor::Executor;
use crate::executor::RetentionMode;
use crate::executor::SleepParams;
use crate::queue::Queue;
use log::error;
use log::info;
2021-06-23 10:48:03 +00:00
use std::thread;
2021-06-24 05:23:02 +00:00
/// A fixed-size group of workers sharing one Postgres connection pool.
pub struct WorkerPool {
    /// Number of worker threads spawned by `start`.
    pub number_of_workers: u32,
    /// Optional executor settings; each spawned worker receives its own clone.
    pub worker_params: WorkerParams,
    /// r2d2 pool that every worker thread takes its connection from.
    pub connection_pool: r2d2::Pool<r2d2::ConnectionManager<PgConnection>>,
}
2021-06-24 05:23:02 +00:00
pub struct WorkerThread {
2021-06-23 10:48:03 +00:00
pub name: String,
pub worker_params: WorkerParams,
2021-06-23 10:48:03 +00:00
pub restarts: u64,
pub connection_pool: r2d2::Pool<r2d2::ConnectionManager<PgConnection>>,
2021-06-23 10:48:03 +00:00
}
#[derive(Clone)]
pub struct WorkerParams {
pub retention_mode: Option<RetentionMode>,
pub sleep_params: Option<SleepParams>,
pub task_type: Option<String>,
}
impl Default for WorkerParams {
fn default() -> Self {
Self::new()
}
}
impl WorkerParams {
pub fn new() -> Self {
Self {
retention_mode: None,
sleep_params: None,
task_type: None,
}
}
pub fn set_retention_mode(&mut self, retention_mode: RetentionMode) {
self.retention_mode = Some(retention_mode);
}
pub fn set_sleep_params(&mut self, sleep_params: SleepParams) {
self.sleep_params = Some(sleep_params);
}
pub fn set_task_type(&mut self, task_type: String) {
self.task_type = Some(task_type);
}
}
2021-06-23 10:48:03 +00:00
impl WorkerPool {
pub fn new(number_of_workers: u32) -> Self {
let worker_params = WorkerParams::new();
let connection_pool = Queue::connection_pool(number_of_workers);
2021-06-23 10:48:03 +00:00
Self {
number_of_workers,
worker_params,
connection_pool,
}
}
pub fn new_with_params(number_of_workers: u32, worker_params: WorkerParams) -> Self {
let connection_pool = Queue::connection_pool(number_of_workers);
Self {
number_of_workers,
worker_params,
connection_pool,
2021-06-23 10:48:03 +00:00
}
}
pub fn start(&self) {
for idx in 1..self.number_of_workers + 1 {
let worker_type = self
.worker_params
.task_type
.clone()
.unwrap_or_else(|| "".to_string());
let name = format!("worker_{}{}", worker_type, idx);
WorkerThread::spawn_in_pool(
self.worker_params.clone(),
name,
0,
self.connection_pool.clone(),
)
2021-06-23 10:48:03 +00:00
}
}
}
impl WorkerThread {
pub fn new(
worker_params: WorkerParams,
name: String,
restarts: u64,
connection_pool: r2d2::Pool<r2d2::ConnectionManager<PgConnection>>,
) -> Self {
Self {
name,
worker_params,
restarts,
connection_pool,
}
2021-06-23 10:48:03 +00:00
}
pub fn spawn_in_pool(
worker_params: WorkerParams,
name: String,
restarts: u64,
connection_pool: r2d2::Pool<r2d2::ConnectionManager<PgConnection>>,
) {
2021-06-23 11:32:21 +00:00
let builder = thread::Builder::new().name(name.clone());
2021-06-23 10:48:03 +00:00
info!(
"starting a worker thread {}, number of restarts {}",
name, restarts
);
builder
.spawn(move || {
// when _job is dropped, it will be restarted (see Drop trait impl)
let _job = WorkerThread::new(
worker_params.clone(),
name,
restarts,
connection_pool.clone(),
);
match connection_pool.get() {
Ok(connection) => {
let mut executor = Executor::new(connection);
if let Some(task_type_str) = worker_params.task_type {
executor.set_task_type(task_type_str);
}
if let Some(retention_mode) = worker_params.retention_mode {
executor.set_retention_mode(retention_mode);
}
if let Some(sleep_params) = worker_params.sleep_params {
executor.set_sleep_params(sleep_params);
}
executor.run_tasks();
}
Err(error) => {
error!("Failed to get postgres connection: {:?}", error);
}
}
2021-06-23 10:48:03 +00:00
})
.unwrap();
}
}
impl Drop for WorkerThread {
fn drop(&mut self) {
WorkerThread::spawn_in_pool(
self.worker_params.clone(),
self.name.clone(),
self.restarts + 1,
self.connection_pool.clone(),
)
2021-06-23 10:48:03 +00:00
}
}
#[cfg(test)]
mod job_pool_tests {
    use super::WorkerParams;
    use super::WorkerPool;
    use crate::executor::Error;
    use crate::executor::RetentionMode;
    use crate::executor::Runnable;
    use crate::queue::Queue;
    use crate::queue::Task;
    use crate::schema::fang_tasks;
    use crate::typetag;
    use diesel::pg::PgConnection;
    use diesel::prelude::*;
    use serde::{Deserialize, Serialize};
    use std::thread;
    use std::time::Duration;

    /// Test task that remembers the name of the thread that constructed it.
    #[derive(Serialize, Deserialize)]
    struct MyJob {
        pub number: u16,
        pub current_thread_name: String,
    }

    impl MyJob {
        /// Builds a job tagged with the current thread's name.
        ///
        /// Panics when the current thread has no name.
        pub fn new(number: u16) -> Self {
            let handle = thread::current();
            let current_thread_name = handle.name().unwrap().to_string();

            Self {
                number,
                current_thread_name,
            }
        }
    }

    /// Loads every task whose type is `worker_pool_test`.
    fn get_all_tasks(conn: &PgConnection) -> Vec<Task> {
        fang_tasks::table
            .filter(fang_tasks::task_type.eq("worker_pool_test"))
            .get_results::<Task>(conn)
            .unwrap()
    }

    #[typetag::serde]
    impl Runnable for MyJob {
        /// Sleeps for three seconds, then pushes a follow-up job numbered one
        /// higher. The follow-up is built on the running thread, so it carries
        /// that thread's name.
        fn run(&self, connection: &PgConnection) -> Result<(), Error> {
            thread::sleep(Duration::from_secs(3));

            let new_job = MyJob::new(self.number + 1);

            Queue::push_task_query(connection, &new_job).unwrap();

            Ok(())
        }

        fn task_type(&self) -> String {
            "worker_pool_test".to_string()
        }
    }

    // this test is ignored because it commits data to the db
    #[test]
    #[ignore]
    fn tasks_are_split_between_two_threads() {
        let queue = Queue::new();

        let mut worker_params = WorkerParams::new();
        worker_params.set_retention_mode(RetentionMode::KeepAll);
        let job_pool = WorkerPool::new_with_params(2, worker_params);

        queue.push_task(&MyJob::new(100)).unwrap();
        queue.push_task(&MyJob::new(200)).unwrap();

        job_pool.start();

        thread::sleep(Duration::from_secs(100));

        let tasks = get_all_tasks(&queue.connection);

        assert!(tasks.len() > 40);

        // Counts the tasks whose serialized metadata mentions `thread_name`.
        // Borrowing via `iter()` avoids cloning the whole task list just to
        // count matches.
        let jobs_created_on = |thread_name: &str| {
            tasks
                .iter()
                .filter(|job| {
                    serde_json::to_string(&job.metadata)
                        .unwrap()
                        .contains(thread_name)
                })
                .count()
        };

        assert!(jobs_created_on("worker_1") > 20);
        assert!(jobs_created_on("worker_2") > 20);
    }
}