tokio-concurrency

Tokio Concurrency Patterns

This skill provides advanced concurrency patterns for building scalable async applications with Tokio.

Fan-Out/Fan-In Pattern

Distribute work across multiple workers and collect results:

use futures::stream::{self, StreamExt};

pub async fn fan_out_fan_in<T, R>( items: Vec<T>, concurrency: usize, process: impl Fn(T) -> Pin<Box<dyn Future<Output = R> + Send>> + Send + Sync + 'static, ) -> Vec<R> where T: Send + 'static, R: Send + 'static, { stream::iter(items) .map(|item| process(item)) .buffer_unordered(concurrency) .collect() .await }

// Usage let results = fan_out_fan_in( items, 10, |item| Box::pin(async move { process_item(item).await }) ).await;

Pipeline Processing

Chain async processing stages:

use tokio::sync::mpsc;

pub struct Pipeline<T> { stages: Vec<Box<dyn Stage<T>>>, }

#[async_trait::async_trait] pub trait Stage<T>: Send { async fn process(&self, item: T) -> T; }

impl<T: Send + 'static> Pipeline<T> { pub fn new() -> Self { Self { stages: Vec::new() } }

pub fn add_stage&#x3C;S: Stage&#x3C;T> + 'static>(mut self, stage: S) -> Self {
    self.stages.push(Box::new(stage));
    self
}

pub async fn run(self, mut input: mpsc::Receiver&#x3C;T>) -> mpsc::Receiver&#x3C;T> {
    let (tx, rx) = mpsc::channel(100);

    tokio::spawn(async move {
        while let Some(mut item) = input.recv().await {
            // Process through all stages
            for stage in &#x26;self.stages {
                item = stage.process(item).await;
            }

            if tx.send(item).await.is_err() {
                break;
            }
        }
    });

    rx
}

}

// Usage let pipeline = Pipeline::new() .add_stage(ValidationStage) .add_stage(TransformStage) .add_stage(EnrichmentStage);

let output = pipeline.run(input_channel).await;

Rate Limiting

Control operation rate using token bucket or leaky bucket:

use tokio::time::{interval, Duration, Instant}; use tokio::sync::Semaphore; use std::sync::Arc;

pub struct RateLimiter { semaphore: Arc<Semaphore>, rate: usize, period: Duration, }

impl RateLimiter { pub fn new(rate: usize, period: Duration) -> Self { let limiter = Self { semaphore: Arc::new(Semaphore::new(rate)), rate, period, };

    // Refill tokens
    let semaphore = limiter.semaphore.clone();
    let rate = limiter.rate;
    let period = limiter.period;

    tokio::spawn(async move {
        let mut interval = interval(period);
        loop {
            interval.tick().await;
            // Add permits up to max
            for _ in 0..rate {
                if semaphore.available_permits() &#x3C; rate {
                    semaphore.add_permits(1);
                }
            }
        }
    });

    limiter
}

pub async fn acquire(&#x26;self) {
    self.semaphore.acquire().await.unwrap().forget();
}

}

// Usage let limiter = RateLimiter::new(100, Duration::from_secs(1));

for _ in 0..1000 { limiter.acquire().await; make_request().await; }

Parallel Task Execution with Join

Execute multiple tasks in parallel and wait for all:

use tokio::try_join;

pub async fn parallel_operations() -> Result<(String, Vec<User>, Config), Error> { try_join!( fetch_data(), fetch_users(), load_config() ) }

// With manual spawning for CPU-bound work pub async fn parallel_cpu_work(items: Vec<Item>) -> Vec<Result<Processed, Error>> { let handles: Vec<_> = items .into_iter() .map(|item| { tokio::task::spawn_blocking(move || { expensive_cpu_work(item) }) }) .collect();

let mut results = Vec::new();
for handle in handles {
    results.push(handle.await.unwrap());
}
results

}

Coordinated Shutdown with CancellationToken

Manage hierarchical cancellation:

use tokio_util::sync::CancellationToken; use tokio::select;

pub struct Coordinator { token: CancellationToken, tasks: Vec<tokio::task::JoinHandle<()>>, }

impl Coordinator { pub fn new() -> Self { Self { token: CancellationToken::new(), tasks: Vec::new(), } }

pub fn spawn&#x3C;F>(&#x26;mut self, f: F)
where
    F: Future&#x3C;Output = ()> + Send + 'static,
{
    let token = self.token.child_token();
    let handle = tokio::spawn(async move {
        select! {
            _ = token.cancelled() => {}
            _ = f => {}
        }
    });
    self.tasks.push(handle);
}

pub async fn shutdown(self) {
    self.token.cancel();

    for task in self.tasks {
        let _ = task.await;
    }
}

}

// Usage let mut coordinator = Coordinator::new();

coordinator.spawn(worker1()); coordinator.spawn(worker2()); coordinator.spawn(worker3());

// Later... coordinator.shutdown().await;

Async Trait Patterns

Work around async trait limitations:

use async_trait::async_trait;

#[async_trait] pub trait AsyncService { async fn process(&self, input: String) -> Result<String, Error>; }

// Alternative without async-trait pub trait AsyncServiceManual { fn process<'a>( &'a self, input: String, ) -> Pin<Box<dyn Future<Output = Result<String, Error>> + Send + 'a>>; }

// Implementation struct MyService;

#[async_trait] impl AsyncService for MyService { async fn process(&self, input: String) -> Result<String, Error> { // async implementation Ok(input.to_uppercase()) } }

Shared State Management

Safe concurrent access to shared state:

use tokio::sync::RwLock; use std::sync::Arc;

pub struct SharedState { data: Arc<RwLock<HashMap<String, String>>>, }

impl SharedState { pub fn new() -> Self { Self { data: Arc::new(RwLock::new(HashMap::new())), } }

pub async fn get(&#x26;self, key: &#x26;str) -> Option&#x3C;String> {
    let data = self.data.read().await;
    data.get(key).cloned()
}

pub async fn set(&#x26;self, key: String, value: String) {
    let mut data = self.data.write().await;
    data.insert(key, value);
}

// Batch operations
pub async fn get_many(&#x26;self, keys: &#x26;[String]) -> Vec&#x3C;Option&#x3C;String>> {
    let data = self.data.read().await;
    keys.iter()
        .map(|key| data.get(key).cloned())
        .collect()
}

}

// Clone is cheap (Arc) impl Clone for SharedState { fn clone(&self) -> Self { Self { data: self.data.clone(), } } }

Work Stealing Queue

Implement work stealing for load balancing:

use tokio::sync::mpsc; use std::sync::Arc;

pub struct WorkQueue<T> { queues: Vec<mpsc::Sender<T>>, receivers: Vec<mpsc::Receiver<T>>, next: Arc<AtomicUsize>, }

impl<T: Send + 'static> WorkQueue<T> { pub fn new(workers: usize, capacity: usize) -> Self { let mut queues = Vec::new(); let mut receivers = Vec::new();

    for _ in 0..workers {
        let (tx, rx) = mpsc::channel(capacity);
        queues.push(tx);
        receivers.push(rx);
    }

    Self {
        queues,
        receivers,
        next: Arc::new(AtomicUsize::new(0)),
    }
}

pub async fn submit(&#x26;self, work: T) -> Result&#x3C;(), mpsc::error::SendError&#x3C;T>> {
    let idx = self.next.fetch_add(1, Ordering::Relaxed) % self.queues.len();
    self.queues[idx].send(work).await
}

pub fn spawn_workers&#x3C;F>(mut self, process: F)
where
    F: Fn(T) -> Pin&#x3C;Box&#x3C;dyn Future&#x3C;Output = ()> + Send>> + Send + Sync + Clone + 'static,
{
    for mut rx in self.receivers.drain(..) {
        let process = process.clone();
        tokio::spawn(async move {
            while let Some(work) = rx.recv().await {
                process(work).await;
            }
        });
    }
}

}

Circuit Breaker for Resilience

Prevent cascading failures:

use std::sync::atomic::{AtomicU64, Ordering}; use tokio::time::{Instant, Duration};

pub enum CircuitState { Closed, Open(Instant), HalfOpen, }

pub struct CircuitBreaker { state: Arc<RwLock<CircuitState>>, failure_count: AtomicU64, threshold: u64, timeout: Duration, }

impl CircuitBreaker { pub fn new(threshold: u64, timeout: Duration) -> Self { Self { state: Arc::new(RwLock::new(CircuitState::Closed)), failure_count: AtomicU64::new(0), threshold, timeout, } }

pub async fn call&#x3C;F, T, E>(&#x26;self, f: F) -> Result&#x3C;T, CircuitBreakerError&#x3C;E>>
where
    F: Future&#x3C;Output = Result&#x3C;T, E>>,
{
    // Check if circuit is open
    let state = self.state.read().await;
    match *state {
        CircuitState::Open(opened_at) => {
            if opened_at.elapsed() &#x3C; self.timeout {
                return Err(CircuitBreakerError::Open);
            }
            drop(state);
            *self.state.write().await = CircuitState::HalfOpen;
        }
        _ => {}
    }
    drop(state);

    // Execute request
    match f.await {
        Ok(result) => {
            self.on_success().await;
            Ok(result)
        }
        Err(e) => {
            self.on_failure().await;
            Err(CircuitBreakerError::Inner(e))
        }
    }
}

async fn on_success(&#x26;self) {
    self.failure_count.store(0, Ordering::SeqCst);
    let mut state = self.state.write().await;
    if matches!(*state, CircuitState::HalfOpen) {
        *state = CircuitState::Closed;
    }
}

async fn on_failure(&#x26;self) {
    let failures = self.failure_count.fetch_add(1, Ordering::SeqCst) + 1;
    if failures >= self.threshold {
        *self.state.write().await = CircuitState::Open(Instant::now());
    }
}

}

Batching Operations

Batch multiple operations for efficiency:

use tokio::time::{interval, Duration};

pub struct Batcher<T> { tx: mpsc::Sender<T>, }

impl<T: Send + 'static> Batcher<T> { pub fn new<F>( batch_size: usize, batch_timeout: Duration, process: F, ) -> Self where F: Fn(Vec<T>) -> Pin<Box<dyn Future<Output = ()> + Send>> + Send + 'static, { let (tx, mut rx) = mpsc::channel(1000);

    tokio::spawn(async move {
        let mut batch = Vec::with_capacity(batch_size);
        let mut interval = interval(batch_timeout);

        loop {
            tokio::select! {
                item = rx.recv() => {
                    match item {
                        Some(item) => {
                            batch.push(item);
                            if batch.len() >= batch_size {
                                process(std::mem::replace(&#x26;mut batch, Vec::with_capacity(batch_size))).await;
                            }
                        }
                        None => break,
                    }
                }
                _ = interval.tick() => {
                    if !batch.is_empty() {
                        process(std::mem::replace(&#x26;mut batch, Vec::with_capacity(batch_size))).await;
                    }
                }
            }
        }

        // Process remaining items
        if !batch.is_empty() {
            process(batch).await;
        }
    });

    Self { tx }
}

pub async fn submit(&#x26;self, item: T) -> Result&#x3C;(), mpsc::error::SendError&#x3C;T>> {
    self.tx.send(item).await
}

}

Best Practices

Use appropriate concurrency limits - Don't spawn unbounded tasks
Implement backpressure - Use bounded channels and semaphores
Handle cancellation - Support cooperative cancellation with tokens
Avoid lock contention - Minimize lock scope, prefer channels
Use rate limiting - Protect external services
Implement circuit breakers - Prevent cascading failures
Batch operations - Reduce overhead for small operations
Profile concurrency - Use tokio-console to understand behavior
Use appropriate synchronization - RwLock for read-heavy, Mutex for write-heavy
Design for failure - Always consider what happens when operations fail

tokio-concurrency

Safety Notice

Copy this and send it to your AI assistant to learn

Source Transparency

Related Skills

documentation-update

git-troubleshooting

git-advanced