Load shedding middleware #770

Draft · wants to merge 4 commits into `main`
2 changes: 2 additions & 0 deletions Cargo.toml
@@ -38,12 +38,14 @@ async-session = { version = "2.0.1", optional = true }
async-sse = "4.0.1"
async-std = { version = "1.6.5", features = ["unstable"] }
async-trait = "0.1.41"
exponential-backoff = "1.0.0"
femme = { version = "2.1.1", optional = true }
futures-util = "0.3.6"
http-client = { version = "6.1.0", default-features = false }
http-types = "2.5.0"
kv-log-macro = "1.0.7"
log = { version = "0.4.11", features = ["std"] }
pid-lite = "1.1.0"
pin-project-lite = "0.1.10"
route-recognizer = "0.2.0"
serde = "1.0.117"
2 changes: 1 addition & 1 deletion examples/hello.rs
@@ -1,5 +1,5 @@
#[async_std::main]
async fn main() -> Result<(), std::io::Error> {
async fn main() -> std::io::Result<()> {
tide::log::start();
let mut app = tide::new();
app.at("/").get(|_| async { Ok("Hello, world!") });
1 change: 1 addition & 0 deletions src/lib.rs
@@ -75,6 +75,7 @@ mod router;
mod server;

pub mod convert;
pub mod limit;
pub mod listener;
pub mod log;
pub mod prelude;
169 changes: 169 additions & 0 deletions src/limit/load_shedder.rs
@@ -0,0 +1,169 @@
// https://github.com/asecurityteam/loadshed

use crate::{Middleware, Next, Request, Response};

use async_std::sync::{Arc, RwLock};
use http_types::headers::RETRY_AFTER;
use std::time::{Duration, Instant};

use async_trait::async_trait;
use exponential_backoff::Backoff;
use pid_lite::Controller;

const SESSION_KEY: &str = "load_shedder::backoff_attempt";
const RETRIES: u32 = 28;
const MIN_RETRY: Duration = Duration::from_secs(2);
const MAX_RETRY: Duration = Duration::from_secs(12);

/// Proportional request rejection based on load metrics.
///
/// This middleware requires the session middleware to be enabled in order to
/// track the exponential backoff value per-client.
///
/// # What is the purpose of this?
///
/// This middleware starts rejecting requests once a threshold has been
/// reached, telling clients to try again later. This enables a service to
/// cope with sudden increases in traffic without going down.
///
/// # How does this work?
///
/// This middleware sets a target number of requests it can process concurrently.
/// Once that capacity has been reached it starts yielding back `503: Service
/// Unavailable` in order to shed load. Responses also include a `Retry-After`
/// header indicating when the client should retry.
///
/// Internally capacity is governed through a [PID
/// controller](https://en.wikipedia.org/wiki/PID_controller). This enables
/// gradually scaling up the load, which prevents suddenly overwhelming the
/// system and potentially crashing it.
///
/// # What should clients implement?
///
/// Ideally a client will understand that it can retry `503` responses, and
/// will retry once the timeout from the `Retry-After` header has elapsed.
///
/// # What other mitigations can be applied?
///
/// Always use a CDN which provides DDoS protection, and correctly configure your
/// firewalls. Beyond that there are many kinds of rate limiters, and
/// [Stripe has an excellent blog post](https://stripe.com/blog/rate-limiters)
/// listing which exist and how to reason about them.
///
/// # Updating limits at runtime
///
/// Some systems may be employing an external control plane to configure the
/// limits and will want to be able to configure the load shed target too. This
/// can be done by cloning the instantiated middleware, and calling `set_target`
/// on it in response to a command from the control plane. This will update the
/// limit shared by all instances of the middleware immediately.
#[derive(Debug, Clone)]
pub struct LoadShedder {
inner: Arc<RwLock<Inner>>,
/// The current amount of requests in flight.
counter: Arc<()>,
/// The number of middleware instances in use. This number is subtracted
/// from the `counter` to arrive at the correct number of requests currently
/// in flight.
instance_count: Arc<()>,
}

#[derive(Debug)]
struct Inner {
/// The PID controller governing the load.
controller: Controller,
/// The target number of concurrent requests we can have before we start
/// shedding load.
current_target: f64,
/// The last time at which the counter was updated.
last_time: Instant,
}

impl LoadShedder {
/// Create a new instance of `LoadShedder`.
///
/// `target` defines the desired number of concurrent requests we want to
/// allow in order to optimize throughput on this service. By default the
/// middleware is configured with the following tuning:
/// - `p_gain`: `0.5`
/// - `i_gain`: `0.1`
/// - `d_gain`: `0.2`
pub fn new(target: usize) -> Self {
Self::with_gain(target, 0.5, 0.1, 0.2)
}

/// Create a new instance of `LoadShedder` with custom tuning parameters.
// TODO: pass a callback so it can be "dark applied".
// TODO: consider "dark applying" a first-class mode that we should enable
pub fn with_gain(target: usize, p_gain: f64, i_gain: f64, d_gain: f64) -> Self {
let target = target as f64;
let mut controller = Controller::new(target, p_gain, i_gain, d_gain);
let correction = controller.update(0.0);
Self {
inner: Arc::new(RwLock::new(Inner {
controller,
current_target: correction,
last_time: Instant::now(),
})),
counter: Arc::new(()),
instance_count: Arc::new(()),
}
}

/// Get the target value.
pub async fn target(&self) -> f64 {
let guard = self.inner.read().await;
guard.controller.target()
}

/// Set the target value.
pub async fn set_target(&mut self, target: f64) {
let mut guard = self.inner.write().await;
guard.controller.set_target(target);
}
}

#[async_trait]
impl<State: Clone + Send + Sync + 'static> Middleware<State> for LoadShedder {
async fn handle(&self, mut req: Request<State>, next: Next<'_, State>) -> crate::Result {
// Init the middleware's request state.
let instance_count = Arc::strong_count(&self.instance_count);
let count_guard = self.counter.clone();
let current_count = Arc::strong_count(&count_guard) - instance_count;
let session = req.session_mut();

// Update the PID controller if needed.
let now = Instant::now();
let last_time = self.inner.read().await.last_time;
if now.duration_since(last_time) > Duration::from_secs(1) {
let mut guard = self.inner.write().await;
guard.last_time = now;
guard.current_target += guard.controller.update(current_count as f64);
}

// Check whether a 503 should be returned.
let guard = self.inner.read().await;
if current_count > guard.current_target as usize {
log::error!(
"Load shedding middleware engaged. target count: {}, current target: {}, current count: {}",
guard.controller.target(),
guard.current_target,
current_count
);

let backoff = Backoff::new(RETRIES, MIN_RETRY, MAX_RETRY);
let attempt = session.get::<u32>(SESSION_KEY).unwrap_or(0);
let dur = backoff.next(attempt).unwrap_or(MAX_RETRY); // Fall back to the max delay once retries are exhausted.
session.insert(SESSION_KEY, attempt + 1)?;
let res = Response::builder(503).header(RETRY_AFTER, format!("{}", dur.as_secs()));
return Ok(res.into());
}

session.remove(SESSION_KEY);

// Finish running the request.
let res = next.run(req).await;
drop(count_guard);
Ok(res)
}
}
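The `counter`/`instance_count` bookkeeping above leans on `Arc::strong_count`: every in-flight request holds a clone of the counter, so the strong count minus the handles held by the middleware itself equals the number of requests in flight. A minimal std-only sketch of that accounting (names are illustrative, not from the PR):

```rust
use std::sync::Arc;

fn main() {
    let counter = Arc::new(());
    // Handles held by the middleware itself; subtracted from the total.
    let instances = Arc::strong_count(&counter); // 1

    let req_a = Arc::clone(&counter); // request A starts
    let req_b = Arc::clone(&counter); // request B starts
    assert_eq!(Arc::strong_count(&counter) - instances, 2);

    drop(req_a); // request A finishes; the count drops automatically
    assert_eq!(Arc::strong_count(&counter) - instances, 1);

    drop(req_b);
    assert_eq!(Arc::strong_count(&counter) - instances, 0);
    println!("in-flight accounting ok");
}
```

Because the clone is dropped when the request future completes (even on panic-free early returns), no explicit decrement is needed.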
6 changes: 6 additions & 0 deletions src/limit/mod.rs
@@ -0,0 +1,6 @@
//! HTTP rate, size, and load limiting middleware.
#[cfg(feature = "sessions")]
mod load_shedder;

#[cfg(feature = "sessions")]
pub use load_shedder::LoadShedder;
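Since the doc comment requires session middleware to be registered first, a usage sketch may help. This assumes the PR's API lands as `tide::limit::LoadShedder` and that the `sessions` feature is enabled; the secret, target, and route are placeholders:

```rust
use tide::limit::LoadShedder;
use tide::sessions::{MemoryStore, SessionMiddleware};

#[async_std::main]
async fn main() -> tide::Result<()> {
    let mut app = tide::new();

    // The shedder stores the per-client backoff attempt in the session,
    // so session middleware must be registered before the shedder.
    app.with(SessionMiddleware::new(
        MemoryStore::new(),
        b"please-load-a-real-32+-byte-secret!!!!!!",
    ));

    // Start shedding once roughly 100 requests are in flight.
    app.with(LoadShedder::new(100));

    app.at("/").get(|_| async { Ok("Hello, world!") });
    app.listen("127.0.0.1:8080").await?;
    Ok(())
}
```

A clone of the `LoadShedder` could additionally be kept outside the app and handed to a control-plane task, which calls `set_target` to retune all instances at runtime, as described above.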