From c531e03d35a4ace1dc643ea46bf3c567550cbc9a Mon Sep 17 00:00:00 2001 From: Yoshua Wuyts Date: Sat, 26 Dec 2020 23:45:39 +0100 Subject: [PATCH 1/4] init load shed middleware --- Cargo.toml | 1 + src/lib.rs | 1 + src/limit/load.rs | 135 ++++++++++++++++++++++++++++++++++++++++++++++ src/limit/mod.rs | 4 ++ 4 files changed, 141 insertions(+) create mode 100644 src/limit/load.rs create mode 100644 src/limit/mod.rs diff --git a/Cargo.toml b/Cargo.toml index 334655623..381898986 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -48,6 +48,7 @@ pin-project-lite = "0.1.10" route-recognizer = "0.2.0" serde = "1.0.117" serde_json = "1.0.59" +pid-lite = "1.1.0" [dev-dependencies] async-std = { version = "1.6.5", features = ["unstable", "attributes"] } diff --git a/src/lib.rs b/src/lib.rs index 13b835870..755595e41 100644 --- a/src/lib.rs +++ b/src/lib.rs @@ -75,6 +75,7 @@ mod router; mod server; pub mod convert; +pub mod limit; pub mod listener; pub mod log; pub mod prelude; diff --git a/src/limit/load.rs b/src/limit/load.rs new file mode 100644 index 000000000..d279fbf2d --- /dev/null +++ b/src/limit/load.rs @@ -0,0 +1,135 @@ +// https://github.com/asecurityteam/loadshed + +use crate::{Middleware, Next, Request, Response}; + +use async_std::sync::{Arc, RwLock}; +use std::time::{Duration, Instant}; + +use async_trait::async_trait; +use pid_lite::Controller; + +/// Proportional request rejection based on load metrics. +/// +/// # What is this purpose of this? +/// +/// This middleware starts rejecting requests once a threshold has been reached +/// telling clients to try again. This enables a service to cope with sudden +/// increases in traffic without going down. +/// +/// # How does this work? +/// +/// This middleware sets a target number of requests it can process concurrently. +/// Once capacity has been achieved it starts yielding back `503: service +/// unavailable` in order to shed load. 
Responses also include a `Retry-After` +/// header which sets a time in the future when to retry again +/// +/// Internally capacity is governed through a [PID +/// controller](https://en.wikipedia.org/wiki/PID_controller). This enables +/// gradually scaling up load which prevents suddenly overwhelming the system and +/// potentially crashing. +/// +/// # What should clients implement? +/// +/// Ideally a client will understand it can retry `503` requests, and will retry +/// with the `Retry-After` value from the response after the timeout has elapsed. +/// +/// # What other mitigations can be applied? +/// +/// Always use a CDN which provides DDoS protection, and correctly configure your +/// firewalls. Beyond that there are many kinds of rate limiters, and +/// [Stripe has an excellent blog post](https://stripe.com/blog/rate-limiters) +/// listing which exist and how to reason about them. +#[derive(Debug)] +pub struct LoadShedMiddleware { + inner: RwLock, + /// The current amount of requests in flight. + counter: Arc<()>, + // TODO: create another Arc to count how many instance of this middleware exist. +} + +#[derive(Debug)] +struct Inner { + /// The PID controller governing the load. + controller: Controller, + /// The target number of concurrent requests we can have before we start + /// shedding load. + current_target: f64, + last_time: Instant, +} + +impl LoadShedMiddleware { + /// Create a new instance of `LoadShedMiddleware`. + /// + /// `target` defines the desired amount of concurrent requests we want to + /// reach in order to optimize throughput on this service. + pub fn new(target: f64) -> Self { + Self::with_gain(target, 0.5, 0.1, 0.2) + } + + /// Create a new instance of `LoadShedMiddleware` with custom tuning parameters. + /// TODO: pass a callback so it can be "dark applied". + /// TODO: consider "dark applying" a first-class mode that we should enable + /// TODO: apply `log` logs. 
+ pub fn with_gain(target: f64, p_gain: f64, i_gain: f64, d_gain: f64) -> Self { + let current_target = 0.0; + let mut controller = Controller::new(target, p_gain, i_gain, d_gain); + let _correction = controller.update(current_target); + Self { + inner: RwLock::new(Inner { + controller, + current_target, + last_time: Instant::now(), + }), + counter: Arc::new(()), + } + } + + /// Get the target value. + pub async fn target(&self) -> f64 { + let guard = self.inner.read().await; + guard.controller.target() + } + + /// Set the target value. + pub async fn set_target(&mut self, target: f64) { + let mut guard = self.inner.write().await; + guard.controller.set_target(target); + } +} + +#[async_trait] +impl Middleware for LoadShedMiddleware { + async fn handle(&self, req: Request, next: Next<'_, State>) -> crate::Result { + // Init the middleware's request state. + let count_guard = self.counter.clone(); + let current_count = Arc::strong_count(&count_guard); + + // Update the PID controller if needed. + let now = Instant::now(); + let last_time = self.inner.read().await.last_time; + let elapsed = now.duration_since(last_time); + drop(last_time); + if elapsed > Duration::from_secs(1) { + let mut guard = self.inner.write().await; + guard.last_time = now; + let correction = guard.controller.update(current_count as f64); + guard.current_target += correction; + } + + // Check whether a 503 should be returned. + let guard = self.inner.read().await; + if current_count > guard.current_target as usize { + println!( + "Load shedding middleware engaged. target count: {}, current count: {}", + guard.controller.target(), + current_count + ); + return Ok(Response::new(503)); + } + + // Finish running the request. + let res = next.run(req).await; + drop(count_guard); + Ok(res) + } +} diff --git a/src/limit/mod.rs b/src/limit/mod.rs new file mode 100644 index 000000000..8fc92736b --- /dev/null +++ b/src/limit/mod.rs @@ -0,0 +1,4 @@ +//! HTTP rate, size, and load limiting middleware. 
+mod load; + +pub use load::LoadShedMiddleware; From 9bc486133c15a4c52b34ed9a8135d99e4bf9bfe4 Mon Sep 17 00:00:00 2001 From: Yoshua Wuyts Date: Sun, 27 Dec 2020 00:51:58 +0100 Subject: [PATCH 2/4] rename middleware --- examples/hello.rs | 5 +- src/limit/{load.rs => load_shedder.rs} | 70 ++++++++++++++++---------- src/limit/mod.rs | 4 +- 3 files changed, 50 insertions(+), 29 deletions(-) rename src/limit/{load.rs => load_shedder.rs} (64%) diff --git a/examples/hello.rs b/examples/hello.rs index f8dee0b2d..b75419f35 100644 --- a/examples/hello.rs +++ b/examples/hello.rs @@ -1,7 +1,10 @@ +use tide::limit::LoadShedder; + #[async_std::main] -async fn main() -> Result<(), std::io::Error> { +async fn main() -> std::io::Result<()> { tide::log::start(); let mut app = tide::new(); + app.with(LoadShedder::new(0)); app.at("/").get(|_| async { Ok("Hello, world!") }); app.listen("127.0.0.1:8080").await?; Ok(()) diff --git a/src/limit/load.rs b/src/limit/load_shedder.rs similarity index 64% rename from src/limit/load.rs rename to src/limit/load_shedder.rs index d279fbf2d..fae43e7b6 100644 --- a/src/limit/load.rs +++ b/src/limit/load_shedder.rs @@ -3,6 +3,7 @@ use crate::{Middleware, Next, Request, Response}; use async_std::sync::{Arc, RwLock}; +use http_types::headers::RETRY_AFTER; use std::time::{Duration, Instant}; use async_trait::async_trait; @@ -39,12 +40,23 @@ use pid_lite::Controller; /// firewalls. Beyond that there are many kinds of rate limiters, and /// [Stripe has an excellent blog post](https://stripe.com/blog/rate-limiters) /// listing which exist and how to reason about them. -#[derive(Debug)] -pub struct LoadShedMiddleware { - inner: RwLock, +/// +/// # Updating limits at runtime +/// +/// Some systems may be employing an external control plane to configure the +/// limits and will want to be able to configure the load shed target too. 
This +/// can be done by cloning the instantiated middleware, and calling `set_target` +/// on it in response to a command from the control plane. This will update the +/// limit shared by all instances of the middleware immediately. +#[derive(Debug, Clone)] +pub struct LoadShedder { +    inner: Arc>, /// The current amount of requests in flight. counter: Arc<()>, -    // TODO: create another Arc to count how many instance of this middleware exist. +    /// The number of middleware instances in use. This number is subtracted +    /// from the `counter` to arrive at the correct number of requests currently +    /// in flight. +    instance_count: Arc<()>, } #[derive(Debug)] @@ -54,33 +66,38 @@ struct Inner { /// The target number of concurrent requests we can have before we start /// shedding load. current_target: f64, +    /// The last time at which the counter was updated. last_time: Instant, } -impl LoadShedMiddleware { +impl LoadShedder { /// Create a new instance of `LoadShedMiddleware`. /// /// `target` defines the desired amount of concurrent requests we want to -    /// reach in order to optimize throughput on this service. -    pub fn new(target: f64) -> Self { +    /// reach in order to optimize throughput on this service. By default the +    /// middleware is configured with the following tuning: +    /// - `p_gain`: `0.5` +    /// - `i_gain`: `0.1` +    /// - `d_gain`: `0.2` +    pub fn new(target: usize) -> Self { Self::with_gain(target, 0.5, 0.1, 0.2) } /// Create a new instance of `LoadShedMiddleware` with custom tuning parameters. -    /// TODO: pass a callback so it can be "dark applied". -    /// TODO: consider "dark applying" a first-class mode that we should enable -    /// TODO: apply `log` logs. -    pub fn with_gain(target: f64, p_gain: f64, i_gain: f64, d_gain: f64) -> Self { -        let current_target = 0.0; +    // TODO: pass a callback so it can be "dark applied". 
+ // TODO: consider "dark applying" a first-class mode that we should enable + pub fn with_gain(target: usize, p_gain: f64, i_gain: f64, d_gain: f64) -> Self { + let target = target as f64; let mut controller = Controller::new(target, p_gain, i_gain, d_gain); - let _correction = controller.update(current_target); + let correction = controller.update(0.0); Self { - inner: RwLock::new(Inner { + inner: Arc::new(RwLock::new(Inner { controller, - current_target, + current_target: correction, last_time: Instant::now(), - }), + })), counter: Arc::new(()), + instance_count: Arc::new(()), } } @@ -98,33 +115,34 @@ impl LoadShedMiddleware { } #[async_trait] -impl Middleware for LoadShedMiddleware { +impl Middleware for LoadShedder { async fn handle(&self, req: Request, next: Next<'_, State>) -> crate::Result { // Init the middleware's request state. + let instance_count = Arc::strong_count(&self.instance_count); let count_guard = self.counter.clone(); - let current_count = Arc::strong_count(&count_guard); + let current_count = Arc::strong_count(&count_guard) - instance_count; // Update the PID controller if needed. let now = Instant::now(); let last_time = self.inner.read().await.last_time; - let elapsed = now.duration_since(last_time); - drop(last_time); - if elapsed > Duration::from_secs(1) { + if now.duration_since(last_time) > Duration::from_secs(1) { let mut guard = self.inner.write().await; guard.last_time = now; - let correction = guard.controller.update(current_count as f64); - guard.current_target += correction; + guard.current_target += guard.controller.update(current_count as f64); } // Check whether a 503 should be returned. let guard = self.inner.read().await; if current_count > guard.current_target as usize { - println!( - "Load shedding middleware engaged. target count: {}, current count: {}", + log::error!( + "Load shedding middleware engaged. 
target count: {}, current target: {}, current count: {}", guard.controller.target(), + guard.current_target, current_count ); - return Ok(Response::new(503)); + // TODO: apply `Retry-After` header. + let res = Response::builder(503).header(RETRY_AFTER, "2"); + return Ok(res.into()); } // Finish running the request. diff --git a/src/limit/mod.rs b/src/limit/mod.rs index 8fc92736b..f3f0cffd8 100644 --- a/src/limit/mod.rs +++ b/src/limit/mod.rs @@ -1,4 +1,4 @@ //! HTTP rate, size, and load limiting middleware. -mod load; +mod load_shedder; -pub use load::LoadShedMiddleware; +pub use load_shedder::LoadShedder; From 26de80f9df8a99752b32c831d87e371208fd61c7 Mon Sep 17 00:00:00 2001 From: Yoshua Wuyts Date: Sun, 27 Dec 2020 01:51:12 +0100 Subject: [PATCH 3/4] fix load shedder --- Cargo.toml | 3 ++- examples/hello.rs | 3 --- src/limit/load_shedder.rs | 22 +++++++++++++++++++--- 3 files changed, 21 insertions(+), 7 deletions(-) diff --git a/Cargo.toml b/Cargo.toml index 381898986..6e0a68784 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -38,17 +38,18 @@ async-session = { version = "2.0.1", optional = true } async-sse = "4.0.1" async-std = { version = "1.6.5", features = ["unstable"] } async-trait = "0.1.41" +exponential-backoff = "1.0.0" femme = { version = "2.1.1", optional = true } futures-util = "0.3.6" http-client = { version = "6.1.0", default-features = false } http-types = "2.5.0" kv-log-macro = "1.0.7" log = { version = "0.4.11", features = ["std"] } +pid-lite = "1.1.0" pin-project-lite = "0.1.10" route-recognizer = "0.2.0" serde = "1.0.117" serde_json = "1.0.59" -pid-lite = "1.1.0" [dev-dependencies] async-std = { version = "1.6.5", features = ["unstable", "attributes"] } diff --git a/examples/hello.rs b/examples/hello.rs index b75419f35..71674c37e 100644 --- a/examples/hello.rs +++ b/examples/hello.rs @@ -1,10 +1,7 @@ -use tide::limit::LoadShedder; - #[async_std::main] async fn main() -> std::io::Result<()> { tide::log::start(); let mut app = tide::new(); - 
app.with(LoadShedder::new(0)); app.at("/").get(|_| async { Ok("Hello, world!") }); app.listen("127.0.0.1:8080").await?; Ok(()) diff --git a/src/limit/load_shedder.rs b/src/limit/load_shedder.rs index fae43e7b6..cf35041d8 100644 --- a/src/limit/load_shedder.rs +++ b/src/limit/load_shedder.rs @@ -7,10 +7,19 @@ use http_types::headers::RETRY_AFTER; use std::time::{Duration, Instant}; use async_trait::async_trait; +use exponential_backoff::Backoff; use pid_lite::Controller; +const SESSION_KEY: &str = "load_shedder::backoff_attempt"; +const RETRIES: u32 = 28; +const MIN_RETRY: Duration = Duration::from_secs(2); +const MAX_RETRY: Duration = Duration::from_secs(12); + /// Proportional request rejection based on load metrics. /// +/// This middleware requires the session middleware to be enabled in order to +/// track the exponential backoff value per-client. +/// /// # What is this purpose of this? /// /// This middleware starts rejecting requests once a threshold has been reached @@ -116,11 +125,12 @@ impl LoadShedder { #[async_trait] impl Middleware for LoadShedder { - async fn handle(&self, req: Request, next: Next<'_, State>) -> crate::Result { + async fn handle(&self, mut req: Request, next: Next<'_, State>) -> crate::Result { // Init the middleware's request state. let instance_count = Arc::strong_count(&self.instance_count); let count_guard = self.counter.clone(); let current_count = Arc::strong_count(&count_guard) - instance_count; + let session = req.session_mut(); // Update the PID controller if needed. let now = Instant::now(); @@ -140,11 +150,17 @@ impl Middleware for LoadShedder { guard.current_target, current_count ); - // TODO: apply `Retry-After` header. - let res = Response::builder(503).header(RETRY_AFTER, "2"); + + let backoff = Backoff::new(RETRIES, MIN_RETRY, MAX_RETRY); + let attempt = session.get::(SESSION_KEY).unwrap_or(0); + let dur = backoff.next(attempt).unwrap(); // Safe because no max backoff is set. 
+ session.insert(SESSION_KEY, attempt + 1)?; + let res = Response::builder(503).header(RETRY_AFTER, format!("{}", dur.as_secs())); return Ok(res.into()); } + session.remove(SESSION_KEY); + // Finish running the request. let res = next.run(req).await; drop(count_guard); From aa88c182c99bf06faa3b30b61161ceccaf10c11f Mon Sep 17 00:00:00 2001 From: Yoshua Wuyts Date: Sun, 27 Dec 2020 02:01:56 +0100 Subject: [PATCH 4/4] fix feature flag --- src/limit/mod.rs | 2 ++ 1 file changed, 2 insertions(+) diff --git a/src/limit/mod.rs b/src/limit/mod.rs index f3f0cffd8..6a782003c 100644 --- a/src/limit/mod.rs +++ b/src/limit/mod.rs @@ -1,4 +1,6 @@ //! HTTP rate, size, and load limiting middleware. +#[cfg(feature = "sessions")] mod load_shedder; +#[cfg(feature = "sessions")] pub use load_shedder::LoadShedder;