Skip to content
Snippets Groups Projects
Commit 644f962c authored by Ian Jackson's avatar Ian Jackson :speech_balloon:
Browse files

Merge branch 'move-retry-delay' into 'main'

Move RetryDelay into tor-basic-utils

See merge request tpo/core/arti!411
parents 3e12cf26 09f750c2
No related branches found
No related tags found
No related merge requests found
......@@ -3129,6 +3129,7 @@ name = "tor-basic-utils"
version = "0.1.0"
dependencies = [
"educe",
"rand 0.8.5",
]
[[package]]
......
......@@ -7,10 +7,12 @@ license = "MIT OR Apache-2.0"
homepage = "https://gitlab.torproject.org/tpo/core/arti/-/wikis/home"
description = "General helpers used by Tor"
keywords = ["tor", "arti"]
categories = ["rust-patterns"] # We must put *something* here and this will do
# We must put *something* here and this will do
categories = ["rust-patterns"]
repository = "https://gitlab.torproject.org/tpo/core/arti.git/"
[dependencies]
rand = "0.8"
[dev-dependencies]
educe = "0.4.6"
......@@ -41,6 +41,8 @@
use std::fmt;
pub mod retry;
// ----------------------------------------------------------------------
/// Function with the signature of `Debug::fmt` that just prints `".."`
......
//! An implementation of the "decorrelated jitter" algorithm for scheduling retries.
//!
//! See [`RetryDelay`] for more information.
use std::time::Duration;
use rand::Rng;
/// An implementation for retrying a remote operation based on a [decorrelated
/// jitter] schedule.
///
/// The algorithm used here has several desirable properties:
/// * It is randomized, so that multiple timeouts don't have a danger of
/// getting synchronized with each other and hammering the same servers all
/// at once.
/// * It tends on average to wait longer and longer over time, so that if the
/// server is down, it won't get pummeled by a zillion failing clients
/// when it comes back up.
/// * It has a chance of retrying promptly, which results in better client
/// performance on average.
///
/// For a more full specification, see [`dir-spec.txt`].
///
/// [decorrelated jitter]:
/// https://aws.amazon.com/blogs/architecture/exponential-backoff-and-jitter/
/// [`dir-spec.txt`]: https://spec.torproject.org/dir-spec
#[derive(Clone, Debug)]
pub struct RetryDelay {
/// The last delay that this retry delay returned (in msec), or 0
/// if this never returned a delay.
last_delay_ms: u32,
/// The lowest allowable delay (in msec).
low_bound_ms: u32,
}
/// Lowest possible lower bound, in milliseconds.
// We're doing this in MS, and Tor does it in seconds, so I'm
// multiplying the minimum by 1000 here.
const MIN_LOW_BOUND: u32 = 1000;
/// Largest possible lower bound, in milliseconds.
const MAX_LOW_BOUND: u32 = std::u32::MAX - 1;
/// Maximum amount to multiply the previous delay by.
const MAX_DELAY_MULT: u32 = 3;
impl RetryDelay {
/// Construct a new RetryDelay from a given base delay in
/// milliseconds.
///
/// The base delay defines the lowest possible interval that can
/// be returned.
///
/// # Limitations
///
/// If the base delay is less than 1000, a base delay of 1000 is
/// used instead, since that's what the C tor implementation does.
pub fn from_msec(base_delay_msec: u32) -> Self {
let low_bound_ms = base_delay_msec.clamp(MIN_LOW_BOUND, MAX_LOW_BOUND);
RetryDelay {
last_delay_ms: 0,
low_bound_ms,
}
}
/// Construct a new RetryDelay from a given base delay.
///
/// See from_msec for more information.
pub fn from_duration(d: Duration) -> Self {
let msec = d.as_millis();
let msec = std::cmp::min(msec, u128::from(MAX_LOW_BOUND)) as u32;
RetryDelay::from_msec(msec)
}
/// Helper: Return a lower and upper bound for the next delay to
/// be yielded.
///
/// Values are in milliseconds.
fn delay_bounds(&self) -> (u32, u32) {
let low = self.low_bound_ms;
let high = std::cmp::max(
// We don't need a saturating_add here, since low is always
// less than high, so low cannot be equal to u32::MAX.
low + 1,
self.last_delay_ms.saturating_mul(MAX_DELAY_MULT),
);
(low, high)
}
/// Return the next delay to be used (in milliseconds), according
/// to a given random number generator.
fn next_delay_msec<R: Rng>(&mut self, rng: &mut R) -> u32 {
let (low, high) = self.delay_bounds();
assert!(low < high);
let val = rng.gen_range(low..high);
self.last_delay_ms = val;
val
}
/// Return the next delay to be used (as a [`Duration`]),
/// according to a given random number generator.
pub fn next_delay<R: Rng>(&mut self, rng: &mut R) -> Duration {
Duration::from_millis(u64::from(self.next_delay_msec(rng)))
}
}
impl Default for RetryDelay {
fn default() -> Self {
RetryDelay::from_msec(0)
}
}
#[cfg(test)]
mod test {
use super::*;
#[test]
fn init() {
let rd = RetryDelay::from_msec(2000);
assert_eq!(rd.last_delay_ms, 0);
assert_eq!(rd.low_bound_ms, 2000);
let rd = RetryDelay::from_msec(0);
assert_eq!(rd.last_delay_ms, 0);
assert_eq!(rd.low_bound_ms, 1000);
let rd = RetryDelay::from_duration(Duration::new(1, 500_000_000));
assert_eq!(rd.last_delay_ms, 0);
assert_eq!(rd.low_bound_ms, 1500);
}
#[test]
fn bounds() {
let mut rd = RetryDelay::from_msec(1000);
assert_eq!(rd.delay_bounds(), (1000, 1001));
rd.last_delay_ms = 1500;
assert_eq!(rd.delay_bounds(), (1000, 4500));
rd.last_delay_ms = 3_000_000_000;
assert_eq!(rd.delay_bounds(), (1000, std::u32::MAX));
}
#[test]
fn rng() {
let mut rd = RetryDelay::from_msec(50);
let real_low_bound = std::cmp::max(50, MIN_LOW_BOUND);
let mut rng = rand::thread_rng();
for _ in 1..100 {
let (b_lo, b_hi) = rd.delay_bounds();
assert!(b_lo == real_low_bound);
assert!(b_hi > b_lo);
let delay = rd.next_delay(&mut rng).as_millis() as u32;
assert_eq!(delay, rd.last_delay_ms);
assert!(delay >= b_lo);
assert!(delay < b_hi);
}
}
}
//! Implement a timer for retrying a single failed fetch or object,
//! using the [decorrelated jitter] algorithm.
//! Configure timers for a timer for retrying a single failed fetch or object.
//!
//! For a more full specification, see [`dir-spec.txt`].
//!
//! [decorrelated jitter]: https://aws.amazon.com/blogs/architecture/exponential-backoff-and-jitter/
//! [`dir-spec.txt`]: https://spec.torproject.org/dir-spec
//! For a more information on the algorithm, see
//! [`RetryDelay`](tor_basic_utils::retry::RetryDelay).
use rand::Rng;
use std::convert::TryInto;
use std::num::{NonZeroU32, NonZeroU8};
use std::time::Duration;
use serde::Deserialize;
/// An implementation for retrying downloads based on a decorrelated jitter
/// schedule.
///
/// The algorithm used here has several desirable properties:
/// * It is randomized, so that multiple timeouts don't have a
/// danger of getting synchronized with each other and hammering the
/// same directory servers all at once.
/// * It tends on average to wait longer and longer over time, so
/// that if the directory server is down, it won't get pummeled by
/// a zillion failing clients when it comes back up.
/// * It has a chance of retrying promptly, which results in better
/// client performance on average.
pub struct RetryDelay {
/// The last delay that this retry delay returned (in msec), or 0
/// if this never returned a delay.
last_delay_ms: u32,
/// The lowest allowable delay (in msec).
low_bound_ms: u32,
}
/// Lowest possible lower bound, in milliseconds.
// We're doing this in MS, and Tor does it in seconds, so I'm
// multiplying the minimum by 1000 here.
const MIN_LOW_BOUND: u32 = 1000;
/// Largest possible lower bound, in milliseconds.
const MAX_LOW_BOUND: u32 = std::u32::MAX - 1;
/// Maximum amount to multiply the previous delay by.
const MAX_DELAY_MULT: u32 = 3;
impl RetryDelay {
/// Construct a new RetryDelay from a given base delay in
/// milliseconds.
///
/// The base delay defines the lowest possible interval that can
/// be returned.
///
/// # Limitations
///
/// If the base delay is less than 1000, a base delay of 1000 is
/// used instead, since that's what the C tor implementation does.
pub fn from_msec(base_delay_msec: u32) -> Self {
let low_bound_ms = base_delay_msec.clamp(MIN_LOW_BOUND, MAX_LOW_BOUND);
RetryDelay {
last_delay_ms: 0,
low_bound_ms,
}
}
/// Construct a new RetryDelay from a given base delay.
///
/// See from_msec for more information.
pub fn from_duration(d: Duration) -> Self {
let msec = d.as_millis();
let msec = std::cmp::min(msec, u128::from(MAX_LOW_BOUND)) as u32;
RetryDelay::from_msec(msec)
}
/// Helper: Return a lower and upper bound for the next delay to
/// be yielded.
fn delay_bounds(&self) -> (u32, u32) {
let low = self.low_bound_ms;
let high = std::cmp::max(
// We don't need a saturating_add here, since low is always
// less than high, so low cannot be equal to u32::MAX.
low + 1,
self.last_delay_ms.saturating_mul(MAX_DELAY_MULT),
);
(low, high)
}
/// Return the next delay to be used (in milliseconds), according
/// to a given random number generator.
pub fn next_delay_msec<R: Rng>(&mut self, rng: &mut R) -> u32 {
let (low, high) = self.delay_bounds();
assert!(low < high);
let val = rng.gen_range(low..high);
self.last_delay_ms = val;
val
}
/// Return the next delay to be used (as a [`Duration`]),
/// according to a given random number generator.
pub fn next_delay<R: Rng>(&mut self, rng: &mut R) -> Duration {
Duration::from_millis(u64::from(self.next_delay_msec(rng)))
}
}
impl Default for RetryDelay {
fn default() -> Self {
RetryDelay::from_msec(0)
}
}
use tor_basic_utils::retry::RetryDelay;
/// Configuration for how many times to retry a download, with what
/// frequency.
......@@ -194,70 +95,31 @@ impl DownloadSchedule {
mod test {
use super::*;
#[test]
fn init() {
let rd = RetryDelay::from_msec(2000);
assert_eq!(rd.last_delay_ms, 0);
assert_eq!(rd.low_bound_ms, 2000);
let rd = RetryDelay::from_msec(0);
assert_eq!(rd.last_delay_ms, 0);
assert_eq!(rd.low_bound_ms, 1000);
let rd = RetryDelay::from_duration(Duration::new(1, 500_000_000));
assert_eq!(rd.last_delay_ms, 0);
assert_eq!(rd.low_bound_ms, 1500);
}
#[test]
fn bounds() {
let mut rd = RetryDelay::from_msec(1000);
assert_eq!(rd.delay_bounds(), (1000, 1001));
rd.last_delay_ms = 1500;
assert_eq!(rd.delay_bounds(), (1000, 4500));
rd.last_delay_ms = 3_000_000_000;
assert_eq!(rd.delay_bounds(), (1000, std::u32::MAX));
}
#[test]
fn rng() {
let mut rd = RetryDelay::from_msec(50);
let real_low_bound = std::cmp::max(50, MIN_LOW_BOUND);
let mut rng = rand::thread_rng();
for _ in 1..100 {
let (b_lo, b_hi) = rd.delay_bounds();
assert!(b_lo == real_low_bound);
assert!(b_hi > b_lo);
let delay = rd.next_delay(&mut rng).as_millis() as u32;
assert_eq!(delay, rd.last_delay_ms);
assert!(delay >= b_lo);
assert!(delay < b_hi);
}
}
#[test]
fn config() {
// default configuration is 3 tries, 1000 msec initial delay
let cfg = DownloadSchedule::default();
let one_sec = Duration::from_secs(1);
let zero_sec = Duration::from_secs(0);
let mut rng = rand::thread_rng();
assert_eq!(cfg.n_attempts(), 3);
let v: Vec<_> = cfg.attempts().collect();
assert_eq!(&v[..], &[0, 1, 2]);
let sched = cfg.schedule();
assert_eq!(sched.last_delay_ms, 0);
assert_eq!(sched.low_bound_ms, 1000);
assert_eq!(cfg.initial_delay, one_sec);
let mut sched = cfg.schedule();
assert_eq!(sched.next_delay(&mut rng), one_sec);
// Try a zero-attempt schedule, and have it get remapped to 1,1
let cfg = DownloadSchedule::new(0, Duration::new(0, 0), 0);
let cfg = DownloadSchedule::new(0, zero_sec, 0);
assert_eq!(cfg.n_attempts(), 1);
assert_eq!(cfg.parallelism(), 1);
let v: Vec<_> = cfg.attempts().collect();
assert_eq!(&v[..], &[0]);
let sched = cfg.schedule();
assert_eq!(sched.last_delay_ms, 0);
assert_eq!(sched.low_bound_ms, 1000);
assert_eq!(cfg.initial_delay, zero_sec);
let mut sched = cfg.schedule();
assert_eq!(sched.next_delay(&mut rng), one_sec);
}
}
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment