quiche/recovery/gcongestion/bbr2/
probe_bw.rs

1// Copyright (c) 2015 The Chromium Authors. All rights reserved.
2// Use of this source code is governed by a BSD-style license that can be
3// found in the LICENSE file.
4
5// Copyright (C) 2023, Cloudflare, Inc.
6// All rights reserved.
7//
8// Redistribution and use in source and binary forms, with or without
9// modification, are permitted provided that the following conditions are
10// met:
11//
12//     * Redistributions of source code must retain the above copyright notice,
13//       this list of conditions and the following disclaimer.
14//
15//     * Redistributions in binary form must reproduce the above copyright
16//       notice, this list of conditions and the following disclaimer in the
17//       documentation and/or other materials provided with the distribution.
18//
19// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS
20// IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
21// THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22// PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR
23// CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
24// EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
25// PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
26// PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
27// LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
28// NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
29// SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
30
31use std::ops::Add;
32use std::time::Duration;
33use std::time::Instant;
34
35use crate::recovery::gcongestion::Acked;
36use crate::recovery::gcongestion::Lost;
37
38use super::mode::Cycle;
39use super::mode::CyclePhase;
40use super::mode::Mode;
41use super::mode::ModeImpl;
42use super::network_model::BBRv2NetworkModel;
43use super::network_model::DEFAULT_MSS;
44use super::BBRv2CongestionEvent;
45use super::BwLoMode;
46use super::Limits;
47use super::PARAMS;
48
49#[derive(Debug)]
50pub(super) struct ProbeBW {
51    pub(super) model: BBRv2NetworkModel,
52    pub(super) cycle: Cycle,
53}
54
55#[derive(PartialEq, PartialOrd)]
56enum AdaptUpperBoundsResult {
57    AdaptedOk,
58    AdaptedProbedTooHigh,
59    NotAdaptedInflightHighNotSet,
60    NotAdaptedInvalidSample,
61}
62
63impl ModeImpl for ProbeBW {
64    fn enter(
65        &mut self, now: Instant, _congestion_event: Option<&BBRv2CongestionEvent>,
66    ) {
67        self.cycle.start_time = now;
68
69        match self.cycle.phase {
70            super::mode::CyclePhase::NotStarted => {
71                // First time entering PROBE_BW. Start a new probing cycle.
72                self.enter_probe_down(false, false, now)
73            },
74            super::mode::CyclePhase::Cruise => self.enter_probe_cruise(now),
75            super::mode::CyclePhase::Refill =>
76                self.enter_probe_refill(self.cycle.probe_up_rounds, now),
77            super::mode::CyclePhase::Up | super::mode::CyclePhase::Down => {},
78        }
79    }
80
81    fn on_congestion_event(
82        mut self, prior_in_flight: usize, event_time: Instant, _: &[Acked],
83        _: &[Lost], congestion_event: &mut BBRv2CongestionEvent,
84        target_bytes_inflight: usize,
85    ) -> Mode {
86        if congestion_event.end_of_round_trip {
87            if self.cycle.start_time != event_time {
88                self.cycle.rounds_since_probe += 1;
89            }
90
91            if self.cycle.phase_start_time != event_time {
92                self.cycle.rounds_in_phase += 1;
93            }
94        }
95
96        let mut switch_to_probe_rtt = false;
97
98        match self.cycle.phase {
99            CyclePhase::NotStarted => unreachable!(),
100            CyclePhase::Up => self.update_probe_up(
101                prior_in_flight,
102                target_bytes_inflight,
103                congestion_event,
104            ),
105            CyclePhase::Down => {
106                self.update_probe_down(target_bytes_inflight, congestion_event);
107                if self.cycle.phase != CyclePhase::Down &&
108                    self.model.maybe_expire_min_rtt(congestion_event)
109                {
110                    switch_to_probe_rtt = true;
111                }
112            },
113            CyclePhase::Cruise =>
114                self.update_probe_cruise(target_bytes_inflight, congestion_event),
115            CyclePhase::Refill =>
116                self.update_probe_refill(target_bytes_inflight, congestion_event),
117        }
118
119        // Do not need to set the gains if switching to PROBE_RTT, they will be
120        // set when `ProbeRTT::enter` is called.
121        if !switch_to_probe_rtt {
122            self.model.set_pacing_gain(self.cycle.phase.gain());
123            self.model.set_cwnd_gain(PARAMS.probe_bw_cwnd_gain);
124        }
125
126        if switch_to_probe_rtt {
127            self.into_probe_rtt(event_time, Some(congestion_event))
128        } else {
129            Mode::ProbeBW(self)
130        }
131    }
132
133    fn get_cwnd_limits(&self) -> Limits<usize> {
134        if self.cycle.phase == CyclePhase::Cruise {
135            let limit = self
136                .model
137                .inflight_lo()
138                .min(self.model.inflight_hi_with_headroom());
139            return Limits::no_greater_than(limit);
140        }
141
142        if self.cycle.phase == CyclePhase::Up &&
143            PARAMS.probe_up_ignore_inflight_hi
144        {
145            // Similar to STARTUP.
146            return Limits::no_greater_than(self.model.inflight_lo());
147        }
148
149        Limits::no_greater_than(
150            self.model.inflight_lo().min(self.model.inflight_hi()),
151        )
152    }
153
154    fn is_probing_for_bandwidth(&self) -> bool {
155        self.cycle.phase == CyclePhase::Refill ||
156            self.cycle.phase == CyclePhase::Up
157    }
158
159    fn on_exit_quiescence(
160        mut self, now: Instant, quiescence_start_time: Instant,
161    ) -> Mode {
162        self.model
163            .postpone_min_rtt_timestamp(now - quiescence_start_time);
164        Mode::ProbeBW(self)
165    }
166
167    fn leave(
168        &mut self, _now: Instant,
169        _congestion_event: Option<&BBRv2CongestionEvent>,
170    ) {
171    }
172}
173
174impl ProbeBW {
175    fn enter_probe_down(
176        &mut self, probed_too_high: bool, stopped_risky_probe: bool, now: Instant,
177    ) {
178        let cycle = &mut self.cycle;
179        cycle.last_cycle_probed_too_high = probed_too_high;
180        cycle.last_cycle_stopped_risky_probe = stopped_risky_probe;
181
182        cycle.phase = CyclePhase::Down;
183        cycle.start_time = now;
184        cycle.phase_start_time = now;
185        cycle.rounds_in_phase = 0;
186
187        if PARAMS.bw_lo_mode != BwLoMode::Default {
188            // Clear bandwidth lo if it was set in PROBE_UP, because losses in
189            // PROBE_UP should not permanently change bandwidth_lo.
190            // It's possible for bandwidth_lo to be set during REFILL, but if that
191            // was a valid value, it'll quickly be rediscovered.
192            self.model.clear_bandwidth_lo();
193        }
194
195        // Pick probe wait time.
196        // TODO(vlad): actually pick time
197        cycle.rounds_since_probe = 0;
198        cycle.probe_wait_time = Some(
199            PARAMS.probe_bw_probe_base_duration + Duration::from_micros(500),
200        );
201
202        cycle.probe_up_bytes = None;
203        cycle.probe_up_app_limited_since_inflight_hi_limited = false;
204        cycle.has_advanced_max_bw = false;
205        self.model.restart_round_early();
206    }
207
208    fn enter_probe_cruise(&mut self, now: Instant) {
209        if self.cycle.phase == CyclePhase::Down {
210            self.exit_probe_down();
211        }
212
213        let cycle = &mut self.cycle;
214
215        self.model.cap_inflight_lo(self.model.inflight_hi());
216        cycle.phase = CyclePhase::Cruise;
217        cycle.phase_start_time = now;
218        cycle.rounds_in_phase = 0;
219        cycle.is_sample_from_probing = false;
220    }
221
222    fn enter_probe_refill(&mut self, probe_up_rounds: usize, now: Instant) {
223        if self.cycle.phase == CyclePhase::Down {
224            self.exit_probe_down();
225        }
226
227        let cycle = &mut self.cycle;
228
229        cycle.phase = CyclePhase::Refill;
230        cycle.phase_start_time = now;
231        cycle.rounds_in_phase = 0;
232
233        cycle.is_sample_from_probing = false;
234        cycle.last_cycle_stopped_risky_probe = false;
235
236        self.model.clear_bandwidth_lo();
237        self.model.clear_inflight_lo();
238        cycle.probe_up_rounds = probe_up_rounds;
239        cycle.probe_up_acked = 0;
240        self.model.restart_round_early();
241    }
242
243    fn enter_probe_up(&mut self, now: Instant, cwnd: usize) {
244        let cycle = &mut self.cycle;
245
246        cycle.phase = CyclePhase::Up;
247        cycle.phase_start_time = now;
248        cycle.rounds_in_phase = 0;
249        cycle.is_sample_from_probing = true;
250        self.raise_inflight_high_slope(cwnd);
251        self.model.restart_round_early();
252    }
253
254    fn exit_probe_down(&mut self) {
255        if !self.cycle.has_advanced_max_bw {
256            self.model.advance_max_bandwidth_filter();
257            self.cycle.has_advanced_max_bw = true;
258        }
259    }
260
261    fn update_probe_down(
262        &mut self, target_bytes_inflight: usize,
263        congestion_event: &BBRv2CongestionEvent,
264    ) {
265        if self.cycle.rounds_in_phase == 1 && congestion_event.end_of_round_trip {
266            self.cycle.is_sample_from_probing = false;
267
268            if !congestion_event.last_packet_send_state.is_app_limited {
269                self.model.advance_max_bandwidth_filter();
270                self.cycle.has_advanced_max_bw = true;
271            }
272
273            if self.cycle.last_cycle_stopped_risky_probe &&
274                !self.cycle.last_cycle_probed_too_high
275            {
276                self.enter_probe_refill(0, congestion_event.event_time);
277                return;
278            }
279        }
280
281        self.maybe_adapt_upper_bounds(target_bytes_inflight, congestion_event);
282
283        if self
284            .is_time_to_probe_bandwidth(target_bytes_inflight, congestion_event)
285        {
286            self.enter_probe_refill(0, congestion_event.event_time);
287            return;
288        }
289
290        if self.has_stayed_long_enough_in_probe_down(congestion_event) {
291            self.enter_probe_cruise(congestion_event.event_time);
292            return;
293        }
294
295        let inflight_with_headroom = self.model.inflight_hi_with_headroom();
296        let bytes_in_flight = congestion_event.bytes_in_flight;
297
298        if bytes_in_flight > inflight_with_headroom {
299            // Stay in PROBE_DOWN.
300            return;
301        }
302
303        // Transition to PROBE_CRUISE iff we've drained to target.
304        let bdp = self.model.bdp0();
305
306        if bytes_in_flight < bdp {
307            self.enter_probe_cruise(congestion_event.event_time);
308        }
309    }
310
311    fn update_probe_cruise(
312        &mut self, target_bytes_inflight: usize,
313        congestion_event: &BBRv2CongestionEvent,
314    ) {
315        self.maybe_adapt_upper_bounds(target_bytes_inflight, congestion_event);
316
317        if self
318            .is_time_to_probe_bandwidth(target_bytes_inflight, congestion_event)
319        {
320            self.enter_probe_refill(0, congestion_event.event_time);
321        }
322    }
323
324    fn update_probe_refill(
325        &mut self, target_bytes_inflight: usize,
326        congestion_event: &BBRv2CongestionEvent,
327    ) {
328        self.maybe_adapt_upper_bounds(target_bytes_inflight, congestion_event);
329
330        if self.cycle.rounds_in_phase > 0 && congestion_event.end_of_round_trip {
331            self.enter_probe_up(
332                congestion_event.event_time,
333                congestion_event.prior_cwnd,
334            );
335        }
336    }
337
338    fn update_probe_up(
339        &mut self, prior_in_flight: usize, target_bytes_inflight: usize,
340        congestion_event: &BBRv2CongestionEvent,
341    ) {
342        if self.maybe_adapt_upper_bounds(target_bytes_inflight, congestion_event) ==
343            AdaptUpperBoundsResult::AdaptedProbedTooHigh
344        {
345            self.enter_probe_down(true, false, congestion_event.event_time);
346            return;
347        }
348
349        self.probe_inflight_high_upward(congestion_event);
350
351        let mut is_risky = false;
352        let mut is_queuing = false;
353        if self.cycle.last_cycle_probed_too_high &&
354            prior_in_flight >= self.model.inflight_hi()
355        {
356            is_risky = true;
357        } else if self.cycle.rounds_in_phase > 0 {
358            if PARAMS.max_probe_up_queue_rounds > 0 {
359                if congestion_event.end_of_round_trip {
360                    self.model.check_persistent_queue(PARAMS.full_bw_threshold);
361                    if self.model.rounds_with_queueing() >=
362                        PARAMS.max_probe_up_queue_rounds
363                    {
364                        is_queuing = true;
365                    }
366                }
367            } else {
368                let mut queuing_threshold_extra_bytes =
369                    self.model.queueing_threshold_extra_bytes();
370                if PARAMS.add_ack_height_to_queueing_threshold {
371                    queuing_threshold_extra_bytes += self.model.max_ack_height();
372                }
373                let queuing_threshold = (PARAMS.full_bw_threshold *
374                    self.model.bdp0() as f32)
375                    as usize +
376                    queuing_threshold_extra_bytes;
377
378                is_queuing =
379                    congestion_event.bytes_in_flight >= queuing_threshold;
380            }
381        }
382
383        if is_risky || is_queuing {
384            self.enter_probe_down(false, is_risky, congestion_event.event_time);
385        }
386    }
387
388    fn is_time_to_probe_bandwidth(
389        &self, target_bytes_inflight: usize,
390        congestion_event: &BBRv2CongestionEvent,
391    ) -> bool {
392        if self.has_cycle_lasted(
393            self.cycle.probe_wait_time.unwrap(),
394            congestion_event,
395        ) {
396            return true;
397        }
398
399        if self.is_time_to_probe_for_reno_coexistence(
400            target_bytes_inflight,
401            1.0,
402            congestion_event,
403        ) {
404            return true;
405        }
406
407        false
408    }
409
410    fn maybe_adapt_upper_bounds(
411        &mut self, target_bytes_inflight: usize,
412        congestion_event: &BBRv2CongestionEvent,
413    ) -> AdaptUpperBoundsResult {
414        let send_state = congestion_event.last_packet_send_state;
415
416        if !send_state.is_valid {
417            return AdaptUpperBoundsResult::NotAdaptedInvalidSample;
418        }
419
420        // TODO(vlad): use BytesInFlight?
421        let mut inflight_at_send = send_state.bytes_in_flight;
422        if PARAMS.use_bytes_delivered_for_inflight_hi {
423            inflight_at_send = self.model.total_bytes_acked() -
424                congestion_event.last_packet_send_state.total_bytes_acked;
425        }
426
427        if self.cycle.is_sample_from_probing {
428            if self.model.is_inflight_too_high(
429                congestion_event,
430                PARAMS.probe_bw_full_loss_count,
431            ) {
432                self.cycle.is_sample_from_probing = false;
433                if !send_state.is_app_limited ||
434                    PARAMS.max_probe_up_queue_rounds > 0
435                {
436                    let inflight_target = (target_bytes_inflight as f32 *
437                        (1.0 - PARAMS.beta))
438                        as usize;
439
440                    let mut new_inflight_hi =
441                        inflight_at_send.max(inflight_target);
442
443                    if PARAMS.limit_inflight_hi_by_max_delivered {
444                        new_inflight_hi = self
445                            .model
446                            .max_bytes_delivered_in_round()
447                            .max(new_inflight_hi);
448                    }
449
450                    self.model.set_inflight_hi(new_inflight_hi);
451                }
452                return AdaptUpperBoundsResult::AdaptedProbedTooHigh;
453            }
454            return AdaptUpperBoundsResult::AdaptedOk;
455        }
456
457        if self.model.inflight_hi() == self.model.inflight_hi_default() {
458            return AdaptUpperBoundsResult::NotAdaptedInflightHighNotSet;
459        }
460
461        // Raise the upper bound for inflight.
462        if inflight_at_send > self.model.inflight_hi() {
463            self.model.set_inflight_hi(inflight_at_send);
464        }
465
466        AdaptUpperBoundsResult::AdaptedOk
467    }
468
469    fn has_cycle_lasted(
470        &self, duration: Duration, congestion_event: &BBRv2CongestionEvent,
471    ) -> bool {
472        (congestion_event.event_time - self.cycle.start_time) > duration
473    }
474
475    fn has_phase_lasted(
476        &self, duration: Duration, congestion_event: &BBRv2CongestionEvent,
477    ) -> bool {
478        (congestion_event.event_time - self.cycle.phase_start_time) > duration
479    }
480
481    fn is_time_to_probe_for_reno_coexistence(
482        &self, target_bytes_inflight: usize, probe_wait_fraction: f64,
483        _congestion_event: &BBRv2CongestionEvent,
484    ) -> bool {
485        if !PARAMS.enable_reno_coexistence {
486            return false;
487        }
488
489        let mut rounds = PARAMS.probe_bw_probe_max_rounds;
490        if PARAMS.probe_bw_probe_reno_gain > 0.0 {
491            let reno_rounds = (PARAMS.probe_bw_probe_reno_gain *
492                target_bytes_inflight as f32 /
493                DEFAULT_MSS as f32) as usize;
494            rounds = reno_rounds.min(rounds);
495        }
496
497        self.cycle.rounds_since_probe >=
498            (rounds as f64 * probe_wait_fraction) as usize
499    }
500
501    // Used to prevent a BBR2 flow from staying in PROBE_DOWN for too
502    // long, as seen in some multi-sender simulator tests.
503    fn has_stayed_long_enough_in_probe_down(
504        &self, congestion_event: &BBRv2CongestionEvent,
505    ) -> bool {
506        // Stay in PROBE_DOWN for at most the time of a min rtt, as it is done in
507        // BBRv1.
508        self.has_phase_lasted(self.model.min_rtt(), congestion_event)
509    }
510
511    fn raise_inflight_high_slope(&mut self, cwnd: usize) {
512        let growth_this_round = 1usize << self.cycle.probe_up_rounds;
513        // The number 30 below means `growth_this_round` is capped at 1G and the
514        // lower bound of `probe_up_bytes` is (practically) 1 mss, at this
515        // speed `inflight_hi`` grows by approximately 1 packet per packet acked.
516        self.cycle.probe_up_rounds = self.cycle.probe_up_rounds.add(1).min(30);
517        let probe_up_bytes = cwnd / growth_this_round;
518        self.cycle.probe_up_bytes = Some(probe_up_bytes.max(DEFAULT_MSS));
519    }
520
521    fn probe_inflight_high_upward(
522        &mut self, congestion_event: &BBRv2CongestionEvent,
523    ) {
524        if PARAMS.probe_up_ignore_inflight_hi {
525            // When inflight_hi is disabled in PROBE_UP, it increases when
526            // the number of bytes delivered in a round is larger inflight_hi.
527            return;
528        } else {
529            // TODO(vlad): probe_up_simplify_inflight_hi?
530            if congestion_event.prior_bytes_in_flight <
531                congestion_event.prior_cwnd
532            {
533                // Not fully utilizing cwnd, so can't safely grow.
534                return;
535            }
536
537            if congestion_event.prior_cwnd < self.model.inflight_hi() {
538                // Not fully using inflight_hi, so don't grow it.
539                return;
540            }
541
542            self.cycle.probe_up_acked += congestion_event.bytes_acked;
543        }
544
545        if let Some(probe_up_bytes) = self.cycle.probe_up_bytes.as_mut() {
546            if self.cycle.probe_up_acked >= *probe_up_bytes {
547                let delta = self.cycle.probe_up_acked / *probe_up_bytes;
548                self.cycle.probe_up_acked -= *probe_up_bytes;
549                let new_inflight_hi =
550                    self.model.inflight_hi() + delta * DEFAULT_MSS;
551                if new_inflight_hi > self.model.inflight_hi() {
552                    self.model.set_inflight_hi(new_inflight_hi);
553                }
554            }
555        }
556
557        if congestion_event.end_of_round_trip {
558            self.raise_inflight_high_slope(congestion_event.prior_cwnd);
559        }
560    }
561
562    fn into_probe_rtt(
563        mut self, now: Instant, congestion_event: Option<&BBRv2CongestionEvent>,
564    ) -> Mode {
565        self.leave(now, congestion_event);
566        let mut next_mode = Mode::probe_rtt(self.model, self.cycle);
567        next_mode.enter(now, congestion_event);
568        next_mode
569    }
570}