curl/lib/ratelimit.c
Stefan Eissing 1a57302d1a
ratelimit: download finetune
When a download size is known and rate limiting is in effect, adjust the
duration of each measurement step and its rate for maximum precision.

Since it is unpredictable how long the last bytes of a download will
take, download speed can be thrown off if the "last bytes" are a
significant amount of the total download. Make the "last bytes" small in
comparision to the rest and "stretch" the rate limit intervals to
accommodate the difference.

Fix ngtcp2 receive data acknowldgements to be based on a local window
size tracking. This allows window updates controlled by rate limits.

Fix ratelimit wait time calculation to accomodate negative tokens.

h3 rate limit, update timeers

Make download rate limits work correctly in ngtcp2. Fix multi handling
of rate limits to set a timer for when limits will update again.

Without running the transfer on limit updates, protocols like h2/h3 may
stall if the server does not send due to stream windows being too small.

scorecard: measure download speedlimits

When running scorecard with --limit-rate=n, show the reported download
speed averages plus percentage deviation from the limit.

Closes #20228
2026-01-16 16:42:31 +01:00

290 lines
8.5 KiB
C

/***************************************************************************
* _ _ ____ _
* Project ___| | | | _ \| |
* / __| | | | |_) | |
* | (__| |_| | _ <| |___
* \___|\___/|_| \_\_____|
*
* Copyright (C) Daniel Stenberg, <daniel@haxx.se>, et al.
*
* This software is licensed as described in the file COPYING, which
* you should have received as part of this distribution. The terms
* are also available at https://curl.se/docs/copyright.html.
*
* You may opt to use, copy, modify, merge, publish, distribute and/or sell
* copies of the Software, and permit persons to whom the Software is
* furnished to do so, under the terms of the COPYING file.
*
* This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
* KIND, either express or implied.
*
* SPDX-License-Identifier: curl
*
***************************************************************************/
#include "curl_setup.h"
#include "urldata.h"
#include "curl_trc.h"
#include "progress.h"
#include "ratelimit.h"
#define CURL_US_PER_SEC 1000000
#define CURL_RLIMIT_MIN_RATE (4 * 1024) /* minimum step rate */
#define CURL_RLIMIT_STEP_MIN_MS 2 /* minimum step duration */
static void rlimit_update(struct Curl_rlimit *r,
const struct curltime *pts)
{
timediff_t elapsed_us, elapsed_steps;
int64_t token_gain;
DEBUGASSERT(r->rate_per_step);
if((r->ts.tv_sec == pts->tv_sec) && (r->ts.tv_usec == pts->tv_usec))
return;
elapsed_us = curlx_ptimediff_us(pts, &r->ts);
if(elapsed_us < 0) { /* not going back in time */
DEBUGASSERT(0);
return;
}
elapsed_us += r->spare_us;
if(elapsed_us < r->step_us)
return;
/* we do the update */
r->ts = *pts;
elapsed_steps = elapsed_us / r->step_us;
r->spare_us = elapsed_us % r->step_us;
/* How many tokens did we gain since the last update? */
if(r->rate_per_step > (INT64_MAX / elapsed_steps))
token_gain = INT64_MAX;
else {
token_gain = r->rate_per_step * elapsed_steps;
}
if((INT64_MAX - token_gain) > r->tokens)
r->tokens += token_gain;
else
r->tokens = INT64_MAX;
/* Limit the token again by the burst rate (if set), so we
* do not suddenly have a huge number of tokens after inactivity. */
if(r->burst_per_step && (r->tokens > r->burst_per_step)) {
r->tokens = r->burst_per_step;
}
}
static void rlimit_tune_steps(struct Curl_rlimit *r,
int64_t tokens_total)
{
int64_t tokens_last, tokens_main, msteps;
/* Tune the ratelimit at the start *if* we know how many tokens
* are expected to be consumed in total.
* The reason for tuning is that rlimit provides tokens to be consumed
* per "step" which starts out to be a second. The tokens may be consumed
* in full at the beginning of a step. The remainder of the second will
* have no tokens available, effectively blocking the consumption and
* so keeping the "step average" in line.
* This works will up to the last step. When no more tokens are needed,
* no wait will happen and the last step would be too fast. This is
* especially noticeable when only a few steps are needed.
*
* Example: downloading 1.5kb with a ratelimit of 1k could be done in
* roughly 1 second (1k in the first second and the 0.5 at the start of
* the second one).
*
* The tuning tries to make the last step small, using only
* 1 percent of the total tokens (at least 1). The rest of the tokens
* are to be consumed in the steps before by adjusting the duration of
* the step and the amount of tokens it provides. */
if(!r->rate_per_step ||
(tokens_total <= 1) ||
(tokens_total > (INT64_MAX / 1000)))
return;
/* Calculate tokens for the last step and the ones before. */
tokens_last = tokens_total / 100;
if(!tokens_last) /* less than 100 total, just use 1 */
tokens_last = 1;
else if(tokens_last > CURL_RLIMIT_MIN_RATE)
tokens_last = CURL_RLIMIT_MIN_RATE;
DEBUGASSERT(tokens_last);
tokens_main = tokens_total - tokens_last;
DEBUGASSERT(tokens_main);
/* how many milli-steps will it take to consume those, give the
* original rate limit per second? */
DEBUGASSERT(r->step_us == CURL_US_PER_SEC);
msteps = (tokens_main * 1000 / r->rate_per_step);
if(msteps < CURL_RLIMIT_STEP_MIN_MS) {
/* Steps this small will not work. Do not tune. */
return;
}
else if(msteps < 1000) {
/* It needs less than one step to provide the needed tokens.
* Make it exactly that long and with exactly those tokens. */
r->step_us = (timediff_t)msteps * 1000;
r->rate_per_step = tokens_main;
r->tokens = r->rate_per_step;
}
else {
/* More than 1 step. Spread the remainder milli steps and
* the tokens they need to provide across all steps. If integer
* arithmetic can do it. */
curl_off_t ms_unaccounted = (msteps % 1000);
curl_off_t mstep_inc = (ms_unaccounted / (msteps / 1000));
if(mstep_inc) {
curl_off_t rate_inc = ((r->rate_per_step * mstep_inc) / 1000);
if(rate_inc) {
r->step_us = CURL_US_PER_SEC + ((timediff_t)mstep_inc * 1000);
r->rate_per_step += rate_inc;
r->tokens = r->rate_per_step;
}
}
}
if(r->burst_per_step)
r->burst_per_step = r->rate_per_step;
}
void Curl_rlimit_init(struct Curl_rlimit *r,
int64_t rate_per_sec,
int64_t burst_per_sec,
const struct curltime *pts)
{
DEBUGASSERT(rate_per_sec >= 0);
DEBUGASSERT(burst_per_sec >= rate_per_sec || !burst_per_sec);
DEBUGASSERT(pts);
r->rate_per_step = rate_per_sec;
r->burst_per_step = burst_per_sec;
r->step_us = CURL_US_PER_SEC;
r->spare_us = 0;
r->tokens = r->rate_per_step;
r->ts = *pts;
r->blocked = FALSE;
}
void Curl_rlimit_start(struct Curl_rlimit *r, const struct curltime *pts,
int64_t total_tokens)
{
r->tokens = r->rate_per_step;
r->spare_us = 0;
r->ts = *pts;
rlimit_tune_steps(r, total_tokens);
}
int64_t Curl_rlimit_per_step(struct Curl_rlimit *r)
{
return r->rate_per_step;
}
bool Curl_rlimit_active(struct Curl_rlimit *r)
{
return (r->rate_per_step > 0) || r->blocked;
}
bool Curl_rlimit_is_blocked(struct Curl_rlimit *r)
{
return r->blocked;
}
int64_t Curl_rlimit_avail(struct Curl_rlimit *r,
const struct curltime *pts)
{
if(r->blocked)
return 0;
else if(r->rate_per_step) {
rlimit_update(r, pts);
return r->tokens;
}
else
return INT64_MAX;
}
void Curl_rlimit_drain(struct Curl_rlimit *r,
size_t tokens,
const struct curltime *pts)
{
if(r->blocked || !r->rate_per_step)
return;
rlimit_update(r, pts);
#if 8 <= SIZEOF_SIZE_T
if(tokens > INT64_MAX) {
r->tokens = INT64_MAX;
}
else
#endif
{
int64_t val = (int64_t)tokens;
if((INT64_MIN + val) < r->tokens)
r->tokens -= val;
else
r->tokens = INT64_MIN;
}
}
timediff_t Curl_rlimit_wait_ms(struct Curl_rlimit *r,
const struct curltime *pts)
{
timediff_t wait_us, elapsed_us;
if(r->blocked || !r->rate_per_step)
return 0;
rlimit_update(r, pts);
if(r->tokens > 0)
return 0;
/* How much time will it take tokens to become positive again?
* Deduct `spare_us` and check against already elapsed time */
wait_us = r->step_us - r->spare_us;
if(r->tokens < 0) {
curl_off_t debt_pct = ((-r->tokens) * 100 / r->rate_per_step);
if(debt_pct)
wait_us += (r->step_us * debt_pct / 100);
}
elapsed_us = curlx_ptimediff_us(pts, &r->ts);
if(elapsed_us >= wait_us)
return 0;
wait_us -= elapsed_us;
return (wait_us + 999) / 1000; /* in milliseconds */
}
timediff_t Curl_rlimit_next_step_ms(struct Curl_rlimit *r,
const struct curltime *pts)
{
if(!r->blocked && r->rate_per_step) {
timediff_t elapsed_us, next_us;
elapsed_us = curlx_ptimediff_us(pts, &r->ts) + r->spare_us;
if(r->step_us > elapsed_us) {
next_us = r->step_us - elapsed_us;
return (next_us + 999) / 1000; /* in milliseconds */
}
}
return 0;
}
void Curl_rlimit_block(struct Curl_rlimit *r,
bool activate,
const struct curltime *pts)
{
if(!activate == !r->blocked)
return;
r->ts = *pts;
r->blocked = activate;
if(!r->blocked) {
/* Start rate limiting fresh. The amount of time this was blocked
* does not generate extra tokens. */
Curl_rlimit_start(r, pts, -1);
}
else {
r->tokens = 0;
}
}