Document functions and constants.

This commit is contained in:
Mike Perry 2009-09-08 01:31:29 -07:00
parent c9363df09f
commit 67cee75ca2
2 changed files with 123 additions and 31 deletions

View File

@ -112,7 +112,12 @@ circuitbuild_running_unit_tests(void)
unit_tests = 1; unit_tests = 1;
} }
/** DOCDOC */ /**
* Reset the build time state.
*
* Leave estimated paramters, timeout, and network liveness in tact
* for future use.
*/
void void
circuit_build_times_reset(circuit_build_times_t *cbt) circuit_build_times_reset(circuit_build_times_t *cbt)
{ {
@ -120,10 +125,15 @@ circuit_build_times_reset(circuit_build_times_t *cbt)
cbt->pre_timeouts = 0; cbt->pre_timeouts = 0;
cbt->total_build_times = 0; cbt->total_build_times = 0;
cbt->build_times_idx = 0; cbt->build_times_idx = 0;
cbt->computed = 0; cbt->have_computed_timeout = 0;
} }
/** DOCDOC */ /**
* Initialize the buildtimes structure for first use.
*
* Sets the initial timeout value based to either the
* config setting or BUILD_TIMEOUT_INITIAL_VALUE.
*/
void void
circuit_build_times_init(circuit_build_times_t *cbt) circuit_build_times_init(circuit_build_times_t *cbt)
{ {
@ -137,10 +147,11 @@ circuit_build_times_init(circuit_build_times_t *cbt)
} }
/** /**
* circuit_build_times is a circular array, so loop around when * Add a timeoutout value to the set of build times. Time units
* array is full * are milliseconds
* *
* time units are milliseconds * circuit_build_times is a circular array, so loop around when
* array is full.
*/ */
int int
circuit_build_times_add_time(circuit_build_times_t *cbt, build_time_t time) circuit_build_times_add_time(circuit_build_times_t *cbt, build_time_t time)
@ -169,7 +180,7 @@ circuit_build_times_add_time(circuit_build_times_t *cbt, build_time_t time)
} }
/** /**
* Find maximum circuit build time * Return maximum circuit build time
*/ */
static build_time_t static build_time_t
circuit_build_times_max(circuit_build_times_t *cbt) circuit_build_times_max(circuit_build_times_t *cbt)
@ -183,7 +194,7 @@ circuit_build_times_max(circuit_build_times_t *cbt)
return max_build_time; return max_build_time;
} }
/** DOCDOC */ /** Return minimum circuit build time */
static build_time_t static build_time_t
circuit_build_times_min(circuit_build_times_t *cbt) circuit_build_times_min(circuit_build_times_t *cbt)
{ {
@ -201,7 +212,13 @@ circuit_build_times_min(circuit_build_times_t *cbt)
} }
/** /**
* Calculate histogram * Calculate and return a histogram for the set of build times.
*
* Returns an allocated array of histrogram bins representing
* the frequency of index*BUILDTIME_BIN_WIDTH millisecond
* build times. Also outputs the number of bins in nbins.
*
* The return value must be freed by the caller.
*/ */
static uint32_t * static uint32_t *
circuit_build_times_create_histogram(circuit_build_times_t *cbt, circuit_build_times_create_histogram(circuit_build_times_t *cbt,
@ -225,7 +242,11 @@ circuit_build_times_create_histogram(circuit_build_times_t *cbt,
return histogram; return histogram;
} }
/** DOCDOC */ /**
* Return the most frequent build time (rounded to BUILDTIME_BIN_WIDTH ms).
*
* Ties go in favor of the slower time.
*/
static build_time_t static build_time_t
circuit_build_times_mode(circuit_build_times_t *cbt) circuit_build_times_mode(circuit_build_times_t *cbt)
{ {
@ -244,7 +265,8 @@ circuit_build_times_mode(circuit_build_times_t *cbt)
} }
/** /**
* output a histogram of current circuit build times. * Output a histogram of current circuit build times to
* the or_state_t state structure.
*/ */
void void
circuit_build_times_update_state(circuit_build_times_t *cbt, circuit_build_times_update_state(circuit_build_times_t *cbt,
@ -282,7 +304,11 @@ circuit_build_times_update_state(circuit_build_times_t *cbt,
if (histogram) tor_free(histogram); if (histogram) tor_free(histogram);
} }
/* Stolen from http://en.wikipedia.org/wiki/Fisher\u2013Yates_shuffle */ /**
* Shuffle the build times array.
*
* Stolen from http://en.wikipedia.org/wiki/Fisher\u2013Yates_shuffle
*/
static void static void
circuit_build_times_shuffle_array(circuit_build_times_t *cbt) circuit_build_times_shuffle_array(circuit_build_times_t *cbt)
{ {
@ -298,7 +324,13 @@ circuit_build_times_shuffle_array(circuit_build_times_t *cbt)
} }
} }
/** Load histogram from <b>state</b>. DOCDOC what else? */ /**
* Load histogram from <b>state</b>, shuffling the resulting array
* after we do so. Use this result to estimate parameters and
* calculate the timeout.
*
* Returns -1 and sets msg on error. Msg must be freed by the caller.
*/
int int
circuit_build_times_parse_state(circuit_build_times_t *cbt, circuit_build_times_parse_state(circuit_build_times_t *cbt,
or_state_t *state, char **msg) or_state_t *state, char **msg)
@ -368,7 +400,15 @@ circuit_build_times_parse_state(circuit_build_times_t *cbt,
return msg ? -1 : 0; return msg ? -1 : 0;
} }
/** DOCDOC */ /**
* Estimates the Xm and Alpha parameters using
* http://en.wikipedia.org/wiki/Pareto_distribution#Parameter_estimation
*
* The notable difference is that we use mode instead of min to estimate Xm.
* This is because our distribution is frechet-like. We claim this is
* an acceptable approximation because we are only concerned with the
* accuracy of the CDF of the tail.
*/
void void
circuit_build_times_update_alpha(circuit_build_times_t *cbt) circuit_build_times_update_alpha(circuit_build_times_t *cbt)
{ {
@ -407,8 +447,8 @@ circuit_build_times_update_alpha(circuit_build_times_t *cbt)
* in the distribution such that F(x) = quantile (ie quantile*100% * in the distribution such that F(x) = quantile (ie quantile*100%
* of the mass of the density function is below x on the curve). * of the mass of the density function is below x on the curve).
* *
* We use it to calculate the timeout and also synthetic values of * We use it to calculate the timeout and also to generate synthetic
* time for circuits that timeout before completion. * values of time for circuits that timeout before completion.
* *
* See http://en.wikipedia.org/wiki/Quantile_function, * See http://en.wikipedia.org/wiki/Quantile_function,
* http://en.wikipedia.org/wiki/Inverse_transform_sampling and * http://en.wikipedia.org/wiki/Inverse_transform_sampling and
@ -428,7 +468,7 @@ circuit_build_times_calculate_timeout(circuit_build_times_t *cbt,
return ret; return ret;
} }
/* Pareto CDF */ /** Pareto CDF */
double double
circuit_build_times_cdf(circuit_build_times_t *cbt, double x) circuit_build_times_cdf(circuit_build_times_t *cbt, double x)
{ {
@ -437,6 +477,12 @@ circuit_build_times_cdf(circuit_build_times_t *cbt, double x)
return ret; return ret;
} }
/**
* Generate a synthetic time using our distribution parameters.
*
* The return value will be between q_lo and q_hi quantile points
* on the CDF.
*/
build_time_t build_time_t
circuit_build_times_generate_sample(circuit_build_times_t *cbt, circuit_build_times_generate_sample(circuit_build_times_t *cbt,
double q_lo, double q_hi) double q_lo, double q_hi)
@ -451,12 +497,12 @@ circuit_build_times_generate_sample(circuit_build_times_t *cbt,
return ret; return ret;
} }
/** Generate points in [cutoff, 1.0) on the CDF. */
void void
circuit_build_times_add_timeout_worker(circuit_build_times_t *cbt, circuit_build_times_add_timeout_worker(circuit_build_times_t *cbt,
double quantile_cutoff) double quantile_cutoff)
{ {
/* Generate points in [cutoff, 1.0) on the CDF... We want to /* We want to stay a bit short of 1.0, because longtail is
* stay a bit short of 1.0 though, because longtail is
* loooooooooooooooooooooooooooooooooooooooooooooooooooong */ * loooooooooooooooooooooooooooooooooooooooooooooooooooong */
build_time_t gentime = circuit_build_times_generate_sample(cbt, build_time_t gentime = circuit_build_times_generate_sample(cbt,
quantile_cutoff, 0.98); quantile_cutoff, 0.98);
@ -478,6 +524,10 @@ circuit_build_times_add_timeout_worker(circuit_build_times_t *cbt,
circuit_build_times_add_time(cbt, gentime); circuit_build_times_add_time(cbt, gentime);
} }
/**
* Estimate an initial alpha parameter by solving the quantile
* function with a quantile point and a specific timeout value.
*/
void void
circuit_build_times_initial_alpha(circuit_build_times_t *cbt, circuit_build_times_initial_alpha(circuit_build_times_t *cbt,
double quantile, build_time_t timeout) double quantile, build_time_t timeout)
@ -491,6 +541,10 @@ circuit_build_times_initial_alpha(circuit_build_times_t *cbt,
cbt->alpha = ln(1.0-quantile)/(ln(cbt->Xm)-ln(timeout)); cbt->alpha = ln(1.0-quantile)/(ln(cbt->Xm)-ln(timeout));
} }
/**
* Generate synthetic timeout values for the timeouts
* that have happened before we estimated our parameters.
*/
static void static void
circuit_build_times_count_pretimeouts(circuit_build_times_t *cbt) circuit_build_times_count_pretimeouts(circuit_build_times_t *cbt)
{ {
@ -521,6 +575,10 @@ circuit_build_times_needs_circuits(circuit_build_times_t *cbt)
return 0; return 0;
} }
/**
* Returns true if we should build a timeout test circuit
* right now.
*/
int int
circuit_build_times_needs_circuits_now(circuit_build_times_t *cbt) circuit_build_times_needs_circuits_now(circuit_build_times_t *cbt)
{ {
@ -528,12 +586,19 @@ circuit_build_times_needs_circuits_now(circuit_build_times_t *cbt)
approx_time()-cbt->last_circ_at > BUILD_TIMES_TEST_FREQUENCY; approx_time()-cbt->last_circ_at > BUILD_TIMES_TEST_FREQUENCY;
} }
/**
* Called to indicate that the network showed some signs of liveness.
*/
void void
circuit_build_times_network_is_live(circuit_build_times_t *cbt) circuit_build_times_network_is_live(circuit_build_times_t *cbt)
{ {
cbt->network_last_live = approx_time(); cbt->network_last_live = approx_time();
} }
/**
* Returns true if the network showed some sign of liveness
* in the past NETWORK_LIVE_INTERVAL.
*/
int int
circuit_build_times_is_network_live(circuit_build_times_t *cbt) circuit_build_times_is_network_live(circuit_build_times_t *cbt)
{ {
@ -546,6 +611,15 @@ circuit_build_times_is_network_live(circuit_build_times_t *cbt)
return 1; return 1;
} }
/**
* Returns true if we have seen more than MAX_RECENT_TIMEOUT_RATE of
* the past RECENT_CIRCUITS time out. Used to detect if the network
* connection has changed significantly.
*
* Also resets the entire timeout history in this case and causes us
* to restart the process of building test circuits and estimating a
* new timeout.
*/
int int
circuit_build_times_check_too_many_timeouts(circuit_build_times_t *cbt) circuit_build_times_check_too_many_timeouts(circuit_build_times_t *cbt)
{ {
@ -631,7 +705,7 @@ circuit_build_times_add_timeout(circuit_build_times_t *cbt)
return; return;
} }
if (!cbt->computed) { if (!cbt->have_computed_timeout) {
/* Store a timeout before we have enough data as special */ /* Store a timeout before we have enough data as special */
cbt->pre_timeouts++; cbt->pre_timeouts++;
return; return;
@ -641,6 +715,10 @@ circuit_build_times_add_timeout(circuit_build_times_t *cbt)
circuit_build_times_add_timeout_worker(cbt, BUILDTIMEOUT_QUANTILE_CUTOFF); circuit_build_times_add_timeout_worker(cbt, BUILDTIMEOUT_QUANTILE_CUTOFF);
} }
/**
* Estimate a new timeout based on history and set our timeout
* variable accordingly.
*/
void void
circuit_build_times_set_timeout(circuit_build_times_t *cbt) circuit_build_times_set_timeout(circuit_build_times_t *cbt)
{ {
@ -659,7 +737,7 @@ circuit_build_times_set_timeout(circuit_build_times_t *cbt)
timeout = circuit_build_times_calculate_timeout(cbt, timeout = circuit_build_times_calculate_timeout(cbt,
BUILDTIMEOUT_QUANTILE_CUTOFF); BUILDTIMEOUT_QUANTILE_CUTOFF);
cbt->computed = 1; cbt->have_computed_timeout = 1;
cbt->timeout = lround(timeout/1000.0); cbt->timeout = lround(timeout/1000.0);
log_info(LD_CIRC, log_info(LD_CIRC,

View File

@ -2858,29 +2858,43 @@ void bridges_retry_all(void);
void entry_guards_free_all(void); void entry_guards_free_all(void);
/* Circuit Build Timeout "public" functions and structures. */ /* Circuit Build Timeout "public" functions and structures. */
#define RECENT_CIRCUITS 20
#define MIN_CIRCUITS_TO_OBSERVE 500
#define NCIRCUITS_TO_OBSERVE 5000 /* approx 1.5 weeks worth of circuits */
#define BUILDTIME_BIN_WIDTH 50
/** How many circuits count as recent when deciding if the
* connection has changed. */
#define RECENT_CIRCUITS 20
/** Maximum fraction of timeouts to tolerate in the past
* RECENT_CIRCUITS before calculating a new timeout */
#define MAX_RECENT_TIMEOUT_RATE 0.7999999 #define MAX_RECENT_TIMEOUT_RATE 0.7999999
/* TODO: This should be moved to the consensus */ /** Minimum circuits before estimating a timeout */
#define MIN_CIRCUITS_TO_OBSERVE 500
/** Total size of the circuit timeout history to accumulate.
* 5000 is approx 1.5 weeks worth of continual-use circuits. */
#define NCIRCUITS_TO_OBSERVE 5000
/** Width of the histogram bins in milliseconds */
#define BUILDTIME_BIN_WIDTH 50
/** Cuttof point on the CDF for our timeout estimation.
* TODO: This should be moved to the consensus */
#define BUILDTIMEOUT_QUANTILE_CUTOFF 0.8 #define BUILDTIMEOUT_QUANTILE_CUTOFF 0.8
typedef uint32_t build_time_t; typedef uint32_t build_time_t;
#define BUILD_TIME_MAX ((build_time_t)(INT32_MAX)) #define BUILD_TIME_MAX ((build_time_t)(INT32_MAX))
/* Have we received a cell in the last 90 seconds? */ /** Have we received a cell in the last 90 seconds? */
#define NETWORK_LIVE_INTERVAL 90 #define NETWORK_LIVE_INTERVAL 90
/** Initial circuit build timeout */
#define BUILD_TIMEOUT_INITIAL_VALUE 60 #define BUILD_TIMEOUT_INITIAL_VALUE 60
/* How often in seconds should we build a test circuit */ /** How often in seconds should we build a test circuit */
#define BUILD_TIMES_TEST_FREQUENCY 60 #define BUILD_TIMES_TEST_FREQUENCY 60
/* Save state every 5 circuits */ /** Save state every 10 circuits */
#define BUILD_TIMES_SAVE_STATE_EVERY 5 #define BUILD_TIMES_SAVE_STATE_EVERY 10
typedef struct { typedef struct {
build_time_t circuit_build_times[NCIRCUITS_TO_OBSERVE]; build_time_t circuit_build_times[NCIRCUITS_TO_OBSERVE];
@ -2891,7 +2905,7 @@ typedef struct {
int pre_timeouts; int pre_timeouts;
build_time_t Xm; build_time_t Xm;
double alpha; double alpha;
int computed; int have_computed_timeout;
int timeout; int timeout;
} circuit_build_times_t; } circuit_build_times_t;