Improve documentation
This commit is contained in:
parent
ed4c11e31d
commit
334d8ae9cd
@ -2,18 +2,23 @@ use core;
|
|||||||
|
|
||||||
use conv::ApproxFrom;
|
use conv::ApproxFrom;
|
||||||
|
|
||||||
/// Represent the arithmetic mean and the variance of a sequence of numbers.
|
/// Estimate the arithmetic mean and the variance of a sequence of numbers
|
||||||
|
/// ("population").
|
||||||
|
///
|
||||||
|
/// This can be used to estimate the standard error of the mean.
|
||||||
///
|
///
|
||||||
/// Everything is calculated iteratively using constant memory, so the sequence
|
/// Everything is calculated iteratively using constant memory, so the sequence
|
||||||
/// of numbers can be an iterator. The used algorithms try to avoid numerical
|
/// of numbers can be an iterator. The used algorithms try to avoid numerical
|
||||||
/// instabilities.
|
/// instabilities.
|
||||||
///
|
///
|
||||||
|
///
|
||||||
|
/// ## Example
|
||||||
|
///
|
||||||
/// ```
|
/// ```
|
||||||
/// use average::Average;
|
/// use average::Average;
|
||||||
///
|
///
|
||||||
/// let a: Average = (1..6).map(Into::into).collect();
|
/// let a: Average = (1..6).map(Into::into).collect();
|
||||||
/// assert_eq!(a.mean(), 3.0);
|
/// println!("The average is {} ± {}.", a.mean(), a.error());
|
||||||
/// assert_eq!(a.sample_variance(), 2.5);
|
|
||||||
/// ```
|
/// ```
|
||||||
#[derive(Debug, Clone)]
|
#[derive(Debug, Clone)]
|
||||||
pub struct Average {
|
pub struct Average {
|
||||||
@ -26,12 +31,12 @@ pub struct Average {
|
|||||||
}
|
}
|
||||||
|
|
||||||
impl Average {
|
impl Average {
|
||||||
/// Create a new average.
|
/// Create a new average estimator.
|
||||||
pub fn new() -> Average {
|
pub fn new() -> Average {
|
||||||
Average { avg: 0., n: 0, v: 0. }
|
Average { avg: 0., n: 0, v: 0. }
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Add a sample to the sequence of which the average is calculated.
|
/// Add an element sampled from the population.
|
||||||
pub fn add(&mut self, sample: f64) {
|
pub fn add(&mut self, sample: f64) {
|
||||||
// This algorithm introduced by Welford in 1962 trades numerical
|
// This algorithm introduced by Welford in 1962 trades numerical
|
||||||
// stability for a division inside the loop.
|
// stability for a division inside the loop.
|
||||||
@ -43,24 +48,24 @@ impl Average {
|
|||||||
self.v += delta * (sample - self.avg);
|
self.v += delta * (sample - self.avg);
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Determine whether the sequence is empty.
|
/// Determine whether the samples are empty.
|
||||||
pub fn is_empty(&self) -> bool {
|
pub fn is_empty(&self) -> bool {
|
||||||
self.n == 0
|
self.n == 0
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Estimate the mean of the sequence.
|
/// Estimate the mean of the population.
|
||||||
pub fn mean(&self) -> f64 {
|
pub fn mean(&self) -> f64 {
|
||||||
self.avg
|
self.avg
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Return the number of elements in the sequence.
|
/// Return the number of samples.
|
||||||
pub fn len(&self) -> u64 {
|
pub fn len(&self) -> u64 {
|
||||||
self.n
|
self.n
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Calculate the unbiased sample variance of the sequence.
|
/// Calculate the sample variance.
|
||||||
///
|
///
|
||||||
/// This assumes that the sequence consists of samples of a larger population.
|
/// This is an unbiased estimator of the variance of the population.
|
||||||
pub fn sample_variance(&self) -> f64 {
|
pub fn sample_variance(&self) -> f64 {
|
||||||
if self.n < 2 {
|
if self.n < 2 {
|
||||||
return 0.;
|
return 0.;
|
||||||
@ -68,9 +73,9 @@ impl Average {
|
|||||||
self.v / f64::approx_from(self.n - 1).unwrap()
|
self.v / f64::approx_from(self.n - 1).unwrap()
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Calculate the population variance of the sequence.
|
/// Calculate the population variance of the sample.
|
||||||
///
|
///
|
||||||
/// This assumes that the sequence consists of the entire population.
|
/// This is a biased estimator of the variance of the population.
|
||||||
pub fn population_variance(&self) -> f64 {
|
pub fn population_variance(&self) -> f64 {
|
||||||
if self.n < 2 {
|
if self.n < 2 {
|
||||||
return 0.;
|
return 0.;
|
||||||
@ -78,7 +83,7 @@ impl Average {
|
|||||||
self.v / f64::approx_from(self.n).unwrap()
|
self.v / f64::approx_from(self.n).unwrap()
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Estimate the standard error of the mean of the sequence.
|
/// Estimate the standard error of the mean of the population.
|
||||||
pub fn error(&self) -> f64 {
|
pub fn error(&self) -> f64 {
|
||||||
if self.n == 0 {
|
if self.n == 0 {
|
||||||
return 0.;
|
return 0.;
|
||||||
@ -86,7 +91,10 @@ impl Average {
|
|||||||
(self.sample_variance() / f64::approx_from(self.n).unwrap()).sqrt()
|
(self.sample_variance() / f64::approx_from(self.n).unwrap()).sqrt()
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Merge the average of another sequence into this one.
|
/// Merge another sample into this one.
|
||||||
|
///
|
||||||
|
///
|
||||||
|
/// ## Example
|
||||||
///
|
///
|
||||||
/// ```
|
/// ```
|
||||||
/// use average::Average;
|
/// use average::Average;
|
||||||
|
25
src/lib.rs
25
src/lib.rs
@ -1,3 +1,28 @@
|
|||||||
|
//! This crate provides estimators for the weighted and unweighted average of a
|
||||||
|
//! sequence of numbers, and for their standard errors. The typical workflow
|
||||||
|
//! looks like this:
|
||||||
|
//!
|
||||||
|
//! 1. Initialize your estimator of choice (`Average`, `WeightedAverage` or
|
||||||
|
//! `WeightedAverage2`) with `new()`.
|
||||||
|
//! 2. Add some subset (called "samples") of the sequence of numbers (called
|
||||||
|
//! "population") for which you want to estimate the average, using `add()`
|
||||||
|
//! or `collect()`.
|
||||||
|
//! 3. Calculate the arithmetic mean with `mean()` and its standard error with
|
||||||
|
//! `error().
|
||||||
|
//!
|
||||||
|
//! You can run several estimators in parallel and merge them into one with
|
||||||
|
//! `merge()`.
|
||||||
|
//!
|
||||||
|
//! ## Example
|
||||||
|
//!
|
||||||
|
//! ```
|
||||||
|
//! use average::Average;
|
||||||
|
//!
|
||||||
|
//! let mut a: Average = (1..6).map(Into::into).collect();
|
||||||
|
//! a.add(42.);
|
||||||
|
//! println!("The average is {} ± {}.", a.mean(), a.error());
|
||||||
|
//! ```
|
||||||
|
|
||||||
#![no_std]
|
#![no_std]
|
||||||
|
|
||||||
extern crate conv;
|
extern crate conv;
|
||||||
|
@ -1,7 +1,20 @@
|
|||||||
use core;
|
use core;
|
||||||
|
|
||||||
/// Represent the weighted arithmetic mean and the weighted variance of a
|
/// Estimate the weighted arithmetic mean and the weighted variance of a
|
||||||
/// sequence of numbers.
|
/// sequence of numbers ("population").
|
||||||
|
///
|
||||||
|
/// This can be used to estimate the standard error of the weighted mean.
|
||||||
|
///
|
||||||
|
///
|
||||||
|
/// ## Example
|
||||||
|
///
|
||||||
|
/// ```
|
||||||
|
/// use average::WeightedAverage;
|
||||||
|
///
|
||||||
|
/// let a: WeightedAverage = (1..6).zip(1..6)
|
||||||
|
/// .map(|(x, w)| (f64::from(x), f64::from(w))).collect();
|
||||||
|
/// println!("The weighted average is {} ± {}.", a.mean(), a.error());
|
||||||
|
/// ```
|
||||||
#[derive(Debug, Clone)]
|
#[derive(Debug, Clone)]
|
||||||
pub struct WeightedAverage {
|
pub struct WeightedAverage {
|
||||||
/// Sum of the weights.
|
/// Sum of the weights.
|
||||||
@ -13,12 +26,12 @@ pub struct WeightedAverage {
|
|||||||
}
|
}
|
||||||
|
|
||||||
impl WeightedAverage {
|
impl WeightedAverage {
|
||||||
/// Create a new weighted average.
|
/// Create a new weighted average estimator.
|
||||||
pub fn new() -> WeightedAverage {
|
pub fn new() -> WeightedAverage {
|
||||||
WeightedAverage { weight_sum: 0., avg: 0., v: 0. }
|
WeightedAverage { weight_sum: 0., avg: 0., v: 0. }
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Add a sample to the weighted sequence of which the average is calculated.
|
/// Add a weighted element sampled from the population.
|
||||||
pub fn add(&mut self, sample: f64, weight: f64) {
|
pub fn add(&mut self, sample: f64, weight: f64) {
|
||||||
// This algorithm was suggested by West in 1979.
|
// This algorithm was suggested by West in 1979.
|
||||||
//
|
//
|
||||||
@ -32,7 +45,7 @@ impl WeightedAverage {
|
|||||||
self.v += weight * (sample - prev_avg) * (sample - self.avg);
|
self.v += weight * (sample - prev_avg) * (sample - self.avg);
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Determine whether the sequence is empty.
|
/// Determine whether the samples are empty.
|
||||||
pub fn is_empty(&self) -> bool {
|
pub fn is_empty(&self) -> bool {
|
||||||
self.weight_sum == 0. && self.v == 0. && self.avg == 0.
|
self.weight_sum == 0. && self.v == 0. && self.avg == 0.
|
||||||
}
|
}
|
||||||
@ -42,15 +55,14 @@ impl WeightedAverage {
|
|||||||
self.weight_sum
|
self.weight_sum
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Estimate the weighted mean of the sequence.
|
/// Estimate the weighted mean of the population.
|
||||||
pub fn mean(&self) -> f64 {
|
pub fn mean(&self) -> f64 {
|
||||||
self.avg
|
self.avg
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Calculate the population variance of the weighted sequence.
|
/// Calculate the weighted population variance of the sample.
|
||||||
///
|
///
|
||||||
/// This assumes that the sequence consists of the entire population and the
|
/// This is a biased estimator of the weighted variance of the population.
|
||||||
/// weights represent *frequency*.
|
|
||||||
pub fn population_variance(&self) -> f64 {
|
pub fn population_variance(&self) -> f64 {
|
||||||
if self.is_empty() {
|
if self.is_empty() {
|
||||||
0.
|
0.
|
||||||
@ -59,10 +71,9 @@ impl WeightedAverage {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Calculate the unbiased sample variance of the weighted sequence.
|
/// Calculate the weighted sample variance.
|
||||||
///
|
///
|
||||||
/// This assumes that the sequence consists of samples of a larger
|
/// This is an unbiased estimator of the weighted variance of the population.
|
||||||
/// population and the weights represent *frequency*.
|
|
||||||
///
|
///
|
||||||
/// Note that this will return 0 if the sum of the weights is <= 1.
|
/// Note that this will return 0 if the sum of the weights is <= 1.
|
||||||
pub fn sample_variance(&self) -> f64 {
|
pub fn sample_variance(&self) -> f64 {
|
||||||
@ -73,10 +84,10 @@ impl WeightedAverage {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Estimate the standard error of the weighted mean of the sequence.
|
/// Estimate the standard error of the weighted mean of the population.
|
||||||
///
|
///
|
||||||
/// Note that this will return 0 if the sum of the weights is 0.
|
/// Note that this will return 0 if the sum of the weights is 0.
|
||||||
/// For this estimator the sum of weights should be larger than 1.
|
/// For this estimator, the sum of weights should be larger than 1.
|
||||||
///
|
///
|
||||||
/// This biased estimator uses the weighted variance and the sum of weights.
|
/// This biased estimator uses the weighted variance and the sum of weights.
|
||||||
/// It considers the weights as (noninteger) counts of how often the sample
|
/// It considers the weights as (noninteger) counts of how often the sample
|
||||||
@ -97,7 +108,10 @@ impl WeightedAverage {
|
|||||||
(variance / self.weight_sum).sqrt()
|
(variance / self.weight_sum).sqrt()
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Merge the weighted average of another sequence into this one.
|
/// Merge another sample into this one.
|
||||||
|
///
|
||||||
|
///
|
||||||
|
/// ## Example
|
||||||
///
|
///
|
||||||
/// ```
|
/// ```
|
||||||
/// use average::WeightedAverage;
|
/// use average::WeightedAverage;
|
||||||
|
@ -2,27 +2,40 @@ use core;
|
|||||||
|
|
||||||
use conv::ApproxFrom;
|
use conv::ApproxFrom;
|
||||||
|
|
||||||
/// Represent the weighted and unweighted arithmetic mean and the unweighted
|
/// Estimate the weighted and unweighted arithmetic mean and the unweighted
|
||||||
/// variance of a sequence of numbers.
|
/// variance of a sequence of numbers ("population").
|
||||||
|
///
|
||||||
|
/// This can be used to estimate the standard error of the weighted mean.
|
||||||
|
///
|
||||||
|
///
|
||||||
|
/// ## Example
|
||||||
|
///
|
||||||
|
/// ```
|
||||||
|
/// use average::WeightedAverage2 as WeightedAverage;
|
||||||
|
///
|
||||||
|
/// let a: WeightedAverage = (1..6).zip(1..6)
|
||||||
|
/// .map(|(x, w)| (f64::from(x), f64::from(w))).collect();
|
||||||
|
/// println!("The weighted average is {} ± {}.", a.weighted_mean(), a.error());
|
||||||
|
/// ```
|
||||||
#[derive(Debug, Clone)]
|
#[derive(Debug, Clone)]
|
||||||
pub struct WeightedAverage {
|
pub struct WeightedAverage {
|
||||||
/// Sum of the weights.
|
/// Sum of the weights.
|
||||||
weight_sum: f64,
|
weight_sum: f64,
|
||||||
/// Sum of the squares of the weights.
|
/// Sum of the squares of the weights.
|
||||||
weight_sum_sq: f64,
|
weight_sum_sq: f64,
|
||||||
/// Weighted verage value.
|
/// Weighted average value.
|
||||||
weighted_avg: f64,
|
weighted_avg: f64,
|
||||||
|
|
||||||
/// Number of samples.
|
/// Number of samples.
|
||||||
n: u64,
|
n: u64,
|
||||||
/// Unweighted verage value.
|
/// Unweighted average value.
|
||||||
unweighted_avg: f64,
|
unweighted_avg: f64,
|
||||||
/// Intermediate sum of squares for calculating the *unweighted* variance.
|
/// Intermediate sum of squares for calculating the *unweighted* variance.
|
||||||
v: f64,
|
v: f64,
|
||||||
}
|
}
|
||||||
|
|
||||||
impl WeightedAverage {
|
impl WeightedAverage {
|
||||||
/// Create a new weighted average.
|
/// Create a new weighted and unweighted average estimator.
|
||||||
pub fn new() -> WeightedAverage {
|
pub fn new() -> WeightedAverage {
|
||||||
WeightedAverage {
|
WeightedAverage {
|
||||||
weight_sum: 0., weight_sum_sq: 0., weighted_avg: 0.,
|
weight_sum: 0., weight_sum_sq: 0., weighted_avg: 0.,
|
||||||
@ -30,7 +43,7 @@ impl WeightedAverage {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Add a sample to the weighted sequence of which the average is calculated.
|
/// Add a weighted element sampled from the population.
|
||||||
pub fn add(&mut self, sample: f64, weight: f64) {
|
pub fn add(&mut self, sample: f64, weight: f64) {
|
||||||
// The algorithm for the unweighted average was suggested by Welford in 1962.
|
// The algorithm for the unweighted average was suggested by Welford in 1962.
|
||||||
// The algorithm for the weighted average was suggested by West in 1979.
|
// The algorithm for the weighted average was suggested by West in 1979.
|
||||||
@ -51,7 +64,7 @@ impl WeightedAverage {
|
|||||||
self.v += delta * (sample - self.unweighted_avg);
|
self.v += delta * (sample - self.unweighted_avg);
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Determine whether the sequence is empty.
|
/// Determine whether the sample is empty.
|
||||||
pub fn is_empty(&self) -> bool {
|
pub fn is_empty(&self) -> bool {
|
||||||
self.n == 0
|
self.n == 0
|
||||||
}
|
}
|
||||||
@ -89,9 +102,9 @@ impl WeightedAverage {
|
|||||||
self.weight_sum * self.weight_sum / self.weight_sum_sq
|
self.weight_sum * self.weight_sum / self.weight_sum_sq
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Calculate the *unweighted* population variance of the sequence.
|
/// Calculate the *unweighted* population variance of the sample.
|
||||||
///
|
///
|
||||||
/// This assumes that the sequence consists of the entire population.
|
/// This is a biased estimator of the variance of the population.
|
||||||
pub fn population_variance(&self) -> f64 {
|
pub fn population_variance(&self) -> f64 {
|
||||||
if self.n < 2 {
|
if self.n < 2 {
|
||||||
return 0.;
|
return 0.;
|
||||||
@ -99,9 +112,9 @@ impl WeightedAverage {
|
|||||||
self.v / f64::approx_from(self.n).unwrap()
|
self.v / f64::approx_from(self.n).unwrap()
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Calculate the *unweighted*, unbiased sample variance of the sequence.
|
/// Calculate the *unweighted* sample variance.
|
||||||
///
|
///
|
||||||
/// This assumes that the sequence consists of samples of a larger population.
|
/// This is an unbiased estimator of the variance of the population.
|
||||||
pub fn sample_variance(&self) -> f64 {
|
pub fn sample_variance(&self) -> f64 {
|
||||||
if self.n < 2 {
|
if self.n < 2 {
|
||||||
return 0.;
|
return 0.;
|
||||||
@ -109,7 +122,7 @@ impl WeightedAverage {
|
|||||||
self.v / f64::approx_from(self.n - 1).unwrap()
|
self.v / f64::approx_from(self.n - 1).unwrap()
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Estimate the standard error of the weighted mean of the sequence.
|
/// Estimate the standard error of the *weighted* mean of the sequence.
|
||||||
///
|
///
|
||||||
/// Returns 0 if the sum of weights is 0.
|
/// Returns 0 if the sum of weights is 0.
|
||||||
///
|
///
|
||||||
@ -126,14 +139,17 @@ impl WeightedAverage {
|
|||||||
(self.sample_variance() / effective_base).sqrt()
|
(self.sample_variance() / effective_base).sqrt()
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Merge the weighted average of another sequence into this one.
|
/// Merge another sample into this one.
|
||||||
|
///
|
||||||
|
///
|
||||||
|
/// ## Example
|
||||||
///
|
///
|
||||||
/// ```
|
/// ```
|
||||||
/// use average::WeightedAverage2 as WeightedAverage;
|
/// use average::WeightedAverage2 as WeightedAverage;
|
||||||
///
|
///
|
||||||
/// let weighted_sequence: &[(f64, f64)] = &[
|
/// let weighted_sequence: &[(f64, f64)] = &[
|
||||||
/// (1., 0.1), (2., 0.2), (3., 0.3), (4., 0.4), (5., 0.5),
|
/// (1., 0.1), (2., 0.2), (3., 0.3), (4., 0.4), (5., 0.5),
|
||||||
/// (6., 0.6), (7., 0.7), (8., 0.8), (9., 0.)];
|
/// (6., 0.6), (7., 0.7), (8., 0.8), (9., 0.9)];
|
||||||
/// let (left, right) = weighted_sequence.split_at(3);
|
/// let (left, right) = weighted_sequence.split_at(3);
|
||||||
/// let avg_total: WeightedAverage = weighted_sequence.iter().map(|&x| x).collect();
|
/// let avg_total: WeightedAverage = weighted_sequence.iter().map(|&x| x).collect();
|
||||||
/// let mut avg_left: WeightedAverage = left.iter().map(|&x| x).collect();
|
/// let mut avg_left: WeightedAverage = left.iter().map(|&x| x).collect();
|
||||||
|
Loading…
Reference in New Issue
Block a user