bingomanatee · February 18, 2014 18:23
diff --git a/smoothSeries_nor.js b/smoothSeries_nor.js
 (function (window) {

    var ss = function () {

 // # simple-statistics
 //
 // A simple, literate statistics system. The code below uses the
 // [Javascript module pattern](http://www.adequatelygood.com/2010/3/JavaScript-Module-Pattern-In-Depth),
 // eventually assigning `simple-statistics` to `ss` in browsers or the
 // `exports object for node.js
        var ss = {};

        // # [Linear Regression](http://en.wikipedia.org/wiki/Linear_regression)
        //
        // [Simple linear regression](http://en.wikipedia.org/wiki/Simple_linear_regression)
        // is a simple way to find a fitted line
        // between a set of coordinates.
        function linear_regression() {
            var linreg = {},
                data = [];

            // Assign data to the model. Data is assumed to be an array.
            linreg.data = function (x) {
                if (!arguments.length) {
                    return data;
                }
                data = x.slice();
                return linreg;
            };

            // Calculate the slope and y-intercept of the regression line
            // by calculating the least sum of squares
            linreg.mb = function () {
                var m, b;

                // Store data length in a local variable to reduce
                // repeated object property lookups
                var data_length = data.length;

                //if there's only one point, arbitrarily choose a slope of 0
                //and a y-intercept of whatever the y of the initial point is
                if (data_length === 1) {
                    m = 0;
                    b = data[0][1];
                } else {
                    // Initialize our sums and scope the `m` and `b`
                    // variables that define the line.
                    var sum_x = 0, sum_y = 0,
                        sum_xx = 0, sum_xy = 0;

                    // Use local variables to grab point values
                    // with minimal object property lookups
                    var point, x, y;

                    // Gather the sum of all x values, the sum of all
                    // y values, and the sum of x^2 and (x*y) for each
                    // value.
                    //
                    // In math notation, these would be SS_x, SS_y, SS_xx, and SS_xy
                    for (var i = 0; i < data_length; i++) {
                        point = data[i];
                        x = point[0];
                        y = point[1];

                        sum_x += x;
                        sum_y += y;

                        sum_xx += x * x;
                        sum_xy += x * y;
                    }

                    // `m` is the slope of the regression line
                    m = ((data_length * sum_xy) - (sum_x * sum_y)) /
                        ((data_length * sum_xx) - (sum_x * sum_x));

                    // `b` is the y-intercept of the line.
                    b = (sum_y / data_length) - ((m * sum_x) / data_length);
                }

                // Return both values as an object.
                return { m: m, b: b };
            };

            // a shortcut for simply getting the slope of the regression line
            linreg.m = function () {
                return linreg.mb().m;
            };

            // a shortcut for simply getting the y-intercept of the regression
            // line.
            linreg.b = function () {
                return linreg.mb().b;
            };

            // ## Fitting The Regression Line
            //
            // This is called after `.data()` and returns the
            // equation `y = f(x)` which gives the position
            // of the regression line at each point in `x`.
            linreg.line = function () {

                // Get the slope, `m`, and y-intercept, `b`, of the line.
                var mb = linreg.mb(),
                    m = mb.m,
                    b = mb.b;

                // Return a function that computes a `y` value for each
                // x value it is given, based on the values of `b` and `a`
                // that we just computed.
                return function (x) {
                    return b + (m * x);
                };
            };

            return linreg;
        }

        // # [R Squared](http://en.wikipedia.org/wiki/Coefficient_of_determination)
        //
        // The r-squared value of data compared with a function `f`
        // is the sum of the squared differences between the prediction
        // and the actual value.
        function r_squared(data, f) {
            if (data.length < 2) {
                return 1;
            }

            // Compute the average y value for the actual
            // data set in order to compute the
            // _total sum of squares_
            var sum = 0, average;
            for (var i = 0; i < data.length; i++) {
                sum += data[i][1];
            }
            average = sum / data.length;

            // Compute the total sum of squares - the
            // squared difference between each point
            // and the average of all points.
            var sum_of_squares = 0;
            for (var j = 0; j < data.length; j++) {
                sum_of_squares += Math.pow(average - data[j][1], 2);
            }

            // Finally estimate the error: the squared
            // difference between the estimate and the actual data
            // value at each point.
            var err = 0;
            for (var k = 0; k < data.length; k++) {
                err += Math.pow(data[k][1] - f(data[k][0]), 2);
            }

            // As the error grows larger, it's ratio to the
            // sum of squares increases and the r squared
            // value grows lower.
            return 1 - (err / sum_of_squares);
        }

        // # [Bayesian Classifier](http://en.wikipedia.org/wiki/Naive_Bayes_classifier)
        //
        // This is a naïve bayesian classifier that takes
        // singly-nested objects.
        function bayesian() {
            // The `bayes_model` object is what will be exposed
            // by this closure, with all of its extended methods, and will
            // have access to all scope variables, like `total_count`.
            var bayes_model = {},
            // The number of items that are currently
            // classified in the model
                total_count = 0,
            // Every item classified in the model
                data = {};

            // ## Train
            // Train the classifier with a new item, which has a single
            // dimension of Javascript literal keys and values.
            bayes_model.train = function (item, category) {
                // If the data object doesn't have any values
                // for this category, create a new object for it.
                if (!data[category]) {
                    data[category] = {};
                }

                // Iterate through each key in the item.
                for (var k in item) {
                    var v = item[k];
                    // Initialize the nested object `data[category][k][item[k]]`
                    // with an object of keys that equal 0.
                    if (data[category][k] === undefined) {
                        data[category][k] = {};
                    }
                    if (data[category][k][v] === undefined) {
                        data[category][k][v] = 0;
                    }

                    // And increment the key for this key/value combination.
                    data[category][k][item[k]]++;
                }
                // Increment the number of items classified
                total_count++;
            };

            // ## Score
            // Generate a score of how well this item matches all
            // possible categories based on its attributes
            bayes_model.score = function (item) {
                // Initialize an empty array of odds per category.
                var odds = {}, category;
                // Iterate through each key in the item,
                // then iterate through each category that has been used
                // in previous calls to `.train()`
                for (var k in item) {
                    var v = item[k];
                    for (category in data) {
                        // Create an empty object for storing key - value combinations
                        // for this category.
                        if (odds[category] === undefined) {
                            odds[category] = {};
                        }

                        // If this item doesn't even have a property, it counts for nothing,
                        // but if it does have the property that we're looking for from
                        // the item to categorize, it counts based on how popular it is
                        // versus the whole population.
                        if (data[category][k]) {
                            odds[category][k + '_' + v] = (data[category][k][v] || 0) / total_count;
                        } else {
                            odds[category][k + '_' + v] = 0;
                        }
                    }
                }

                // Set up a new object that will contain sums of these odds by category
                var odds_sums = {};

                for (category in odds) {
                    // Tally all of the odds for each category-combination pair -
                    // the non-existence of a category does not add anything to the
                    // score.
                    for (var combination in odds[category]) {
                        if (odds_sums[category] === undefined) {
                            odds_sums[category] = 0;
                        }
                        odds_sums[category] += odds[category][combination];
                    }
                }

                return odds_sums;
            };

            // Return the completed model.
            return bayes_model;
        }

        // # sum
        //
        // is simply the result of adding all numbers
        // together, starting from zero.
        //
        // This runs on `O(n)`, linear time in respect to the array
        function sum(x) {
            var value = 0;
            for (var i = 0; i < x.length; i++) {
                value += x[i];
            }
            return value;
        }

        // # mean
        //
        // is the sum over the number of values
        //
        // This runs on `O(n)`, linear time in respect to the array
        function mean(x) {
            // The mean of no numbers is null
            if (x.length === 0) {
                return null;
            }

            return sum(x) / x.length;
        }

        // # geometric mean
        //
        // a mean function that is more useful for numbers in different
        // ranges.
        //
        // this is the nth root of the input numbers multipled by each other
        //
        // This runs on `O(n)`, linear time in respect to the array
        function geometric_mean(x) {
            // The mean of no numbers is null
            if (x.length === 0) {
                return null;
            }

            // the starting value.
            var value = 1;

            for (var i = 0; i < x.length; i++) {
                // the geometric mean is only valid for positive numbers
                if (x[i] <= 0) {
                    return null;
                }

                // repeatedly multiply the value by each number
                value *= x[i];
            }

            return Math.pow(value, 1 / x.length);
        }

        // # min
        //
        // This is simply the minimum number in the set.
        //
        // This runs on `O(n)`, linear time in respect to the array
        function min(x) {
            var value;
            for (var i = 0; i < x.length; i++) {
                // On the first iteration of this loop, min is
                // undefined and is thus made the minimum element in the array
                if (x[i] < value || value === undefined) {
                    value = x[i];
                }
            }
            return value;
        }

        // # max
        //
        // This is simply the maximum number in the set.
        //
        // This runs on `O(n)`, linear time in respect to the array
        function max(x) {
            var value;
            for (var i = 0; i < x.length; i++) {
                // On the first iteration of this loop, max is
                // undefined and is thus made the maximum element in the array
                if (x[i] > value || value === undefined) {
                    value = x[i];
                }
            }
            return value;
        }

        // # [variance](http://en.wikipedia.org/wiki/Variance)
        //
        // is the sum of squared deviations from the mean
        //
        // depends on `mean()`
        function variance(x) {
            // The variance of no numbers is null
            if (x.length === 0) {
                return null;
            }

            var mean_value = mean(x),
                deviations = [];

            // Make a list of squared deviations from the mean.
            for (var i = 0; i < x.length; i++) {
                deviations.push(Math.pow(x[i] - mean_value, 2));
            }

            // Find the mean value of that list
            return mean(deviations);
        }

        // # [standard deviation](http://en.wikipedia.org/wiki/Standard_deviation)
        //
        // is just the square root of the variance.
        //
        // depends on `variance()`
        function standard_deviation(x) {
            // The standard deviation of no numbers is null
            if (x.length === 0) {
                return null;
            }

            return Math.sqrt(variance(x));
        }

        // The sum of deviations to the Nth power.
        // When n=2 it's the sum of squared deviations.
        // When n=3 it's the sum of cubed deviations.
        //
        // depends on `mean()`
        function sum_nth_power_deviations(x, n) {
            var mean_value = mean(x),
                sum = 0;

            for (var i = 0; i < x.length; i++) {
                sum += Math.pow(x[i] - mean_value, n);
            }

            return sum;
        }

        // # [variance](http://en.wikipedia.org/wiki/Variance)
        //
        // is the sum of squared deviations from the mean
        //
        // depends on `sum_nth_power_deviations`
        function sample_variance(x) {
            // The variance of no numbers is null
            if (x.length <= 1) {
                return null;
            }

            var sum_squared_deviations_value = sum_nth_power_deviations(x, 2);

            // Find the mean value of that list
            return sum_squared_deviations_value / (x.length - 1);
        }

        // # [standard deviation](http://en.wikipedia.org/wiki/Standard_deviation)
        //
        // is just the square root of the variance.
        //
        // depends on `sample_variance()`
        function sample_standard_deviation(x) {
            // The standard deviation of no numbers is null
            if (x.length <= 1) {
                return null;
            }

            return Math.sqrt(sample_variance(x));
        }

        // # [covariance](http://en.wikipedia.org/wiki/Covariance)
        //
        // sample covariance of two datasets:
        // how much do the two datasets move together?
        // x and y are two datasets, represented as arrays of numbers.
        //
        // depends on `mean()`
        function sample_covariance(x, y) {

            // The two datasets must have the same length which must be more than 1
            if (x.length <= 1 || x.length != y.length) {
                return null;
            }

            // determine the mean of each dataset so that we can judge each
            // value of the dataset fairly as the difference from the mean. this
            // way, if one dataset is [1, 2, 3] and [2, 3, 4], their covariance
            // does not suffer because of the difference in absolute values
            var xmean = mean(x),
                ymean = mean(y),
                sum = 0;

            // for each pair of values, the covariance increases when their
            // difference from the mean is associated - if both are well above
            // or if both are well below
            // the mean, the covariance increases significantly.
            for (var i = 0; i < x.length; i++) {
                sum += (x[i] - xmean) * (y[i] - ymean);
            }

            // the covariance is weighted by the length of the datasets.
            return sum / (x.length - 1);
        }

        // # [correlation](http://en.wikipedia.org/wiki/Correlation_and_dependence)
        //
        // Gets a measure of how correlated two datasets are, between -1 and 1
        //
        // depends on `sample_standard_deviation()` and `sample_covariance()`
        function sample_correlation(x, y) {
            var cov = sample_covariance(x, y),
                xstd = sample_standard_deviation(x),
                ystd = sample_standard_deviation(y);

            if (cov === null || xstd === null || ystd === null) {
                return null;
            }

            return cov / xstd / ystd;
        }

        // # [median](http://en.wikipedia.org/wiki/Median)
        //
        // The middle number of a list. This is often a good indicator of 'the middle'
        // when there are outliers that skew the `mean()` value.
        function median(x) {
            // The median of an empty list is null
            if (x.length === 0) {
                return null;
            }

            // Sorting the array makes it easy to find the center, but
            // use `.slice()` to ensure the original array `x` is not modified
            var sorted = x.slice().sort(function (a, b) {
                return a - b;
            });

            // If the length of the list is odd, it's the central number
            if (sorted.length % 2 === 1) {
                return sorted[(sorted.length - 1) / 2];
                // Otherwise, the median is the average of the two numbers
                // at the center of the list
            } else {
                var a = sorted[(sorted.length / 2) - 1];
                var b = sorted[(sorted.length / 2)];
                return (a + b) / 2;
            }
        }

        // # [mode](http://bit.ly/W5K4Yt)
        // This implementation is inspired by [science.js](https://github.com/jasondavies/science.js/blob/master/src/stats/mode.js)
        function mode(x) {

            // Handle edge cases:
            // The median of an empty list is null
            if (x.length === 0) {
                return null;
            }
            else if (x.length === 1) {
                return x[0];
            }

            // Sorting the array lets us iterate through it below and be sure
            // that every time we see a new number it's new and we'll never
            // see the same number twice
            var sorted = x.slice().sort(function (a, b) {
                return a - b;
            });

            // This assumes it is dealing with an array of size > 1, since size
            // 0 and 1 are handled immediately. Hence it starts at index 1 in the
            // array.
            var last = sorted[0],
            // store the mode as we find new modes
                value,
            // store how many times we've seen the mode
                max_seen = 0,
            // how many times the current candidate for the mode
            // has been seen
                seen_this = 1;

            // end at sorted.length + 1 to fix the case in which the mode is
            // the highest number that occurs in the sequence. the last iteration
            // compares sorted[i], which is undefined, to the highest number
            // in the series
            for (var i = 1; i < sorted.length + 1; i++) {
                // we're seeing a new number pass by
                if (sorted[i] !== last) {
                    // the last number is the new mode since we saw it more
                    // often than the old one
                    if (seen_this > max_seen) {
                        max_seen = seen_this;
                        seen_this = 1;
                        value = last;
                    }
                    last = sorted[i];
                    // if this isn't a new number, it's one more occurrence of
                    // the potential mode
                } else {
                    seen_this++;
                }
            }
            return value;
        }

        // # [t-test](http://en.wikipedia.org/wiki/Student's_t-test)
        //
        // This is to compute a one-sample t-test, comparing the mean
        // of a sample to a known value, x.
        //
        // in this case, we're trying to determine whether the
        // population mean is equal to the value that we know, which is `x`
        // here. usually the results here are used to look up a
        // [p-value](http://en.wikipedia.org/wiki/P-value), which, for
        // a certain level of significance, will let you determine that the
        // null hypothesis can or cannot be rejected.
        //
        // Depends on `standard_deviation()` and `mean()`
        function t_test(sample, x) {
            // The mean of the sample
            var sample_mean = mean(sample);

            // The standard deviation of the sample
            var sd = standard_deviation(sample);

            // Square root the length of the sample
            var rootN = Math.sqrt(sample.length);

            // Compute the known value against the sample,
            // returning the t value
            return (sample_mean - x) / (sd / rootN);
        }

        // # [2-sample t-test](http://en.wikipedia.org/wiki/Student's_t-test)
        //
        // This is to compute two sample t-test.
        // Tests whether "mean(X)-mean(Y) = difference", (
        // in the most common case, we often have `difference == 0` to test if two samples
        // are likely to be taken from populations with the same mean value) with
        // no prior knowledge on stdandard deviations of both samples
        // other than the fact that they have the same standard deviation.
        //
        // Usually the results here are used to look up a
        // [p-value](http://en.wikipedia.org/wiki/P-value), which, for
        // a certain level of significance, will let you determine that the
        // null hypothesis can or cannot be rejected.
        //
        // `diff` can be omitted if it equals 0.
        //
        // [This is used to confirm or deny](http://www.monarchlab.org/Lab/Research/Stats/2SampleT.aspx)
        // a null hypothesis that the two populations that have been sampled into
        // `sample_x` and `sample_y` are equal to each other.
        //
        // Depends on `sample_variance()` and `mean()`
        function t_test_two_sample(sample_x, sample_y, difference) {
            var n = sample_x.length,
                m = sample_y.length;

            // If either sample doesn't actually have any values, we can't
            // compute this at all, so we return `null`.
            if (!n || !m) {
                return null;
            }

            // default difference (mu) is zero
            if (!difference) {
                difference = 0;
            }

            var meanX = mean(sample_x),
                meanY = mean(sample_y);

            var weightedVariance = ((n - 1) * sample_variance(sample_x) +
                (m - 1) * sample_variance(sample_y)) / (n + m - 2);

            return (meanX - meanY - difference) /
                Math.sqrt(weightedVariance * (1 / n + 1 / m));
        }

        // # quantile
        // This is a population quantile, since we assume to know the entire
        // dataset in this library. Thus I'm trying to follow the
        // [Quantiles of a Population](http://en.wikipedia.org/wiki/Quantile#Quantiles_of_a_population)
        // algorithm from wikipedia.
        //
        // Sample is a one-dimensional array of numbers,
        // and p is either a decimal number from 0 to 1 or an array of decimal
        // numbers from 0 to 1.
        // In terms of a k/q quantile, p = k/q - it's just dealing with fractions or dealing
        // with decimal values.
        // When p is an array, the result of the function is also an array containing the appropriate
        // quantiles in input order
        function quantile(sample, p) {

            // We can't derive quantiles from an empty list
            if (sample.length === 0) {
                return null;
            }

            // Sort a copy of the array. We'll need a sorted array to index
            // the values in sorted order.
            var sorted = sample.slice().sort(function (a, b) {
                return a - b;
            });

            if (p.length) {
                // Initialize the result array
                var results = [];
                // For each requested quantile
                for (var i = 0; i < p.length; i++) {
                    results[i] = quantile_sorted(sorted, p[i]);
                }
                return results;
            } else {
                return quantile_sorted(sorted, p);
            }
        }

        function quantile_sorted(sample, p) {
            var idx = (sample.length) * p;
            if (p < 0 || p > 1) {
                return null;
            } else if (p === 1) {
                // If p is 1, directly return the last element
                return sample[sample.length - 1];
            } else if (p === 0) {
                // If p is 0, directly return the first element
                return sample[0];
            } else if (idx % 1 !== 0) {
                // If p is not integer, return the next element in array
                return sample[Math.ceil(idx) - 1];
            } else if (sample.length % 2 === 0) {
                // If the list has even-length, we'll take the average of this number
                // and the next value, if there is one
                return (sample[idx - 1] + sample[idx]) / 2;
            } else {
                // Finally, in the simple case of an integer value
                // with an odd-length list, return the sample value at the index.
                return sample[idx];
            }
        }

        // # [Interquartile range](http://en.wikipedia.org/wiki/Interquartile_range)
        //
        // A measure of statistical dispersion, or how scattered, spread, or
        // concentrated a distribution is. It's computed as the difference betwen
        // the third quartile and first quartile.
        function iqr(sample) {
            // We can't derive quantiles from an empty list
            if (sample.length === 0) {
                return null;
            }

            // Interquartile range is the span between the upper quartile,
            // at `0.75`, and lower quartile, `0.25`
            return quantile(sample, 0.75) - quantile(sample, 0.25);
        }

        // # [Median Absolute Deviation](http://en.wikipedia.org/wiki/Median_absolute_deviation)
        //
        // The Median Absolute Deviation (MAD) is a robust measure of statistical
        // dispersion. It is more resilient to outliers than the standard deviation.
        function mad(x) {
            // The mad of nothing is null
            if (!x || x.length === 0) {
                return null;
            }

            var median_value = median(x),
                median_absolute_deviations = [];

            // Make a list of absolute deviations from the median
            for (var i = 0; i < x.length; i++) {
                median_absolute_deviations.push(Math.abs(x[i] - median_value));
            }

            // Find the median value of that list
            return median(median_absolute_deviations);
        }

        // ## Compute Matrices for Jenks
        //
        // Compute the matrices required for Jenks breaks. These matrices
        // can be used for any classing of data with `classes <= n_classes`
        function jenksMatrices(data, n_classes) {

            // in the original implementation, these matrices are referred to
            // as `LC` and `OP`
            //
            // * lower_class_limits (LC): optimal lower class limits
            // * variance_combinations (OP): optimal variance combinations for all classes
            var lower_class_limits = [],
                variance_combinations = [],
            // loop counters
                i, j,
            // the variance, as computed at each step in the calculation
                variance = 0;

            // Initialize and fill each matrix with zeroes
            for (i = 0; i < data.length + 1; i++) {
                var tmp1 = [], tmp2 = [];
                // despite these arrays having the same values, we need
                // to keep them separate so that changing one does not change
                // the other
                for (j = 0; j < n_classes + 1; j++) {
                    tmp1.push(0);
                    tmp2.push(0);
                }
                lower_class_limits.push(tmp1);
                variance_combinations.push(tmp2);
            }

            for (i = 1; i < n_classes + 1; i++) {
                lower_class_limits[1][i] = 1;
                variance_combinations[1][i] = 0;
                // in the original implementation, 9999999 is used but
                // since Javascript has `Infinity`, we use that.
                for (j = 2; j < data.length + 1; j++) {
                    variance_combinations[j][i] = Infinity;
                }
            }

            for (var l = 2; l < data.length + 1; l++) {

                // `SZ` originally. this is the sum of the values seen thus
                // far when calculating variance.
                var sum = 0,
                // `ZSQ` originally. the sum of squares of values seen
                // thus far
                    sum_squares = 0,
                // `WT` originally. This is the number of
                    w = 0,
                // `IV` originally
                    i4 = 0;

                // in several instances, you could say `Math.pow(x, 2)`
                // instead of `x * x`, but this is slower in some browsers
                // introduces an unnecessary concept.
                for (var m = 1; m < l + 1; m++) {

                    // `III` originally
                    var lower_class_limit = l - m + 1,
                        val = data[lower_class_limit - 1];

                    // here we're estimating variance for each potential classing
                    // of the data, for each potential number of classes. `w`
                    // is the number of data points considered so far.
                    w++;

                    // increase the current sum and sum-of-squares
                    sum += val;
                    sum_squares += val * val;

                    // the variance at this point in the sequence is the difference
                    // between the sum of squares and the total x 2, over the number
                    // of samples.
                    variance = sum_squares - (sum * sum) / w;

                    i4 = lower_class_limit - 1;

                    if (i4 !== 0) {
                        for (j = 2; j < n_classes + 1; j++) {
                            // if adding this element to an existing class
                            // will increase its variance beyond the limit, break
                            // the class at this point, setting the `lower_class_limit`
                            // at this point.
                            if (variance_combinations[l][j] >=
                                (variance + variance_combinations[i4][j - 1])) {
                                lower_class_limits[l][j] = lower_class_limit;
                                variance_combinations[l][j] = variance +
                                    variance_combinations[i4][j - 1];
                            }
                        }
                    }
                }

                lower_class_limits[l][1] = 1;
                variance_combinations[l][1] = variance;
            }

            // return the two matrices. for just providing breaks, only
            // `lower_class_limits` is needed, but variances can be useful to
            // evaluage goodness of fit.
            return {
                lower_class_limits:    lower_class_limits,
                variance_combinations: variance_combinations
            };
        }

        // ## Pull Breaks Values for Jenks
        //
        // the second part of the jenks recipe: take the calculated matrices
        // and derive an array of n breaks.
        function jenksBreaks(data, lower_class_limits, n_classes) {

            var k = data.length - 1,
                kclass = [],
                countNum = n_classes;

            // the calculation of classes will never include the upper and
            // lower bounds, so we need to explicitly set them
            kclass[n_classes] = data[data.length - 1];
            kclass[0] = data[0];

            // the lower_class_limits matrix is used as indexes into itself
            // here: the `k` variable is reused in each iteration.
            while (countNum > 1) {
                kclass[countNum - 1] = data[lower_class_limits[k][countNum] - 2];
                k = lower_class_limits[k][countNum] - 1;
                countNum--;
            }

            return kclass;
        }

        // # [Jenks natural breaks optimization](http://en.wikipedia.org/wiki/Jenks_natural_breaks_optimization)
        //
        // Implementations: [1](http://danieljlewis.org/files/2010/06/Jenks.pdf) (python),
        // [2](https://github.com/vvoovv/djeo-jenks/blob/master/main.js) (buggy),
        // [3](https://github.com/simogeo/geostats/blob/master/lib/geostats.js#L407) (works)
        //
        // Depends on `jenksBreaks()` and `jenksMatrices()`
        function jenks(data, n_classes) {

            if (n_classes > data.length) {
                return null;
            }

            // sort data in numerical order, since this is expected
            // by the matrices function
            data = data.slice().sort(function (a, b) {
                return a - b;
            });

            // get our basic matrices
            var matrices = jenksMatrices(data, n_classes),
            // we only need lower class limits here
                lower_class_limits = matrices.lower_class_limits;

            // extract n_classes out of the computed matrices
            return jenksBreaks(data, lower_class_limits, n_classes);

        }

        // # [Skewness](http://en.wikipedia.org/wiki/Skewness)
        //
        // A measure of the extent to which a probability distribution of a
        // real-valued random variable "leans" to one side of the mean.
        // The skewness value can be positive or negative, or even undefined.
        //
        // Implementation is based on the adjusted Fisher-Pearson standardized
        // moment coefficient, which is the version found in Excel and several
        // statistical packages including Minitab, SAS and SPSS.
        //
        // Depends on `sum_nth_power_deviations()` and `sample_standard_deviation`
        function sample_skewness(x) {
            // The skewness of less than three arguments is null
            if (x.length < 3) {
                return null;
            }

            var n = x.length,
                cubed_s = Math.pow(sample_standard_deviation(x), 3),
                sum_cubed_deviations = sum_nth_power_deviations(x, 3);

            return n * sum_cubed_deviations / ((n - 1) * (n - 2) * cubed_s);
        }

        // # Standard Normal Table
        // A standard normal table, also called the unit normal table or Z table,
        // is a mathematical table for the values of Φ (phi), which are the values of
        // the cumulative distribution function of the normal distribution.
        // It is used to find the probability that a statistic is observed below,
        // above, or between values on the standard normal distribution, and by
        // extension, any normal distribution.
        //
        // The probabilities are taken from http://en.wikipedia.org/wiki/Standard_normal_table
        // The table used is the cumulative, and not cumulative from 0 to mean
        // (even though the latter has 5 digits precision, instead of 4).
        var standard_normal_table = [
            /*  z      0.00    0.01    0.02    0.03    0.04    0.05    0.06    0.07    0.08    0.09 */
            /* 0.0 */ 0.5000, 0.5040, 0.5080, 0.5120, 0.5160, 0.5199, 0.5239, 0.5279, 0.5319, 0.5359,
            /* 0.1 */ 0.5398, 0.5438, 0.5478, 0.5517, 0.5557, 0.5596, 0.5636, 0.5675, 0.5714, 0.5753,
            /* 0.2 */ 0.5793, 0.5832, 0.5871, 0.5910, 0.5948, 0.5987, 0.6026, 0.6064, 0.6103, 0.6141,
            /* 0.3 */ 0.6179, 0.6217, 0.6255, 0.6293, 0.6331, 0.6368, 0.6406, 0.6443, 0.6480, 0.6517,
            /* 0.4 */ 0.6554, 0.6591, 0.6628, 0.6664, 0.6700, 0.6736, 0.6772, 0.6808, 0.6844, 0.6879,
            /* 0.5 */ 0.6915, 0.6950, 0.6985, 0.7019, 0.7054, 0.7088, 0.7123, 0.7157, 0.7190, 0.7224,
            /* 0.6 */ 0.7257, 0.7291, 0.7324, 0.7357, 0.7389, 0.7422, 0.7454, 0.7486, 0.7517, 0.7549,
            /* 0.7 */ 0.7580, 0.7611, 0.7642, 0.7673, 0.7704, 0.7734, 0.7764, 0.7794, 0.7823, 0.7852,
            /* 0.8 */ 0.7881, 0.7910, 0.7939, 0.7967, 0.7995, 0.8023, 0.8051, 0.8078, 0.8106, 0.8133,
            /* 0.9 */ 0.8159, 0.8186, 0.8212, 0.8238, 0.8264, 0.8289, 0.8315, 0.8340, 0.8365, 0.8389,
            /* 1.0 */ 0.8413, 0.8438, 0.8461, 0.8485, 0.8508, 0.8531, 0.8554, 0.8577, 0.8599, 0.8621,
            /* 1.1 */ 0.8643, 0.8665, 0.8686, 0.8708, 0.8729, 0.8749, 0.8770, 0.8790, 0.8810, 0.8830,
            /* 1.2 */ 0.8849, 0.8869, 0.8888, 0.8907, 0.8925, 0.8944, 0.8962, 0.8980, 0.8997, 0.9015,
            /* 1.3 */ 0.9032, 0.9049, 0.9066, 0.9082, 0.9099, 0.9115, 0.9131, 0.9147, 0.9162, 0.9177,
            /* 1.4 */ 0.9192, 0.9207, 0.9222, 0.9236, 0.9251, 0.9265, 0.9279, 0.9292, 0.9306, 0.9319,
            /* 1.5 */ 0.9332, 0.9345, 0.9357, 0.9370, 0.9382, 0.9394, 0.9406, 0.9418, 0.9429, 0.9441,
            /* 1.6 */ 0.9452, 0.9463, 0.9474, 0.9484, 0.9495, 0.9505, 0.9515, 0.9525, 0.9535, 0.9545,
            /* 1.7 */ 0.9554, 0.9564, 0.9573, 0.9582, 0.9591, 0.9599, 0.9608, 0.9616, 0.9625, 0.9633,
            /* 1.8 */ 0.9641, 0.9649, 0.9656, 0.9664, 0.9671, 0.9678, 0.9686, 0.9693, 0.9699, 0.9706,
            /* 1.9 */ 0.9713, 0.9719, 0.9726, 0.9732, 0.9738, 0.9744, 0.9750, 0.9756, 0.9761, 0.9767,
            /* 2.0 */ 0.9772, 0.9778, 0.9783, 0.9788, 0.9793, 0.9798, 0.9803, 0.9808, 0.9812, 0.9817,
            /* 2.1 */ 0.9821, 0.9826, 0.9830, 0.9834, 0.9838, 0.9842, 0.9846, 0.9850, 0.9854, 0.9857,
            /* 2.2 */ 0.9861, 0.9864, 0.9868, 0.9871, 0.9875, 0.9878, 0.9881, 0.9884, 0.9887, 0.9890,
            /* 2.3 */ 0.9893, 0.9896, 0.9898, 0.9901, 0.9904, 0.9906, 0.9909, 0.9911, 0.9913, 0.9916,
            /* 2.4 */ 0.9918, 0.9920, 0.9922, 0.9925, 0.9927, 0.9929, 0.9931, 0.9932, 0.9934, 0.9936,
            /* 2.5 */ 0.9938, 0.9940, 0.9941, 0.9943, 0.9945, 0.9946, 0.9948, 0.9949, 0.9951, 0.9952,
            /* 2.6 */ 0.9953, 0.9955, 0.9956, 0.9957, 0.9959, 0.9960, 0.9961, 0.9962, 0.9963, 0.9964,
            /* 2.7 */ 0.9965, 0.9966, 0.9967, 0.9968, 0.9969, 0.9970, 0.9971, 0.9972, 0.9973, 0.9974,
            /* 2.8 */ 0.9974, 0.9975, 0.9976, 0.9977, 0.9977, 0.9978, 0.9979, 0.9979, 0.9980, 0.9981,
            /* 2.9 */ 0.9981, 0.9982, 0.9982, 0.9983, 0.9984, 0.9984, 0.9985, 0.9985, 0.9986, 0.9986,
            /* 3.0 */ 0.9987, 0.9987, 0.9987, 0.9988, 0.9988, 0.9989, 0.9989, 0.9989, 0.9990, 0.9990
        ];

        // # [Cumulative Standard Normal Probability](http://en.wikipedia.org/wiki/Standard_normal_table)
        //
        // Since probability tables cannot be
        // printed for every normal distribution, as there are an infinite variety
        // of normal distributions, it is common practice to convert a normal to a
        // standard normal and then use the standard normal table to find probabilities
        function cumulative_std_normal_probability(z) {

            // Calculate the position of this value.
            var absZ = Math.abs(z),
            // Each row begins with a different
            // significant digit: 0.5, 0.6, 0.7, and so on. So the row is simply
            // this value's significant digit: 0.567 will be in row 0, so row=0,
            // 0.643 will be in row 1, so row=10.
                row = Math.floor(absZ * 10),
                column = 10 * (Math.floor(absZ * 100) / 10 - Math.floor(absZ * 100 / 10)),
                index = Math.min((row * 10) + column, standard_normal_table.length - 1);

            // The index we calculate must be in the table as a positive value,
            // but we still pay attention to whether the input is postive
            // or negative, and flip the output value as a last step.
            if (z >= 0) {
                return standard_normal_table[index];
            } else {
                // due to floating-point arithmetic, values in the table with
                // 4 significant figures can nevertheless end up as repeating
                // fractions when they're computed here.
                return +(1 - standard_normal_table[index]).toFixed(4);
            }
        }

        // # [Z-Score, or Standard Score](http://en.wikipedia.org/wiki/Standard_score)
        //
        // The standard score is the number of standard deviations an observation
        // or datum is above or below the mean. Thus, a positive standard score
        // represents a datum above the mean, while a negative standard score
        // represents a datum below the mean. It is a dimensionless quantity
        // obtained by subtracting the population mean from an individual raw
        // score and then dividing the difference by the population standard
        // deviation.
        //
        // The z-score is only defined if one knows the population parameters;
        // if one only has a sample set, then the analogous computation with
        // sample mean and sample standard deviation yields the
        // Student's t-statistic.
        function z_score(x, mean, standard_deviation) {
            return (x - mean) / standard_deviation;
        }

        // # Mixin
        //
        // Mixin simple_statistics to the Array native object. This is an optional
        // feature that lets you treat simple_statistics as a native feature
        // of Javascript.
        function mixin() {
            var support = !!(Object.defineProperty && Object.defineProperties);
            if (!support) {
                throw new Error('without defineProperty, simple-statistics cannot be mixed in');
            }

            // only methods which work on basic arrays in a single step
            // are supported
            var arrayMethods = ['median', 'standard_deviation', 'sum',
                'sample_skewness',
                'mean', 'min', 'max', 'quantile', 'geometric_mean'];

            // create a closure with a method name so that a reference
            // like `arrayMethods[i]` doesn't follow the loop increment
            function wrap(method) {
                return function () {
                    // cast any arguments into an array, since they're
                    // natively objects
                    var args = Array.prototype.slice.apply(arguments);
                    // make the first argument the array itself
                    args.unshift(this);
                    // return the result of the ss method
                    return ss[method].apply(ss, args);
                };
            }

            // for each array function, define a function off of the Array
            // prototype which automatically gets the array as the first
            // argument. We use [defineProperty](https://developer.mozilla.org/en-US/docs/JavaScript/Reference/Global_Objects/Object/defineProperty)
            // because it allows these properties to be non-enumerable:
            // `for (var in x)` loops will not run into problems with this
            // implementation.
            for (var i = 0; i < arrayMethods.length; i++) {
                Object.defineProperty(Array.prototype, arrayMethods[i], {
                    value:        wrap(arrayMethods[i]),
                    configurable: true,
                    enumerable:   false,
                    writable:     true
                });
            }
        }

        ss.linear_regression = linear_regression;
        ss.standard_deviation = standard_deviation;
        ss.r_squared = r_squared;
        ss.median = median;
        ss.mean = mean;
        ss.mode = mode;
        ss.min = min;
        ss.max = max;
        ss.sum = sum;
        ss.quantile = quantile;
        ss.quantile_sorted = quantile_sorted;
        ss.iqr = iqr;
        ss.mad = mad;

        ss.sample_covariance = sample_covariance;
        ss.sample_correlation = sample_correlation;
        ss.sample_variance = sample_variance;
        ss.sample_standard_deviation = sample_standard_deviation;
        ss.sample_skewness = sample_skewness;

        ss.geometric_mean = geometric_mean;
        ss.variance = variance;
        ss.t_test = t_test;
        ss.t_test_two_sample = t_test_two_sample;

        // jenks
        ss.jenksMatrices = jenksMatrices;
        ss.jenksBreaks = jenksBreaks;
        ss.jenks = jenks;

        ss.bayesian = bayesian;

        // Normal distribution
        ss.z_score = z_score;
        ss.cumulative_std_normal_probability = cumulative_std_normal_probability;
        ss.standard_normal_table = standard_normal_table;

        // Alias this into its common name
        ss.average = mean;
        ss.interquartile_range = iqr;
        ss.mixin = mixin;
        ss.median_absolute_deviation = mad;

        return ss;
    }

    /* **************** TESTING UTILITY ********** */
    var assert = {
        ok: function (value, msg, debug) {
            if (!msg) {
                msg = 'not ok';
            }

            if (!value) {
                throw new Error('assert.ok FAIL: ' + msg);
            }
            if (debug) {
                console.log('ok: ', +msg);
            }
        },

        equal: function (a, b, msg, debug) {
            if (!msg) {
                msg = 'not equal';
            }

            if (a != b) {
                throw new Error('assert.equal FAIL: ' + a + '!= ' + b);
            }

            if (debug) {
                console.log('equal: ' + a + ',' + b + ' ' + msg);
            }
        },

        objEqual: function (a, b, msg, debug) {
            a = JSON.stringify(a);
            b = JSON.stringify(b);
            assert.equal(a, b, msg, debug);
        },

        objNotEqual: function (a, b, msg, debug) {
            a = JSON.stringify(a);
            b = JSON.stringify(b);
            if (a == b) {
                throw new Error('not supposed to equal: ' + a + ' vs. ' + b);
            }
            if (debug) {
                console.log('not equal: ' + a + ',' + b + ' ' + msg);
            }
        }
    }

    /* **************** CORE smoothSeries ********** */
    var DEBUG = false;

    /**
     * the average distance between the item and its neighbors values.
     * @param series {Array(number)}
     * @returns {Array|*}
     * @private
     */
    function _change(series) {
        if (series.length < 2) {
            return [0];
        }
        return _.map(series, function (item, index) {
            switch (index) {
                case 0:
                    return Math.abs(item - series[index + 1]);
                    break;

                case series.length - 1:
                    return Math.abs(item - series[index - 1]);
                    break;

                default:
                    return (Math.abs(item - series[index - 1]) +
                        Math.abs(item - series[index + 1])) / 2.0;

            }
        });
    }

    /**
     * this is a function that takes in an arbitrary series of data and
     * removes elements whose strange data spikes have been smoothed out.
     * @param numbers an array of numbers, or an array of vertexes (arrays of numbers).
     * @param index
     * @param threshold
     * @returns {*}
     */

    function smoothSeries(numbers, index, threshold) {

        if (!threshold) {
            threshold = 1;
        }
        if (arguments.length > 1) {
            numbers = _.map(numbers, function (item) {

                if (!_.isArray(item)) {
                    throw new Error('non array element in series');
                }
                var value = item[index];

                if (!_.isNumber(value)) {
                    throw new Error('non numeric data in series');
                }

                return value;
            });
        } else {
            numbers = numbers.slice(0);
        }

        var d1 = _change(numbers);
        var stdev = ss.standard_deviation(d1);
        var average = ss.average(d1);
        var thr = Math.max(threshold, stdev);
        var max_acceptable = average + thr;

        if (DEBUG) {
            console.log('numbers: ', numbers);
            console.log('average change: ', average);
            console.log('stdev: ', stdev);
            console.log('thr: ', thr);
            console.log('max_acceptable: ', max_acceptable);
            console.log('d1: ', d1);
        }

        return _.map(numbers, function (value, index) {
            if (d1[index] > max_acceptable) {
                switch (index) {
                    case 0:
                        return numbers[index + 1];
                        break;

                    case numbers.length - 1:
                        return numbers[index - 1];
                        break;

                    default:
                        return (numbers[index + 1] + numbers[index - 1]) / 2;
                }
            } else {
                return value;
            }
        });
    };

    var TEST = false;

    if (TEST) {
        (function (smoothSeries) {

            var data = [1, 2, 3, 4, 5];

            var smoothData = smoothSeries(data);

            assert.objEqual(data, smoothData, 'smooth series not changed', DEBUG);

            var data2 = [1, 2, 100, 4, 5];
            var smoothData2 = smoothSeries(data2);

            assert.objEqual(data, smoothData2, 'jump in series averaged', DEBUG);

            var data3 = [1, 2, 5, 4, 6];

            assert.objEqual(data3, smoothSeries(data3), 'slighthly jumpy series not changed', DEBUG);

            var data4 = [1, 2, 7, 4, 6];

            assert.objNotEqual(data4, smoothSeries(data4), 'rather jumpy series changed', DEBUG);

            var vectors = [
                [1, 2, 3],
                [2, 2, 3],
                [3, 2, 3]
            ];

            assert.objEqual([1, 2, 3], smoothSeries(vectors, 0), 'extracting value from a vector', DEBUG);

            assert.objEqual(smoothSeries([
                [1, 2, 3],
                [2, 2, 3],
                [7, 2, 3],
                [4, 2, 3],
                [6, 2, 3]
            ], 0), [1, 2, 3, 4, 6], 'rather jumpy vector series changed', DEBUG);

        })(smoothSeries);
    }

    window.smoothSeries = smoothSeries;
 })(window);