UNPKG

probability-distributions/index.js

Version:
24.8 kBJavaScriptView Raw
/* ================================================================
* probability-distributions by Matt Asher (me[at]mattasher.com)
* Originally created for StatisticsBlog.com
*
* first created at : Sat Oct 10 2015
*
* ================================================================
* Copyright 2015 Matt Asher
*
* Licensed under the MIT License
* You may not use this file except in compliance with the License.
*
* ================================================================ */
14
15var crypto = require('crypto');
16
17// Shortcuts
18var exp = Math.exp;
19var ln = Math.log;
20var PI = Math.PI;
21var pow = Math.pow;
22
23module.exports = {
24
  /**
   * This is the core function for generating entropy
   *
   * @param len number of bytes of entropy to create
   * @returns {number} A pseduo random number between 0 and 1
   *
   */
  prng: function(len) {
      if(len === undefined) len=16;
34
      var entropy = crypto.randomBytes(len);
      var result = 0;
37
      for(var i=0; i<len; i++) {
          result = result + Number(entropy[i])/Math.pow(256,(i+1))
      }
      return result
  },
43
44
45
46
  /**
   *
   * @param n The number of random variates to create. Must be a positive integer.
   * @param alpha First shape parameter
   * @param beta Second shape parameter
   * @param loc Location or Non-centrality parameter
   */
  rbeta: function(n, alpha, beta, loc) {
      // Uses relationship with gamma to calculate
56
      // Validations
      n = this._v(n, "n");
      alpha = this._v(alpha, "nn", 1);
      beta = this._v(beta, "nn", 1);
      loc =  this._v(loc, "r", 0);
62
      var toReturn = [];
64
      for(var i=0; i<n; i++) {
          var g1 = this.rgamma(1, alpha, 1)[0];
          var g2 = this.rgamma(1, beta, 1)[0];
68
69
          toReturn[i] = loc + g1/(g1+g2);
      }
      return toReturn
73
  },
75
76
  /**
   *
   * @param n Number of variates to return.
   * @param size Number of Bernoulli trials to be summed up. Defaults to 1
   * @param p Probability of a "success". Defaults to 0.5
   * @returns {Array} Random variates array
   */
  rbinom: function(n, size, p) {
      n = this._v(n, "n");
      size = this._v(size, "nni", 1);
      p = this._v(p, "p", 0.5);
88
      var toReturn = [];
90
      for(var i=0; i<n; i++) {
          var result = 0;
          for(var j=0; j<size; j++) {
              if(this.prng() < p) {
                  result++
              }
          }
          toReturn[i] = result;
      }
      return toReturn
  },
102
103
  /**
   *
   * @param n The number of variates to create
   * @param loc Location parameter
   * @param scale Scale parameter
   * @returns {Array} Random variates array
   */
  rcauchy: function(n, loc, scale) {
      n = this._v(n, "n");
      loc = this._v(loc, "r", 0);
      scale = this._v(scale, "nn", 1);
115
      var toReturn = [];
      for(var i=0; i<n; i++) {
          var x = scale * Math.tan(PI * (this.prng()-0.5))+loc;
119
          toReturn[i] = x;
      }
122
      return toReturn
  },
125
  /**
   *
   * @param n The number of variates to create
   * @param df Degrees of freedom for the distribution
   * @param ncp Non-centrality parameter
   * @returns {Array} Random variates array
   */
  rchisq: function(n, df, ncp) {
      n = this._v(n, "n");
      df = this._v(df, "nn");
      ncp = this._v(ncp, "r", 0);
137
      var toReturn = [];
      for(var i=0; i<n; i++) {
          // Start at ncp
          var x = ncp;
          for(var j=0; j<df; j++) {
              x = x + Math.pow(this.rnorm(1)[0],2);
          }
          toReturn[i] = x;
      }
      return toReturn
  },
149
  /**
   *
   * @param x Where to sample the density
   * @param rate The rate parameter. Must be a positive number
   * @returns {Number} The density given the parameter values
   */
  dexp: function(x, rate) {
      x = this._v(x, "r");
      rate = this._v(rate, "pos", 1);
      if(x < 0) return 0
160
      return rate * exp(-rate * x)
  },
163
  /**
   *
   * @param n The number of random variates to create. Must be a positive integer.
   * @param rate The rate parameter. Must be a positive number
   */
  rexp: function(n, rate) {
      n = this._v(n, "n");
      rate = this._v(rate, "pos", 1);
172
      var toReturn = [];
174
      for(var i=0; i<n; i++) {
176
          toReturn[i] =  -ln(this.prng())/rate;
      }
179
      return toReturn
  },
182
  /**
   *
   * @param n The number of variates to create
   * @param df1 Degrees of freedom for the first parameter
   * @param df2 Degrees of freedom for the first parameter
   * @returns {Array} Random variates array
   */
  rf: function(n, df1, df2) {
      n = this._v(n, "n");
      df1 = this._v(df1, "nn");
      df2 = this._v(df2, "nn");
194
      var toReturn = [];
      for(var i=0; i<n; i++) {
          var num = this.rchisq(1, df1)[0]/df1;
          var denom = this.rchisq(1, df2)[0]/df2;
199
          toReturn[i] = num/denom;
      }
202
      return toReturn
204
  },
206
207
  /**
   *
   * @param n The number of random variates to create. Must be a positive integer
   * @param alpha
   * @param rate
   * @returns {Array} Random variates array
   */
  rgamma: function(n, alpha, rate) {
      // Adapted from https://github.com/mvarshney/simjs-source/ & scipy
      n = this._v(n, "n");
      alpha = this._v(alpha, "nn");
      rate = this._v(rate, "pos", 1);
220
      var LOG4 = ln(4.0);
      var SG_MAGICCONST = 1.0 + ln(4.5);
      var beta = 1/rate;
224
      var toReturn = [];
      for(var i = 0; i<n; i++) {
227
          /* Based on Python 2.6 source code of random.py.
           */
230
          if (alpha > 1.0) {
              var ainv = Math.sqrt(2.0 * alpha - 1.0);
              var bbb = alpha - LOG4;
              var ccc = alpha + ainv;
235
              while (true) {
                  var u1 = this.prng();
                  if ((u1 < 1e-7) || (u > 0.9999999)) {
                      continue;
                  }
                  var u2 = 1.0 - this.prng();
                  var v = ln(u1 / (1.0 - u1)) / ainv;
                  var x = alpha * exp(v);
                  var z = u1 * u1 * u2;
                  var r = bbb + ccc * v - x;
                  if ((r + SG_MAGICCONST - 4.5 * z >= 0.0) || (r >= ln(z))) {
                      var result = x * beta;
                      break;
                  }
              }
          } else if (alpha == 1.0) {
              var u = this.prng();
              while (u <= 1e-7) {
                  u = this.prng();
              }
              var result = - ln(u) * beta;
          } else {
              while (true) {
                  var u = this.prng();
                  var b = (Math.E + alpha) / Math.E;
                  var p = b * u;
                  if (p <= 1.0) {
                      var x = Math.pow(p, 1.0 / alpha);
                  } else {
                      var x = - ln((b - p) / alpha);
                  }
                  var u1 = this.prng();
                  if (p > 1.0) {
                      if (u1 <= Math.pow(x, (alpha - 1.0))) {
                          break;
                      }
                  } else if (u1 <= exp(-x)) {
                      break;
                  }
              }
              var result =  x * beta;
          }
278
          toReturn[i] = result;
      }
281
      return toReturn;
283
  },
285
286
  /**
   *
   * @param n The number of random variates to create. Must be a positive integer
   * @param min Minimum value
   * @param max Maximum value
   * @param inclusive By default the minimum and maximum are inclusive. To make exclusive, set to false
   * @returns {Array}
   */
  rint: function(n, min, max, inclusive) {
      n = this._v(n, "n");
      min = this._v(min, "int");
      max = this._v(max, "int");
      if(inclusive === false) {
          min++;
          max--;
      }
303
      if(min > max) throw "Minimum value cannot be greater than maximum value. For non-inclusive, minimum and maximum must be separated by at least 2.";
305
      var toReturn = [];
307
      var raw = this.runif(n, min, max);
309
      for(var i=0; i<n; i++) {
          toReturn[i] = Math.round(raw[i]);
      }
313
      return toReturn
  },
316
  // Syntax as in R library VGAM
  /**
   *
   * @param n The number of random variates to create. Must be a positive integer
   * @param loc Mean
   * @param scale Scale parameter
   * @returns {Array} Random variates array
   */
  rlaplace: function(n, loc, scale) {
      n = this._v(n, "n");
      loc = this._v(loc, "r", 0);
      scale = this._v(scale, "nn", 1);
329
      var toReturn = [];
331
      for(var i=0; i<n; i++) {
          var core = this.sample([-1,1])[0] * ln(this.prng());
334
          var x = loc - scale * core;
336
          toReturn[i] = x;
      }
339
      return toReturn
  },
342
343
  /**
   *
   * @param n The number of random variates to create. Must be a positive integer.
   * @param meanlog The mean log.
   * @param sdlog Log SD. Must be greater than 0.
   * @returns {Array} Random variates array
   */
  rlnorm: function(n, meanlog, sdlog) {
      n = this._v(n, "n");
      meanlog = this._v(meanlog, "r", 0);
      sdlog = this._v(sdlog, "nn", 1);
355
      var toReturn = [];
357
      for(var i=0; i<n; i++) {
          var x = this.rnorm(1, meanlog, sdlog)[0];
360
          toReturn[i] = exp(x);
      }
363
      return toReturn
  },
366
  /**
   *
   * @param n The number of random variates to create. Must be a positive integer.
   * @param size Number of hits required
   * @param p Hit probability
   * @param mu Optional way to specify hit probability
   * @returns {Array} Random variates array
   */
  rnbinom: function(n, size, p, mu) {
      n = this._v(n, "n");
      if(size === undefined) size=1;
      if(Math.round(size) != size) throw "Size must be a whole number";
      if(size < 1) throw "Size must be one or greater";
      if(p !== undefined && mu !== undefined) throw "You must specify probability or mean, not both";
      if(mu !== undefined) p = size/(size+mu);
      p = this._v(p, "p");
383
384
      var toReturn = [];
386
      for(var i=0; i<n; i++) {
388
          // Core distribution
          var result = 0;
          var leftToFind = size;
          while(leftToFind > 0) {
              result++;
              if(this.prng() < p) leftToFind--;
          }
396
          toReturn[i] = result - 1;
      }
399
      return toReturn
401
  },
403
  /**
   *
   * @param x Where to sample the density
   * @param mean Mean of the distribution
   * @param sd Standard deviation for the distribution
   * @returns {Number} The density given the parameter values
   */
  dnorm: function(x, mean, sd) {
      x = this._v(x, "r");
      mean = this._v(mean, "r", 0);
      sd = this._v(sd, "nn", 1);
415
      // Check for degeneracy
      if(sd === 0) {
          if(x === mean) return Infinity;
          return 0
      }
421
      var a = sd*(Math.sqrt(2*PI));
      var b = -(x-mean)*(x-mean);
      var c = 2*sd*sd;
425
      return (1/a)*exp(b/c)
  },
428
429
  /**
   *
   * @param n The number of random variates to create. Must be a positive integer.
   * @param mean Mean of the distribution
   * @param sd Standard Deviation of the distribution
   * @returns {Array} Random variates array
   */
  rnorm: function(n, mean, sd) {
      // Adapted from http://blog.yjl.im/2010/09/simulating-normal-random-variable-using.html
439
      n = this._v(n, "n");
      mean = this._v(mean, "r", 0);
      sd = this._v(sd, "nn", 1);
443
      var toReturn = [];
445
      for(var i=0; i<n; i++) {
          var V1, V2, S, X;
448
          do {
              var U1 = this.prng();
              var U2 = this.prng();
              V1 = (2 * U1) - 1;
              V2 = (2 * U2) - 1;
              S = (V1 * V1) + (V2 * V2);
          } while (S > 1);
456
          X = Math.sqrt(-2 * ln(S) / S) * V1;
          X = mean + sd * X;
          toReturn.push(X);
      }
461
      return toReturn
  },
464
465
  /**
   *
   * @param x Where to sample the density
   * @param lambda Mean/variance
   * @returns {Number} The density given the parameter values
   */
  dpois: function(x, lambda) {
      x = this._v(x, "nni");
      lambda = this._v(lambda, "nn");
475
      // Check for degeneracy
      if(lambda === 0) {
          if(x === 0) return 1;
          return 0
      }
481
      var a = pow(lambda, x);
      var b = exp(-lambda);
      var c = this._factorial(x);
485
      return a*b/c
  },
488
489
  /**
   *
   * @param n The number of random variates to create. Must be a positive integer.
   * @param lambda Mean/Variance of the distribution
   * @returns {Array} Random variates array
   */
  rpois: function(n, lambda) {
      n = this._v(n, "n");
      lambda = this._v(lambda, "pos");
499
      var toReturn = [];
501
      for(var i=0; i<n; i++) {
503
          // Adapted from http://wiki.q-researchsoftware.com/wiki/How_to_Generate_Random_Numbers:_Poisson_Distribution
          if (lambda < 30) {
506
              var L = exp(-lambda);
              var p = 1;
              var k = 0;
              do {
                  k++;
                  p *= this.prng();
              } while (p > L);
              toReturn.push(k - 1);
515
          } else {
517
              // Roll our own
              // Fix total number of samples
              var samples = 10000;
              var p = lambda/samples;
              var k = 0;
              for(var j=0; j<samples; j++) {
                  if(this.prng() < p) {
                      k++
                  }
              }
              toReturn[i] = k;
          }
      }
531
      return toReturn
  },
534
  dunif: function(x, min, max) {
      x = this._v(x, "r");
      min = this._v(min, "r", 0);
      max = this._v(max, "r", 1);
      if(min > max) throw "Minimum value cannot be greater than maximum value";
540
      if(x < min || x > max) return 0;
      if(min === max) return Infinity;
543
544
      return 1/(max-min);
  },
547
548
  /**
   *
   * @param n  Number of variates to return
   * @param min Lower bound
   * @param max Upper bound
   * @returns {Array} Random variates array
   */
  runif: function(n, min, max) {
      n = this._v(n, "n");
      min = this._v(min, "r", 0);
      max = this._v(max, "r", 1);
      if(min > max) throw "Minimum value cannot be greater than maximum value";
561
      var toReturn = [];
563
      for(var i=0; i<n; i++) {
          var raw = this.prng();
          var scaled = min + raw*(max-min);
          toReturn.push(scaled)
      }
      return toReturn
  },
571
572
  /**
   *
   * @param collection Array of items to sample from
   * @param n Number of items to sample. If missing, n will be set to the length of the collection and it will shuffle
   * @param replace Sample with replacement? False by default
   * @param ratios Ratios to weight items. Can be any non-negative number. By default all items are given equal weight
   * @returns {Array} Array of sampled items
   */
  sample: function(collection, n, replace, ratios) {
582
      // Validations
      collection = this._v(collection, "a");
      n = this._v(n, "n", collection.length); // If n is undefined, sample the full array
      if(replace === undefined) replace = false;
      if(!replace && collection.length < n)
          throw "You cannot select " + n + " items from an array of length " + collection.length + " without replacement";
589
      if(ratios === undefined) {
          ratios = [];
          for(var m=0; m<collection.length; m++) { ratios[m] = 1 }
      }
594
      var cumulativeProbs = this._getCumulativeProbs(ratios, collection.length);
596
      // Main loop
      var toReturn = [];
599
      for(var i=0; i<n; i++) {
601
          var chosen = this._sampleOneIndex(cumulativeProbs);
603
          if(replace) {
              toReturn[i] = collection[chosen];
          } else {
607
              // Remove from collection and ratios
              toReturn[i] = collection.splice(chosen, 1)[0];
              ratios.splice(chosen, 1);
611
              // Make sure we aren't at the end
              if(ratios.length) {
                  cumulativeProbs = this._getCumulativeProbs(ratios, collection.length);
              }
          }
      }
618
      return toReturn;
620
  },
622
623
  // HELPERS
625
  /**
   *
   * @param ratios Array of non-negative numbers to be turned into CDF
   * @param len length of the collection
   * @returns {Array}
   * @private
   */
  _getCumulativeProbs: function(ratios, len) {
      if(len === undefined) throw "An error occurred: len was not sent to _getCumulativeProbs";
      if(ratios.length !== len) throw "Probabilities for sample must be same length as the array to sample from";
636
      var toReturn = [];
638
      if(ratios !== undefined) {
          ratios = this._v(ratios, "a");
          if(ratios.length !== len) throw "Probabilities array must be the same length as the array you are sampling from";
642
          var sum = 0;
          ratios.map(function(ratio) {
              ratio = this._v(ratio, "nn"); // Note validating as ANY non-negative number
              sum+= ratio;
              toReturn.push(sum);
          }.bind(this));
649
          // Divide by total to normalize
          for(var k=0; k<toReturn.length; k++) { toReturn[k] = toReturn[k]/sum }
          return toReturn
      }
  },
655
  _sampleOneIndex: function(cumulativeProbs) {
657
      var toTake = this.prng();
659
      // Find out where this lands in weights
      var cur = 0;
      while(toTake > cumulativeProbs[cur]) cur++;
663
      return cur;
  },
666
  _factorial: function(n) {
      var toReturn=1;
      for (var i = 2; i <= n; i++)
          toReturn = toReturn * i;
671
      return toReturn;
  },
674
  // Return default if undefined, otherwise validate
  _v: function(param, type, defaultParam) {
      if(param == null && defaultParam != null)
          return defaultParam;
679
      switch(type) {
681
          // Array of 1 item or more
          case "a":
              if(!Array.isArray(param) || !param.length) throw "Expected an array of length 1 or greater";
              return param;
686
          // Integer
          case "int":
              if(param !== Number(param)) throw "A required parameter is missing or not a number";
              if(param !== Math.round(param)) throw "Parameter must be a whole number";
              if(param === Infinity) throw 'Sent "infinity" as a parameter';
              return param;
693
          // Natural number
          case "n":
              if(param === undefined) throw "You must specify how many values you want";
              if(param !== Number(param)) throw "The number of values must be numeric";
              if(param !== Math.round(param)) throw "The number of values must be a whole number";
              if(param < 1) throw "The number of values must be a whole number of 1 or greater";
              if(param === Infinity) throw "The number of values cannot be infinite ;-)";
              return param;
702
          // Valid probability
          case "p":
              if(Number(param) !== param) throw "Probability value is missing or not a number";
              if(param > 1) throw "Probability values cannot be greater than 1";
              if(param < 0) throw "Probability values cannot be less than 0";
              return param;
709
          // Positive numbers
          case "pos":
              if(Number(param) !== param) throw "A required parameter is missing or not a number";
              if(param <= 0) throw "Parameter must be greater than 0";
              if(param === Infinity) throw 'Sent "infinity" as a parameter';
              return param;
716
          // Look for numbers (reals)
          case "r":
              if(Number(param) !== param) throw "A required parameter is missing or not a number";
              if(param === Infinity) throw 'Sent "infinity" as a parameter';
              return param;
722
          // Non negative real number
          case "nn":
              if(param !== Number(param)) throw "A required parameter is missing or not a number";
              if(param < 0) throw "Parameter cannot be less than 0";
              if(param === Infinity) throw 'Sent "infinity" as a parameter';
              return param;
729
          // Non negative whole number (integer)
          case "nni":
              if(param !== Number(param)) throw "A required parameter is missing or not a number";
              if(param !== Math.round(param)) throw "Parameter must be a whole number";
              if(param < 0) throw "Parameter cannot be less than zero";
              if(param === Infinity) throw 'Sent "infinity" as a parameter';
              return param;
737
      }
  },
740
741
  //    ________   _______  ______ _____  _____ __  __ ______ _   _ _______       _
  //   |  ____\ \ / /  __ \|  ____|  __ \|_   _|  \/  |  ____| \ | |__   __|/\   | |
  //   | |__   \ V /| |__) | |__  | |__) | | | | \  / | |__  |  \| |  | |  /  \  | |
  //   |  __|   > < |  ___/|  __| |  _  /  | | | |\/| |  __| | . ` |  | | / /\ \ | |
  //   | |____ / . \| |    | |____| | \ \ _| |_| |  | | |____| |\  |  | |/ ____ \| |____
  //   |______/_/ \_\_|    |______|_|  \_\_____|_|  |_|______|_| \_|  |_/_/    \_\______|
748
  /**
   *
   * @param n Number of variates to return
   * @param loc Starting point. Must be a non-negative integer. 0 for degenerate distribution of 0.
   * @param p Probability of moving towards finish
   * @param cap Maximum steps before giving up
   * @param trace Variable to track progress
   * @returns {Array} Random variates array
   *
   * The FML distribution is a is based on the number of steps taken to return to the origin
   * from a given position, with transition probabilities set at the beginning by picking a
   * random variate from U(0,1).
   */
  rfml: function (n, loc, p, cap, trace) {
      n = this._v(n, "n");
      loc = this._v(loc, "nni", 1);
      if(p === undefined) p=this.prng;
      cap = this._v(cap, "n", 10000);
      if(trace === undefined) trace={};
768
      var toReturn = [];
770
      for(var i=0; i<n; i++) {
          var x = 0;
          var s = loc;
          var currP = p();
          if(loc === 0) {
776
              toReturn[i] = 0;
          } else {
779
              do {
781
                  var trial = this.prng();
                  if(trial < currP) {
                      s++;
                      trace[String(i) + "_" + String(x)] = { problems: s, p: currP, result: 1 }
                  } else {
                      s--;
                      trace[String(i) + "_" + String(x)] = { problems: s, p: currP, result: -1 }
                  }
                  x++
              } while(s > 0 && x < cap);
792
              if(x === cap) x = -1; // Indicate we failed to do it in time.
              toReturn[i] = x;
          }
      }
      return toReturn
  },
799
  // http://www.statisticsblog.com/2013/05/uncovering-the-unreliable-friend-distribution-a-case-study-in-the-limits-of-mc-methods/
  /**
   *
   * The Unrelaible Friend distribution
   * @param n
   * @returns {Array} Random variates array
   */
  ruf: function(n) {
      n = this._v(n, "n");
809
      var toReturn = [];
811
      for(var i=0; i<n; i++) {
          toReturn[i] = this.rexp(1, this.prng())[0];
      }
815
      return toReturn
  }
818};
819
// TODO: Add "perfect fake" functions: http://www.statisticsblog.com/2010/06/the-perfect-fake/
// NOTES
// Potential config options:
// default entropy amount
// Need pathway to make ready for secure applications (NIST/diehard?)
// Always return a vector unless number is 1? This could be config option or put "1" at end of fcn to get 1 only
// Separate out core random variate creation from number to create loop
// TODO: To test out quality of randomness, stub in specific values for this.prng and make sure correct stuff is returned.
\No newline at end of file
1	`/* ================================================================`
2	`* probability-distributions by Matt Asher (me[at]mattasher.com)`
3	`* Originally created for StatisticsBlog.com`
4	`*`
5	`* first created at : Sat Oct 10 2015`
6	`*`
7	`* ================================================================`
8	`* Copyright 2015 Matt Asher`
9	`*`
10	`* Licensed under the MIT License`
11	`* You may not use this file except in compliance with the License.`
12	`*`
13	`* ================================================================ */`
14
15	`var crypto = require('crypto');`
16
17	`// Shortcuts`
18	`var exp = Math.exp;`
19	`var ln = Math.log;`
20	`var PI = Math.PI;`
21	`var pow = Math.pow;`
22
23	`module.exports = {`
24
25	`/**`
26	`* This is the core function for generating entropy`
27	`*`
28	`* @param len number of bytes of entropy to create`
29	`* @returns {number} A pseduo random number between 0 and 1`
30	`*`
31	`*/`
32	`prng: function(len) {`
33	`if(len === undefined) len=16;`
34
35	`var entropy = crypto.randomBytes(len);`
36	`var result = 0;`
37
38	`for(var i=0; i<len; i++) {`
39	`result = result + Number(entropy[i])/Math.pow(256,(i+1))`
40	`}`