All Downloads are FREE. Search and download functionalities are using the official Maven repository.

smile.stat.distribution.GeometricDistribution Maven / Gradle / Ivy

The newest version!
/*******************************************************************************
 * Copyright (c) 2010 Haifeng Li
 *   
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *  
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *******************************************************************************/
package smile.stat.distribution;

/**
 * The geometric distribution is a discrete probability distribution of the
 * number X of Bernoulli trials needed to get one success, supported on the set
 * {1, 2, 3, …}. Sometimes, people define that the probability distribution
 * of the number Y = X - 1 of failures before the first success, supported on
 * the set {0, 1, 2, 3, …}. To reduce the confusion, we denote the later as
 * shifted geometric distribution.
 * If the probability of success on each trial is p, then the probability that
 * the k-th trial (out of k trials) is the first success is
 * Pr(X = k) = (1 - p)k-1 p.
 * 

* Like its continuous analogue (the exponential distribution), the geometric * distribution is memoryless. That means that if you intend to repeat an * experiment until the first success, then, given that the first success has * not yet occurred, the conditional probability distribution of the number * of additional trials does not depend on how many failures have been * observed. The geometric distribution is in fact the only memoryless * discrete distribution. *

* Among all discrete probability distributions supported on {1, 2, 3, …} * with given expected value μ, the geometric distribution X with parameter * p = 1/μ is the one with the largest entropy. * @see ShiftedGeometricDistribution * * @author Haifeng Li */ public class GeometricDistribution extends DiscreteDistribution implements DiscreteExponentialFamily { /** * Probability of success on each trial. */ private double p; /** * The exponential distribution to generate Geometric distributed * random number. */ ExponentialDistribution expDist; /** * Constructor. * @param p the probability of success. */ public GeometricDistribution(double p) { if (p <= 0 || p > 1) { throw new IllegalArgumentException("Invalid p: " + p); } this.p = p; } /** * Constructor. Parameter will be estimated from the data by MLE. */ public GeometricDistribution(int[] data) { double sum = 0.0; for (int x : data) { if (x <= 0) { throw new IllegalArgumentException("Invalid value " + x); } sum += x; } p = data.length / sum; } /** * Returns the probability of success. */ public double getProb() { return p; } @Override public int npara() { return 1; } @Override public double mean() { return (1 - p) / p; } @Override public double var() { return (1 - p) / (p * p); } @Override public double sd() { return Math.sqrt(1 - p) / p; } /** * Shannon entropy. Not supported. */ @Override public double entropy() { throw new UnsupportedOperationException("Geometric distribution does not support entropy()"); } @Override public String toString() { return String.format("Geometric Distribution(%.4f)", p); } @Override public double rand() { if (expDist == null) { double lambda = -Math.log(1 - p); expDist = new ExponentialDistribution(lambda); } return Math.floor(expDist.rand()) + 1; } @Override public double p(int k) { if (k < 0) { return 0.0; } else { return Math.pow(1 - p, k) * p; } } @Override public double logp(int k) { if (k < 0) { return Double.NEGATIVE_INFINITY; } else { return k * Math.log(1 - p) + Math.log(p); } } @Override public double cdf(double k) { if (k < 0) { return 0.0; } else { return 1 - Math.pow(1 - p, k + 1); } } @Override public double quantile(double p) { if (p < 0.0 || p > 1.0) { throw new IllegalArgumentException("Invalid p: " + p); } int n = (int) Math.max(Math.sqrt(1 / this.p), 5.0); int nl, nu, inc = 1; if (p < cdf(n)) { do { n = Math.max(n - inc, 0); inc *= 2; } while (p < cdf(n) && n > 0); nl = n; nu = n + inc / 2; } else { do { n += inc; inc *= 2; } while (p > cdf(n)); nu = n; nl = n - inc / 2; } return quantile(p, nl, nu); } @Override public DiscreteMixture.Component M(int[] x, double[] posteriori) { double alpha = 0.0; double mean = 0.0; for (int i = 0; i < x.length; i++) { alpha += posteriori[i]; mean += x[i] * posteriori[i]; } mean /= alpha; DiscreteMixture.Component c = new DiscreteMixture.Component(); c.priori = alpha; c.distribution = new GeometricDistribution(1 / mean); return c; } }





© 2015 - 2025 Weber Informatics LLC | Privacy Policy