summaryrefslogtreecommitdiff
path: root/src/main/java/org/apache/commons/math3/stat/inference/BinomialTest.java
diff options
context:
space:
mode:
Diffstat (limited to 'src/main/java/org/apache/commons/math3/stat/inference/BinomialTest.java')
-rw-r--r--src/main/java/org/apache/commons/math3/stat/inference/BinomialTest.java160
1 files changed, 160 insertions, 0 deletions
diff --git a/src/main/java/org/apache/commons/math3/stat/inference/BinomialTest.java b/src/main/java/org/apache/commons/math3/stat/inference/BinomialTest.java
new file mode 100644
index 0000000..2efe091
--- /dev/null
+++ b/src/main/java/org/apache/commons/math3/stat/inference/BinomialTest.java
@@ -0,0 +1,160 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+package org.apache.commons.math3.stat.inference;
+
+import org.apache.commons.math3.distribution.BinomialDistribution;
+import org.apache.commons.math3.exception.MathIllegalArgumentException;
+import org.apache.commons.math3.exception.MathInternalError;
+import org.apache.commons.math3.exception.NotPositiveException;
+import org.apache.commons.math3.exception.NullArgumentException;
+import org.apache.commons.math3.exception.OutOfRangeException;
+import org.apache.commons.math3.exception.util.LocalizedFormats;
+
+/**
+ * Implements binomial test statistics.
+ * <p>
+ * Exact test for the statistical significance of deviations from a
+ * theoretically expected distribution of observations into two categories.
+ *
+ * @see <a href="http://en.wikipedia.org/wiki/Binomial_test">Binomial test (Wikipedia)</a>
+ * @since 3.3
+ */
+public class BinomialTest {
+
+ /**
+ * Returns whether the null hypothesis can be rejected with the given confidence level.
+ * <p>
+ * <strong>Preconditions</strong>:
+ * <ul>
+ * <li>Number of trials must be &ge; 0.</li>
+ * <li>Number of successes must be &ge; 0.</li>
+ * <li>Number of successes must be &le; number of trials.</li>
+ * <li>Probability must be &ge; 0 and &le; 1.</li>
+ * </ul>
+ *
+ * @param numberOfTrials number of trials performed
+ * @param numberOfSuccesses number of successes observed
+ * @param probability assumed probability of a single trial under the null hypothesis
+ * @param alternativeHypothesis type of hypothesis being evaluated (one- or two-sided)
+ * @param alpha significance level of the test
+ * @return true if the null hypothesis can be rejected with confidence {@code 1 - alpha}
+ * @throws NotPositiveException if {@code numberOfTrials} or {@code numberOfSuccesses} is negative
+ * @throws OutOfRangeException if {@code probability} is not between 0 and 1
+ * @throws MathIllegalArgumentException if {@code numberOfTrials} &lt; {@code numberOfSuccesses} or
+ * if {@code alternateHypothesis} is null.
+ * @see AlternativeHypothesis
+ */
+ public boolean binomialTest(int numberOfTrials, int numberOfSuccesses, double probability,
+ AlternativeHypothesis alternativeHypothesis, double alpha) {
+ double pValue = binomialTest(numberOfTrials, numberOfSuccesses, probability, alternativeHypothesis);
+ return pValue < alpha;
+ }
+
+ /**
+ * Returns the <i>observed significance level</i>, or
+ * <a href="http://www.cas.lancs.ac.uk/glossary_v1.1/hyptest.html#pvalue">p-value</a>,
+ * associated with a <a href="http://en.wikipedia.org/wiki/Binomial_test"> Binomial test</a>.
+ * <p>
+ * The number returned is the smallest significance level at which one can reject the null hypothesis.
+ * The form of the hypothesis depends on {@code alternativeHypothesis}.</p>
+ * <p>
+ * The p-Value represents the likelihood of getting a result at least as extreme as the sample,
+ * given the provided {@code probability} of success on a single trial. For single-sided tests,
+ * this value can be directly derived from the Binomial distribution. For the two-sided test,
+ * the implementation works as follows: we start by looking at the most extreme cases
+ * (0 success and n success where n is the number of trials from the sample) and determine their likelihood.
+ * The lower value is added to the p-Value (if both values are equal, both are added). Then we continue with
+ * the next extreme value, until we added the value for the actual observed sample.</p>
+ * <p>
+ * <strong>Preconditions</strong>:
+ * <ul>
+ * <li>Number of trials must be &ge; 0.</li>
+ * <li>Number of successes must be &ge; 0.</li>
+ * <li>Number of successes must be &le; number of trials.</li>
+ * <li>Probability must be &ge; 0 and &le; 1.</li>
+ * </ul></p>
+ *
+ * @param numberOfTrials number of trials performed
+ * @param numberOfSuccesses number of successes observed
+ * @param probability assumed probability of a single trial under the null hypothesis
+ * @param alternativeHypothesis type of hypothesis being evaluated (one- or two-sided)
+ * @return p-value
+ * @throws NotPositiveException if {@code numberOfTrials} or {@code numberOfSuccesses} is negative
+ * @throws OutOfRangeException if {@code probability} is not between 0 and 1
+ * @throws MathIllegalArgumentException if {@code numberOfTrials} &lt; {@code numberOfSuccesses} or
+ * if {@code alternateHypothesis} is null.
+ * @see AlternativeHypothesis
+ */
+ public double binomialTest(int numberOfTrials, int numberOfSuccesses, double probability,
+ AlternativeHypothesis alternativeHypothesis) {
+ if (numberOfTrials < 0) {
+ throw new NotPositiveException(numberOfTrials);
+ }
+ if (numberOfSuccesses < 0) {
+ throw new NotPositiveException(numberOfSuccesses);
+ }
+ if (probability < 0 || probability > 1) {
+ throw new OutOfRangeException(probability, 0, 1);
+ }
+ if (numberOfTrials < numberOfSuccesses) {
+ throw new MathIllegalArgumentException(
+ LocalizedFormats.BINOMIAL_INVALID_PARAMETERS_ORDER,
+ numberOfTrials, numberOfSuccesses);
+ }
+ if (alternativeHypothesis == null) {
+ throw new NullArgumentException();
+ }
+
+ // pass a null rng to avoid unneeded overhead as we will not sample from this distribution
+ final BinomialDistribution distribution = new BinomialDistribution(null, numberOfTrials, probability);
+ switch (alternativeHypothesis) {
+ case GREATER_THAN:
+ return 1 - distribution.cumulativeProbability(numberOfSuccesses - 1);
+ case LESS_THAN:
+ return distribution.cumulativeProbability(numberOfSuccesses);
+ case TWO_SIDED:
+ int criticalValueLow = 0;
+ int criticalValueHigh = numberOfTrials;
+ double pTotal = 0;
+
+ while (true) {
+ double pLow = distribution.probability(criticalValueLow);
+ double pHigh = distribution.probability(criticalValueHigh);
+
+ if (pLow == pHigh) {
+ pTotal += 2 * pLow;
+ criticalValueLow++;
+ criticalValueHigh--;
+ } else if (pLow < pHigh) {
+ pTotal += pLow;
+ criticalValueLow++;
+ } else {
+ pTotal += pHigh;
+ criticalValueHigh--;
+ }
+
+ if (criticalValueLow > numberOfSuccesses || criticalValueHigh < numberOfSuccesses) {
+ break;
+ }
+ }
+ return pTotal;
+ default:
+ throw new MathInternalError(LocalizedFormats. OUT_OF_RANGE_SIMPLE, alternativeHypothesis,
+ AlternativeHypothesis.TWO_SIDED, AlternativeHypothesis.LESS_THAN);
+ }
+ }
+}