Search code examples
javascipyp-valueapache-commons-math

zScore and p-value in Java (survival function)


What would be the java equivalent of the following code?

import scipy
from scipy.stats import zscore
zlist = [9967,11281,10752,10576,2366,11882,11798,]
z = zscore(zlist)
for e in z:
    print e,scipy.stats.norm.sf(abs(e))

Solution

  • And the answer is:

    private void run() {
        double[] values = {9967,11281,10752,10576,2366,11882,11798};
        double variance = StatUtils.populationVariance(values);
        double sd = Math.sqrt(variance);
        double mean = StatUtils.mean(values);
        NormalDistribution nd = new NormalDistribution();
        for ( double value: values ) {
            double stdscore = (value-mean)/sd;
            double sf = 1.0 - nd.cumulativeProbability(Math.abs(stdscore));
            System.out.println("" + stdscore + " " + sf);
        }
    }
    

    This is using The Apache Commons Mathematics Library

    EDIT: Or, even better:

    import java.util.function.BiConsumer;
    
    import org.apache.commons.math3.distribution.NormalDistribution;
    import org.apache.commons.math3.distribution.RealDistribution;
    import org.apache.commons.math3.stat.descriptive.DescriptiveStatistics;
    
    public class ZScore {
        public static void main(String[] args) {
            ZScore program = new ZScore();
            double[] values = {9967,11281,10752,10576,2366,11882,11798};
            program.computeZScoreAndSurvivalFunctions(
                new DescriptiveStatistics(values), 
                new NormalDistribution(), 
                (zscore, sf)->System.out.println(""+zscore+" "+sf)
            );
        }
    
        private void computeZScoreAndSurvivalFunctions(
            DescriptiveStatistics ds, 
            RealDistribution dist, 
            BiConsumer<Double, Double> consumer
        ) {
            double variance = ds.getPopulationVariance();
            double sd = Math.sqrt(variance);
            double mean = ds.getMean();
            for ( int index = 0; index < ds.getN(); ++index) {
                double zscore = (ds.getElement(index)-mean)/sd;
                double sf = 1.0 - dist.cumulativeProbability(Math.abs(zscore));
                consumer.accept(zscore, sf);
            }
        }
    }