Mercurial > hg > de.mpg.mpiwg.itgroup.digilib.plugin

<HTML>
<BODY BGCOLOR="white">
<PRE>
<FONT color="green">001</FONT>    /*<a name="line.1"></a>
<FONT color="green">002</FONT>     * Licensed to the Apache Software Foundation (ASF) under one or more<a name="line.2"></a>
<FONT color="green">003</FONT>     * contributor license agreements.  See the NOTICE file distributed with<a name="line.3"></a>
<FONT color="green">004</FONT>     * this work for additional information regarding copyright ownership.<a name="line.4"></a>
<FONT color="green">005</FONT>     * The ASF licenses this file to You under the Apache License, Version 2.0<a name="line.5"></a>
<FONT color="green">006</FONT>     * (the "License"); you may not use this file except in compliance with<a name="line.6"></a>
<FONT color="green">007</FONT>     * the License.  You may obtain a copy of the License at<a name="line.7"></a>
<FONT color="green">008</FONT>     *<a name="line.8"></a>
<FONT color="green">009</FONT>     *      http://www.apache.org/licenses/LICENSE-2.0<a name="line.9"></a>
<FONT color="green">010</FONT>     *<a name="line.10"></a>
<FONT color="green">011</FONT>     * Unless required by applicable law or agreed to in writing, software<a name="line.11"></a>
<FONT color="green">012</FONT>     * distributed under the License is distributed on an "AS IS" BASIS,<a name="line.12"></a>
<FONT color="green">013</FONT>     * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.<a name="line.13"></a>
<FONT color="green">014</FONT>     * See the License for the specific language governing permissions and<a name="line.14"></a>
<FONT color="green">015</FONT>     * limitations under the License.<a name="line.15"></a>
<FONT color="green">016</FONT>     */<a name="line.16"></a>
<FONT color="green">017</FONT>    package org.apache.commons.math.stat.inference;<a name="line.17"></a>
<FONT color="green">018</FONT>    <a name="line.18"></a>
<FONT color="green">019</FONT>    import org.apache.commons.math.MathException;<a name="line.19"></a>
<FONT color="green">020</FONT>    import org.apache.commons.math.MathRuntimeException;<a name="line.20"></a>
<FONT color="green">021</FONT>    import org.apache.commons.math.distribution.TDistribution;<a name="line.21"></a>
<FONT color="green">022</FONT>    import org.apache.commons.math.distribution.TDistributionImpl;<a name="line.22"></a>
<FONT color="green">023</FONT>    import org.apache.commons.math.stat.StatUtils;<a name="line.23"></a>
<FONT color="green">024</FONT>    import org.apache.commons.math.stat.descriptive.StatisticalSummary;<a name="line.24"></a>
<FONT color="green">025</FONT>    <a name="line.25"></a>
<FONT color="green">026</FONT>    /**<a name="line.26"></a>
<FONT color="green">027</FONT>     * Implements t-test statistics defined in the {@link TTest} interface.<a name="line.27"></a>
<FONT color="green">028</FONT>     * &lt;p&gt;<a name="line.28"></a>
<FONT color="green">029</FONT>     * Uses commons-math {@link org.apache.commons.math.distribution.TDistribution}<a name="line.29"></a>
<FONT color="green">030</FONT>     * implementation to estimate exact p-values.&lt;/p&gt;<a name="line.30"></a>
<FONT color="green">031</FONT>     *<a name="line.31"></a>
<FONT color="green">032</FONT>     * @version $Revision: 885278 $ $Date: 2009-11-29 16:47:51 -0500 (Sun, 29 Nov 2009) $<a name="line.32"></a>
<FONT color="green">033</FONT>     */<a name="line.33"></a>
<FONT color="green">034</FONT>    public class TTestImpl implements TTest  {<a name="line.34"></a>
<FONT color="green">035</FONT>    <a name="line.35"></a>
<FONT color="green">036</FONT>        /** Message for insufficient data. */<a name="line.36"></a>
<FONT color="green">037</FONT>        private static final String INSUFFICIENT_DATA_MESSAGE =<a name="line.37"></a>
<FONT color="green">038</FONT>            "insufficient data for t statistic, needs at least 2, got {0}";<a name="line.38"></a>
<FONT color="green">039</FONT>    <a name="line.39"></a>
<FONT color="green">040</FONT>        /** Distribution used to compute inference statistics. */<a name="line.40"></a>
<FONT color="green">041</FONT>        private TDistribution distribution;<a name="line.41"></a>
<FONT color="green">042</FONT>    <a name="line.42"></a>
<FONT color="green">043</FONT>        /**<a name="line.43"></a>
<FONT color="green">044</FONT>         * Default constructor.<a name="line.44"></a>
<FONT color="green">045</FONT>         */<a name="line.45"></a>
<FONT color="green">046</FONT>        public TTestImpl() {<a name="line.46"></a>
<FONT color="green">047</FONT>            this(new TDistributionImpl(1.0));<a name="line.47"></a>
<FONT color="green">048</FONT>        }<a name="line.48"></a>
<FONT color="green">049</FONT>    <a name="line.49"></a>
<FONT color="green">050</FONT>        /**<a name="line.50"></a>
<FONT color="green">051</FONT>         * Create a test instance using the given distribution for computing<a name="line.51"></a>
<FONT color="green">052</FONT>         * inference statistics.<a name="line.52"></a>
<FONT color="green">053</FONT>         * @param t distribution used to compute inference statistics.<a name="line.53"></a>
<FONT color="green">054</FONT>         * @since 1.2<a name="line.54"></a>
<FONT color="green">055</FONT>         */<a name="line.55"></a>
<FONT color="green">056</FONT>        public TTestImpl(TDistribution t) {<a name="line.56"></a>
<FONT color="green">057</FONT>            super();<a name="line.57"></a>
<FONT color="green">058</FONT>            setDistribution(t);<a name="line.58"></a>
<FONT color="green">059</FONT>        }<a name="line.59"></a>
<FONT color="green">060</FONT>    <a name="line.60"></a>
<FONT color="green">061</FONT>        /**<a name="line.61"></a>
<FONT color="green">062</FONT>         * Computes a paired, 2-sample t-statistic based on the data in the input<a name="line.62"></a>
<FONT color="green">063</FONT>         * arrays.  The t-statistic returned is equivalent to what would be returned by<a name="line.63"></a>
<FONT color="green">064</FONT>         * computing the one-sample t-statistic {@link #t(double, double[])}, with<a name="line.64"></a>
<FONT color="green">065</FONT>         * &lt;code&gt;mu = 0&lt;/code&gt; and the sample array consisting of the (signed)<a name="line.65"></a>
<FONT color="green">066</FONT>         * differences between corresponding entries in &lt;code&gt;sample1&lt;/code&gt; and<a name="line.66"></a>
<FONT color="green">067</FONT>         * &lt;code&gt;sample2.&lt;/code&gt;<a name="line.67"></a>
<FONT color="green">068</FONT>         * &lt;p&gt;<a name="line.68"></a>
<FONT color="green">069</FONT>         * &lt;strong&gt;Preconditions&lt;/strong&gt;: &lt;ul&gt;<a name="line.69"></a>
<FONT color="green">070</FONT>         * &lt;li&gt;The input arrays must have the same length and their common length<a name="line.70"></a>
<FONT color="green">071</FONT>         * must be at least 2.<a name="line.71"></a>
<FONT color="green">072</FONT>         * &lt;/li&gt;&lt;/ul&gt;&lt;/p&gt;<a name="line.72"></a>
<FONT color="green">073</FONT>         *<a name="line.73"></a>
<FONT color="green">074</FONT>         * @param sample1 array of sample data values<a name="line.74"></a>
<FONT color="green">075</FONT>         * @param sample2 array of sample data values<a name="line.75"></a>
<FONT color="green">076</FONT>         * @return t statistic<a name="line.76"></a>
<FONT color="green">077</FONT>         * @throws IllegalArgumentException if the precondition is not met<a name="line.77"></a>
<FONT color="green">078</FONT>         * @throws MathException if the statistic can not be computed do to a<a name="line.78"></a>
<FONT color="green">079</FONT>         *         convergence or other numerical error.<a name="line.79"></a>
<FONT color="green">080</FONT>         */<a name="line.80"></a>
<FONT color="green">081</FONT>        public double pairedT(double[] sample1, double[] sample2)<a name="line.81"></a>
<FONT color="green">082</FONT>            throws IllegalArgumentException, MathException {<a name="line.82"></a>
<FONT color="green">083</FONT>            checkSampleData(sample1);<a name="line.83"></a>
<FONT color="green">084</FONT>            checkSampleData(sample2);<a name="line.84"></a>
<FONT color="green">085</FONT>            double meanDifference = StatUtils.meanDifference(sample1, sample2);<a name="line.85"></a>
<FONT color="green">086</FONT>            return t(meanDifference, 0,<a name="line.86"></a>
<FONT color="green">087</FONT>                    StatUtils.varianceDifference(sample1, sample2, meanDifference),<a name="line.87"></a>
<FONT color="green">088</FONT>                    sample1.length);<a name="line.88"></a>
<FONT color="green">089</FONT>        }<a name="line.89"></a>
<FONT color="green">090</FONT>    <a name="line.90"></a>
<FONT color="green">091</FONT>         /**<a name="line.91"></a>
<FONT color="green">092</FONT>         * Returns the &lt;i&gt;observed significance level&lt;/i&gt;, or<a name="line.92"></a>
<FONT color="green">093</FONT>         * &lt;i&gt; p-value&lt;/i&gt;, associated with a paired, two-sample, two-tailed t-test<a name="line.93"></a>
<FONT color="green">094</FONT>         * based on the data in the input arrays.<a name="line.94"></a>
<FONT color="green">095</FONT>         * &lt;p&gt;<a name="line.95"></a>
<FONT color="green">096</FONT>         * The number returned is the smallest significance level<a name="line.96"></a>
<FONT color="green">097</FONT>         * at which one can reject the null hypothesis that the mean of the paired<a name="line.97"></a>
<FONT color="green">098</FONT>         * differences is 0 in favor of the two-sided alternative that the mean paired<a name="line.98"></a>
<FONT color="green">099</FONT>         * difference is not equal to 0. For a one-sided test, divide the returned<a name="line.99"></a>
<FONT color="green">100</FONT>         * value by 2.&lt;/p&gt;<a name="line.100"></a>
<FONT color="green">101</FONT>         * &lt;p&gt;<a name="line.101"></a>
<FONT color="green">102</FONT>         * This test is equivalent to a one-sample t-test computed using<a name="line.102"></a>
<FONT color="green">103</FONT>         * {@link #tTest(double, double[])} with &lt;code&gt;mu = 0&lt;/code&gt; and the sample<a name="line.103"></a>
<FONT color="green">104</FONT>         * array consisting of the signed differences between corresponding elements of<a name="line.104"></a>
<FONT color="green">105</FONT>         * &lt;code&gt;sample1&lt;/code&gt; and &lt;code&gt;sample2.&lt;/code&gt;&lt;/p&gt;<a name="line.105"></a>
<FONT color="green">106</FONT>         * &lt;p&gt;<a name="line.106"></a>
<FONT color="green">107</FONT>         * &lt;strong&gt;Usage Note:&lt;/strong&gt;&lt;br&gt;<a name="line.107"></a>
<FONT color="green">108</FONT>         * The validity of the p-value depends on the assumptions of the parametric<a name="line.108"></a>
<FONT color="green">109</FONT>         * t-test procedure, as discussed<a name="line.109"></a>
<FONT color="green">110</FONT>         * &lt;a href="http://www.basic.nwu.edu/statguidefiles/ttest_unpaired_ass_viol.html"&gt;<a name="line.110"></a>
<FONT color="green">111</FONT>         * here&lt;/a&gt;&lt;/p&gt;<a name="line.111"></a>
<FONT color="green">112</FONT>         * &lt;p&gt;<a name="line.112"></a>
<FONT color="green">113</FONT>         * &lt;strong&gt;Preconditions&lt;/strong&gt;: &lt;ul&gt;<a name="line.113"></a>
<FONT color="green">114</FONT>         * &lt;li&gt;The input array lengths must be the same and their common length must<a name="line.114"></a>
<FONT color="green">115</FONT>         * be at least 2.<a name="line.115"></a>
<FONT color="green">116</FONT>         * &lt;/li&gt;&lt;/ul&gt;&lt;/p&gt;<a name="line.116"></a>
<FONT color="green">117</FONT>         *<a name="line.117"></a>
<FONT color="green">118</FONT>         * @param sample1 array of sample data values<a name="line.118"></a>
<FONT color="green">119</FONT>         * @param sample2 array of sample data values<a name="line.119"></a>
<FONT color="green">120</FONT>         * @return p-value for t-test<a name="line.120"></a>
<FONT color="green">121</FONT>         * @throws IllegalArgumentException if the precondition is not met<a name="line.121"></a>
<FONT color="green">122</FONT>         * @throws MathException if an error occurs computing the p-value<a name="line.122"></a>
<FONT color="green">123</FONT>         */<a name="line.123"></a>
<FONT color="green">124</FONT>        public double pairedTTest(double[] sample1, double[] sample2)<a name="line.124"></a>
<FONT color="green">125</FONT>            throws IllegalArgumentException, MathException {<a name="line.125"></a>
<FONT color="green">126</FONT>            double meanDifference = StatUtils.meanDifference(sample1, sample2);<a name="line.126"></a>
<FONT color="green">127</FONT>            return tTest(meanDifference, 0,<a name="line.127"></a>
<FONT color="green">128</FONT>                    StatUtils.varianceDifference(sample1, sample2, meanDifference),<a name="line.128"></a>
<FONT color="green">129</FONT>                    sample1.length);<a name="line.129"></a>
<FONT color="green">130</FONT>        }<a name="line.130"></a>
<FONT color="green">131</FONT>    <a name="line.131"></a>
<FONT color="green">132</FONT>         /**<a name="line.132"></a>
<FONT color="green">133</FONT>         * Performs a paired t-test evaluating the null hypothesis that the<a name="line.133"></a>
<FONT color="green">134</FONT>         * mean of the paired differences between &lt;code&gt;sample1&lt;/code&gt; and<a name="line.134"></a>
<FONT color="green">135</FONT>         * &lt;code&gt;sample2&lt;/code&gt; is 0 in favor of the two-sided alternative that the<a name="line.135"></a>
<FONT color="green">136</FONT>         * mean paired difference is not equal to 0, with significance level<a name="line.136"></a>
<FONT color="green">137</FONT>         * &lt;code&gt;alpha&lt;/code&gt;.<a name="line.137"></a>
<FONT color="green">138</FONT>         * &lt;p&gt;<a name="line.138"></a>
<FONT color="green">139</FONT>         * Returns &lt;code&gt;true&lt;/code&gt; iff the null hypothesis can be rejected with<a name="line.139"></a>
<FONT color="green">140</FONT>         * confidence &lt;code&gt;1 - alpha&lt;/code&gt;.  To perform a 1-sided test, use<a name="line.140"></a>
<FONT color="green">141</FONT>         * &lt;code&gt;alpha * 2&lt;/code&gt;&lt;/p&gt;<a name="line.141"></a>
<FONT color="green">142</FONT>         * &lt;p&gt;<a name="line.142"></a>
<FONT color="green">143</FONT>         * &lt;strong&gt;Usage Note:&lt;/strong&gt;&lt;br&gt;<a name="line.143"></a>
<FONT color="green">144</FONT>         * The validity of the test depends on the assumptions of the parametric<a name="line.144"></a>
<FONT color="green">145</FONT>         * t-test procedure, as discussed<a name="line.145"></a>
<FONT color="green">146</FONT>         * &lt;a href="http://www.basic.nwu.edu/statguidefiles/ttest_unpaired_ass_viol.html"&gt;<a name="line.146"></a>
<FONT color="green">147</FONT>         * here&lt;/a&gt;&lt;/p&gt;<a name="line.147"></a>
<FONT color="green">148</FONT>         * &lt;p&gt;<a name="line.148"></a>
<FONT color="green">149</FONT>         * &lt;strong&gt;Preconditions&lt;/strong&gt;: &lt;ul&gt;<a name="line.149"></a>
<FONT color="green">150</FONT>         * &lt;li&gt;The input array lengths must be the same and their common length<a name="line.150"></a>
<FONT color="green">151</FONT>         * must be at least 2.<a name="line.151"></a>
<FONT color="green">152</FONT>         * &lt;/li&gt;<a name="line.152"></a>
<FONT color="green">153</FONT>         * &lt;li&gt; &lt;code&gt; 0 &lt; alpha &lt; 0.5 &lt;/code&gt;<a name="line.153"></a>
<FONT color="green">154</FONT>         * &lt;/li&gt;&lt;/ul&gt;&lt;/p&gt;<a name="line.154"></a>
<FONT color="green">155</FONT>         *<a name="line.155"></a>
<FONT color="green">156</FONT>         * @param sample1 array of sample data values<a name="line.156"></a>
<FONT color="green">157</FONT>         * @param sample2 array of sample data values<a name="line.157"></a>
<FONT color="green">158</FONT>         * @param alpha significance level of the test<a name="line.158"></a>
<FONT color="green">159</FONT>         * @return true if the null hypothesis can be rejected with<a name="line.159"></a>
<FONT color="green">160</FONT>         * confidence 1 - alpha<a name="line.160"></a>
<FONT color="green">161</FONT>         * @throws IllegalArgumentException if the preconditions are not met<a name="line.161"></a>
<FONT color="green">162</FONT>         * @throws MathException if an error occurs performing the test<a name="line.162"></a>
<FONT color="green">163</FONT>         */<a name="line.163"></a>
<FONT color="green">164</FONT>        public boolean pairedTTest(double[] sample1, double[] sample2, double alpha)<a name="line.164"></a>
<FONT color="green">165</FONT>            throws IllegalArgumentException, MathException {<a name="line.165"></a>
<FONT color="green">166</FONT>            checkSignificanceLevel(alpha);<a name="line.166"></a>
<FONT color="green">167</FONT>            return pairedTTest(sample1, sample2) &lt; alpha;<a name="line.167"></a>
<FONT color="green">168</FONT>        }<a name="line.168"></a>
<FONT color="green">169</FONT>    <a name="line.169"></a>
<FONT color="green">170</FONT>        /**<a name="line.170"></a>
<FONT color="green">171</FONT>         * Computes a &lt;a href="http://www.itl.nist.gov/div898/handbook/prc/section2/prc22.htm#formula"&gt;<a name="line.171"></a>
<FONT color="green">172</FONT>         * t statistic &lt;/a&gt; given observed values and a comparison constant.<a name="line.172"></a>
<FONT color="green">173</FONT>         * &lt;p&gt;<a name="line.173"></a>
<FONT color="green">174</FONT>         * This statistic can be used to perform a one sample t-test for the mean.<a name="line.174"></a>
<FONT color="green">175</FONT>         * &lt;/p&gt;&lt;p&gt;<a name="line.175"></a>
<FONT color="green">176</FONT>         * &lt;strong&gt;Preconditions&lt;/strong&gt;: &lt;ul&gt;<a name="line.176"></a>
<FONT color="green">177</FONT>         * &lt;li&gt;The observed array length must be at least 2.<a name="line.177"></a>
<FONT color="green">178</FONT>         * &lt;/li&gt;&lt;/ul&gt;&lt;/p&gt;<a name="line.178"></a>
<FONT color="green">179</FONT>         *<a name="line.179"></a>
<FONT color="green">180</FONT>         * @param mu comparison constant<a name="line.180"></a>
<FONT color="green">181</FONT>         * @param observed array of values<a name="line.181"></a>
<FONT color="green">182</FONT>         * @return t statistic<a name="line.182"></a>
<FONT color="green">183</FONT>         * @throws IllegalArgumentException if input array length is less than 2<a name="line.183"></a>
<FONT color="green">184</FONT>         */<a name="line.184"></a>
<FONT color="green">185</FONT>        public double t(double mu, double[] observed)<a name="line.185"></a>
<FONT color="green">186</FONT>        throws IllegalArgumentException {<a name="line.186"></a>
<FONT color="green">187</FONT>            checkSampleData(observed);<a name="line.187"></a>
<FONT color="green">188</FONT>            return t(StatUtils.mean(observed), mu, StatUtils.variance(observed),<a name="line.188"></a>
<FONT color="green">189</FONT>                    observed.length);<a name="line.189"></a>
<FONT color="green">190</FONT>        }<a name="line.190"></a>
<FONT color="green">191</FONT>    <a name="line.191"></a>
<FONT color="green">192</FONT>        /**<a name="line.192"></a>
<FONT color="green">193</FONT>         * Computes a &lt;a href="http://www.itl.nist.gov/div898/handbook/prc/section2/prc22.htm#formula"&gt;<a name="line.193"></a>
<FONT color="green">194</FONT>         * t statistic &lt;/a&gt; to use in comparing the mean of the dataset described by<a name="line.194"></a>
<FONT color="green">195</FONT>         * &lt;code&gt;sampleStats&lt;/code&gt; to &lt;code&gt;mu&lt;/code&gt;.<a name="line.195"></a>
<FONT color="green">196</FONT>         * &lt;p&gt;<a name="line.196"></a>
<FONT color="green">197</FONT>         * This statistic can be used to perform a one sample t-test for the mean.<a name="line.197"></a>
<FONT color="green">198</FONT>         * &lt;/p&gt;&lt;p&gt;<a name="line.198"></a>
<FONT color="green">199</FONT>         * &lt;strong&gt;Preconditions&lt;/strong&gt;: &lt;ul&gt;<a name="line.199"></a>
<FONT color="green">200</FONT>         * &lt;li&gt;&lt;code&gt;observed.getN() &gt; = 2&lt;/code&gt;.<a name="line.200"></a>
<FONT color="green">201</FONT>         * &lt;/li&gt;&lt;/ul&gt;&lt;/p&gt;<a name="line.201"></a>
<FONT color="green">202</FONT>         *<a name="line.202"></a>
<FONT color="green">203</FONT>         * @param mu comparison constant<a name="line.203"></a>
<FONT color="green">204</FONT>         * @param sampleStats DescriptiveStatistics holding sample summary statitstics<a name="line.204"></a>
<FONT color="green">205</FONT>         * @return t statistic<a name="line.205"></a>
<FONT color="green">206</FONT>         * @throws IllegalArgumentException if the precondition is not met<a name="line.206"></a>
<FONT color="green">207</FONT>         */<a name="line.207"></a>
<FONT color="green">208</FONT>        public double t(double mu, StatisticalSummary sampleStats)<a name="line.208"></a>
<FONT color="green">209</FONT>        throws IllegalArgumentException {<a name="line.209"></a>
<FONT color="green">210</FONT>            checkSampleData(sampleStats);<a name="line.210"></a>
<FONT color="green">211</FONT>            return t(sampleStats.getMean(), mu, sampleStats.getVariance(),<a name="line.211"></a>
<FONT color="green">212</FONT>                    sampleStats.getN());<a name="line.212"></a>
<FONT color="green">213</FONT>        }<a name="line.213"></a>
<FONT color="green">214</FONT>    <a name="line.214"></a>
<FONT color="green">215</FONT>        /**<a name="line.215"></a>
<FONT color="green">216</FONT>         * Computes a 2-sample t statistic,  under the hypothesis of equal<a name="line.216"></a>
<FONT color="green">217</FONT>         * subpopulation variances.  To compute a t-statistic without the<a name="line.217"></a>
<FONT color="green">218</FONT>         * equal variances hypothesis, use {@link #t(double[], double[])}.<a name="line.218"></a>
<FONT color="green">219</FONT>         * &lt;p&gt;<a name="line.219"></a>
<FONT color="green">220</FONT>         * This statistic can be used to perform a (homoscedastic) two-sample<a name="line.220"></a>
<FONT color="green">221</FONT>         * t-test to compare sample means.&lt;/p&gt;<a name="line.221"></a>
<FONT color="green">222</FONT>         * &lt;p&gt;<a name="line.222"></a>
<FONT color="green">223</FONT>         * The t-statisitc is&lt;/p&gt;<a name="line.223"></a>
<FONT color="green">224</FONT>         * &lt;p&gt;<a name="line.224"></a>
<FONT color="green">225</FONT>         * &amp;nbsp;&amp;nbsp;&lt;code&gt;  t = (m1 - m2) / (sqrt(1/n1 +1/n2) sqrt(var))&lt;/code&gt;<a name="line.225"></a>
<FONT color="green">226</FONT>         * &lt;/p&gt;&lt;p&gt;<a name="line.226"></a>
<FONT color="green">227</FONT>         * where &lt;strong&gt;&lt;code&gt;n1&lt;/code&gt;&lt;/strong&gt; is the size of first sample;<a name="line.227"></a>
<FONT color="green">228</FONT>         * &lt;strong&gt;&lt;code&gt; n2&lt;/code&gt;&lt;/strong&gt; is the size of second sample;<a name="line.228"></a>
<FONT color="green">229</FONT>         * &lt;strong&gt;&lt;code&gt; m1&lt;/code&gt;&lt;/strong&gt; is the mean of first sample;<a name="line.229"></a>
<FONT color="green">230</FONT>         * &lt;strong&gt;&lt;code&gt; m2&lt;/code&gt;&lt;/strong&gt; is the mean of second sample&lt;/li&gt;<a name="line.230"></a>
<FONT color="green">231</FONT>         * &lt;/ul&gt;<a name="line.231"></a>
<FONT color="green">232</FONT>         * and &lt;strong&gt;&lt;code&gt;var&lt;/code&gt;&lt;/strong&gt; is the pooled variance estimate:<a name="line.232"></a>
<FONT color="green">233</FONT>         * &lt;/p&gt;&lt;p&gt;<a name="line.233"></a>
<FONT color="green">234</FONT>         * &lt;code&gt;var = sqrt(((n1 - 1)var1 + (n2 - 1)var2) / ((n1-1) + (n2-1)))&lt;/code&gt;<a name="line.234"></a>
<FONT color="green">235</FONT>         * &lt;/p&gt;&lt;p&gt;<a name="line.235"></a>
<FONT color="green">236</FONT>         * with &lt;strong&gt;&lt;code&gt;var1&lt;code&gt;&lt;/strong&gt; the variance of the first sample and<a name="line.236"></a>
<FONT color="green">237</FONT>         * &lt;strong&gt;&lt;code&gt;var2&lt;/code&gt;&lt;/strong&gt; the variance of the second sample.<a name="line.237"></a>
<FONT color="green">238</FONT>         * &lt;/p&gt;&lt;p&gt;<a name="line.238"></a>
<FONT color="green">239</FONT>         * &lt;strong&gt;Preconditions&lt;/strong&gt;: &lt;ul&gt;<a name="line.239"></a>
<FONT color="green">240</FONT>         * &lt;li&gt;The observed array lengths must both be at least 2.<a name="line.240"></a>
<FONT color="green">241</FONT>         * &lt;/li&gt;&lt;/ul&gt;&lt;/p&gt;<a name="line.241"></a>
<FONT color="green">242</FONT>         *<a name="line.242"></a>
<FONT color="green">243</FONT>         * @param sample1 array of sample data values<a name="line.243"></a>
<FONT color="green">244</FONT>         * @param sample2 array of sample data values<a name="line.244"></a>
<FONT color="green">245</FONT>         * @return t statistic<a name="line.245"></a>
<FONT color="green">246</FONT>         * @throws IllegalArgumentException if the precondition is not met<a name="line.246"></a>
<FONT color="green">247</FONT>         */<a name="line.247"></a>
<FONT color="green">248</FONT>        public double homoscedasticT(double[] sample1, double[] sample2)<a name="line.248"></a>
<FONT color="green">249</FONT>        throws IllegalArgumentException {<a name="line.249"></a>
<FONT color="green">250</FONT>            checkSampleData(sample1);<a name="line.250"></a>
<FONT color="green">251</FONT>            checkSampleData(sample2);<a name="line.251"></a>
<FONT color="green">252</FONT>            return homoscedasticT(StatUtils.mean(sample1), StatUtils.mean(sample2),<a name="line.252"></a>
<FONT color="green">253</FONT>                    StatUtils.variance(sample1), StatUtils.variance(sample2),<a name="line.253"></a>
<FONT color="green">254</FONT>                    sample1.length, sample2.length);<a name="line.254"></a>
<FONT color="green">255</FONT>        }<a name="line.255"></a>
<FONT color="green">256</FONT>    <a name="line.256"></a>
<FONT color="green">257</FONT>        /**<a name="line.257"></a>
<FONT color="green">258</FONT>         * Computes a 2-sample t statistic, without the hypothesis of equal<a name="line.258"></a>
<FONT color="green">259</FONT>         * subpopulation variances.  To compute a t-statistic assuming equal<a name="line.259"></a>
<FONT color="green">260</FONT>         * variances, use {@link #homoscedasticT(double[], double[])}.<a name="line.260"></a>
<FONT color="green">261</FONT>         * &lt;p&gt;<a name="line.261"></a>
<FONT color="green">262</FONT>         * This statistic can be used to perform a two-sample t-test to compare<a name="line.262"></a>
<FONT color="green">263</FONT>         * sample means.&lt;/p&gt;<a name="line.263"></a>
<FONT color="green">264</FONT>         * &lt;p&gt;<a name="line.264"></a>
<FONT color="green">265</FONT>         * The t-statisitc is&lt;/p&gt;<a name="line.265"></a>
<FONT color="green">266</FONT>         * &lt;p&gt;<a name="line.266"></a>
<FONT color="green">267</FONT>         * &amp;nbsp;&amp;nbsp; &lt;code&gt;  t = (m1 - m2) / sqrt(var1/n1 + var2/n2)&lt;/code&gt;<a name="line.267"></a>
<FONT color="green">268</FONT>         * &lt;/p&gt;&lt;p&gt;<a name="line.268"></a>
<FONT color="green">269</FONT>         *  where &lt;strong&gt;&lt;code&gt;n1&lt;/code&gt;&lt;/strong&gt; is the size of the first sample<a name="line.269"></a>
<FONT color="green">270</FONT>         * &lt;strong&gt;&lt;code&gt; n2&lt;/code&gt;&lt;/strong&gt; is the size of the second sample;<a name="line.270"></a>
<FONT color="green">271</FONT>         * &lt;strong&gt;&lt;code&gt; m1&lt;/code&gt;&lt;/strong&gt; is the mean of the first sample;<a name="line.271"></a>
<FONT color="green">272</FONT>         * &lt;strong&gt;&lt;code&gt; m2&lt;/code&gt;&lt;/strong&gt; is the mean of the second sample;<a name="line.272"></a>
<FONT color="green">273</FONT>         * &lt;strong&gt;&lt;code&gt; var1&lt;/code&gt;&lt;/strong&gt; is the variance of the first sample;<a name="line.273"></a>
<FONT color="green">274</FONT>         * &lt;strong&gt;&lt;code&gt; var2&lt;/code&gt;&lt;/strong&gt; is the variance of the second sample;<a name="line.274"></a>
<FONT color="green">275</FONT>         * &lt;/p&gt;&lt;p&gt;<a name="line.275"></a>
<FONT color="green">276</FONT>         * &lt;strong&gt;Preconditions&lt;/strong&gt;: &lt;ul&gt;<a name="line.276"></a>
<FONT color="green">277</FONT>         * &lt;li&gt;The observed array lengths must both be at least 2.<a name="line.277"></a>
<FONT color="green">278</FONT>         * &lt;/li&gt;&lt;/ul&gt;&lt;/p&gt;<a name="line.278"></a>
<FONT color="green">279</FONT>         *<a name="line.279"></a>
<FONT color="green">280</FONT>         * @param sample1 array of sample data values<a name="line.280"></a>
<FONT color="green">281</FONT>         * @param sample2 array of sample data values<a name="line.281"></a>
<FONT color="green">282</FONT>         * @return t statistic<a name="line.282"></a>
<FONT color="green">283</FONT>         * @throws IllegalArgumentException if the precondition is not met<a name="line.283"></a>
<FONT color="green">284</FONT>         */<a name="line.284"></a>
<FONT color="green">285</FONT>        public double t(double[] sample1, double[] sample2)<a name="line.285"></a>
<FONT color="green">286</FONT>        throws IllegalArgumentException {<a name="line.286"></a>
<FONT color="green">287</FONT>            checkSampleData(sample1);<a name="line.287"></a>
<FONT color="green">288</FONT>            checkSampleData(sample2);<a name="line.288"></a>
<FONT color="green">289</FONT>            return t(StatUtils.mean(sample1), StatUtils.mean(sample2),<a name="line.289"></a>
<FONT color="green">290</FONT>                    StatUtils.variance(sample1), StatUtils.variance(sample2),<a name="line.290"></a>
<FONT color="green">291</FONT>                    sample1.length, sample2.length);<a name="line.291"></a>
<FONT color="green">292</FONT>        }<a name="line.292"></a>
<FONT color="green">293</FONT>    <a name="line.293"></a>
<FONT color="green">294</FONT>        /**<a name="line.294"></a>
<FONT color="green">295</FONT>         * Computes a 2-sample t statistic &lt;/a&gt;, comparing the means of the datasets<a name="line.295"></a>
<FONT color="green">296</FONT>         * described by two {@link StatisticalSummary} instances, without the<a name="line.296"></a>
<FONT color="green">297</FONT>         * assumption of equal subpopulation variances.  Use<a name="line.297"></a>
<FONT color="green">298</FONT>         * {@link #homoscedasticT(StatisticalSummary, StatisticalSummary)} to<a name="line.298"></a>
<FONT color="green">299</FONT>         * compute a t-statistic under the equal variances assumption.<a name="line.299"></a>
<FONT color="green">300</FONT>         * &lt;p&gt;<a name="line.300"></a>
<FONT color="green">301</FONT>         * This statistic can be used to perform a two-sample t-test to compare<a name="line.301"></a>
<FONT color="green">302</FONT>         * sample means.&lt;/p&gt;<a name="line.302"></a>
<FONT color="green">303</FONT>         * &lt;p&gt;<a name="line.303"></a>
<FONT color="green">304</FONT>          * The returned  t-statisitc is&lt;/p&gt;<a name="line.304"></a>
<FONT color="green">305</FONT>         * &lt;p&gt;<a name="line.305"></a>
<FONT color="green">306</FONT>         * &amp;nbsp;&amp;nbsp; &lt;code&gt;  t = (m1 - m2) / sqrt(var1/n1 + var2/n2)&lt;/code&gt;<a name="line.306"></a>
<FONT color="green">307</FONT>         * &lt;/p&gt;&lt;p&gt;<a name="line.307"></a>
<FONT color="green">308</FONT>         * where &lt;strong&gt;&lt;code&gt;n1&lt;/code&gt;&lt;/strong&gt; is the size of the first sample;<a name="line.308"></a>
<FONT color="green">309</FONT>         * &lt;strong&gt;&lt;code&gt; n2&lt;/code&gt;&lt;/strong&gt; is the size of the second sample;<a name="line.309"></a>
<FONT color="green">310</FONT>         * &lt;strong&gt;&lt;code&gt; m1&lt;/code&gt;&lt;/strong&gt; is the mean of the first sample;<a name="line.310"></a>
<FONT color="green">311</FONT>         * &lt;strong&gt;&lt;code&gt; m2&lt;/code&gt;&lt;/strong&gt; is the mean of the second sample<a name="line.311"></a>
<FONT color="green">312</FONT>         * &lt;strong&gt;&lt;code&gt; var1&lt;/code&gt;&lt;/strong&gt; is the variance of the first sample;<a name="line.312"></a>
<FONT color="green">313</FONT>         * &lt;strong&gt;&lt;code&gt; var2&lt;/code&gt;&lt;/strong&gt; is the variance of the second sample<a name="line.313"></a>
<FONT color="green">314</FONT>         * &lt;/p&gt;&lt;p&gt;<a name="line.314"></a>
<FONT color="green">315</FONT>         * &lt;strong&gt;Preconditions&lt;/strong&gt;: &lt;ul&gt;<a name="line.315"></a>
<FONT color="green">316</FONT>         * &lt;li&gt;The datasets described by the two Univariates must each contain<a name="line.316"></a>
<FONT color="green">317</FONT>         * at least 2 observations.<a name="line.317"></a>
<FONT color="green">318</FONT>         * &lt;/li&gt;&lt;/ul&gt;&lt;/p&gt;<a name="line.318"></a>
<FONT color="green">319</FONT>         *<a name="line.319"></a>
<FONT color="green">320</FONT>         * @param sampleStats1 StatisticalSummary describing data from the first sample<a name="line.320"></a>
<FONT color="green">321</FONT>         * @param sampleStats2 StatisticalSummary describing data from the second sample<a name="line.321"></a>
<FONT color="green">322</FONT>         * @return t statistic<a name="line.322"></a>
<FONT color="green">323</FONT>         * @throws IllegalArgumentException if the precondition is not met<a name="line.323"></a>
<FONT color="green">324</FONT>         */<a name="line.324"></a>
<FONT color="green">325</FONT>        public double t(StatisticalSummary sampleStats1,<a name="line.325"></a>
<FONT color="green">326</FONT>                        StatisticalSummary sampleStats2)<a name="line.326"></a>
<FONT color="green">327</FONT>        throws IllegalArgumentException {<a name="line.327"></a>
<FONT color="green">328</FONT>            checkSampleData(sampleStats1);<a name="line.328"></a>
<FONT color="green">329</FONT>            checkSampleData(sampleStats2);<a name="line.329"></a>
<FONT color="green">330</FONT>            return t(sampleStats1.getMean(), sampleStats2.getMean(),<a name="line.330"></a>
<FONT color="green">331</FONT>                    sampleStats1.getVariance(), sampleStats2.getVariance(),<a name="line.331"></a>
<FONT color="green">332</FONT>                    sampleStats1.getN(), sampleStats2.getN());<a name="line.332"></a>
<FONT color="green">333</FONT>        }<a name="line.333"></a>
<FONT color="green">334</FONT>    <a name="line.334"></a>
<FONT color="green">335</FONT>        /**<a name="line.335"></a>
<FONT color="green">336</FONT>         * Computes a 2-sample t statistic, comparing the means of the datasets<a name="line.336"></a>
<FONT color="green">337</FONT>         * described by two {@link StatisticalSummary} instances, under the<a name="line.337"></a>
<FONT color="green">338</FONT>         * assumption of equal subpopulation variances.  To compute a t-statistic<a name="line.338"></a>
<FONT color="green">339</FONT>         * without the equal variances assumption, use<a name="line.339"></a>
<FONT color="green">340</FONT>         * {@link #t(StatisticalSummary, StatisticalSummary)}.<a name="line.340"></a>
<FONT color="green">341</FONT>         * &lt;p&gt;<a name="line.341"></a>
<FONT color="green">342</FONT>         * This statistic can be used to perform a (homoscedastic) two-sample<a name="line.342"></a>
<FONT color="green">343</FONT>         * t-test to compare sample means.&lt;/p&gt;<a name="line.343"></a>
<FONT color="green">344</FONT>         * &lt;p&gt;<a name="line.344"></a>
<FONT color="green">345</FONT>         * The t-statisitc returned is&lt;/p&gt;<a name="line.345"></a>
<FONT color="green">346</FONT>         * &lt;p&gt;<a name="line.346"></a>
<FONT color="green">347</FONT>         * &amp;nbsp;&amp;nbsp;&lt;code&gt;  t = (m1 - m2) / (sqrt(1/n1 +1/n2) sqrt(var))&lt;/code&gt;<a name="line.347"></a>
<FONT color="green">348</FONT>         * &lt;/p&gt;&lt;p&gt;<a name="line.348"></a>
<FONT color="green">349</FONT>         * where &lt;strong&gt;&lt;code&gt;n1&lt;/code&gt;&lt;/strong&gt; is the size of first sample;<a name="line.349"></a>
<FONT color="green">350</FONT>         * &lt;strong&gt;&lt;code&gt; n2&lt;/code&gt;&lt;/strong&gt; is the size of second sample;<a name="line.350"></a>
<FONT color="green">351</FONT>         * &lt;strong&gt;&lt;code&gt; m1&lt;/code&gt;&lt;/strong&gt; is the mean of first sample;<a name="line.351"></a>
<FONT color="green">352</FONT>         * &lt;strong&gt;&lt;code&gt; m2&lt;/code&gt;&lt;/strong&gt; is the mean of second sample<a name="line.352"></a>
<FONT color="green">353</FONT>         * and &lt;strong&gt;&lt;code&gt;var&lt;/code&gt;&lt;/strong&gt; is the pooled variance estimate:<a name="line.353"></a>
<FONT color="green">354</FONT>         * &lt;/p&gt;&lt;p&gt;<a name="line.354"></a>
<FONT color="green">355</FONT>         * &lt;code&gt;var = sqrt(((n1 - 1)var1 + (n2 - 1)var2) / ((n1-1) + (n2-1)))&lt;/code&gt;<a name="line.355"></a>
<FONT color="green">356</FONT>         * &lt;p&gt;<a name="line.356"></a>
<FONT color="green">357</FONT>         * with &lt;strong&gt;&lt;code&gt;var1&lt;code&gt;&lt;/strong&gt; the variance of the first sample and<a name="line.357"></a>
<FONT color="green">358</FONT>         * &lt;strong&gt;&lt;code&gt;var2&lt;/code&gt;&lt;/strong&gt; the variance of the second sample.<a name="line.358"></a>
<FONT color="green">359</FONT>         * &lt;/p&gt;&lt;p&gt;<a name="line.359"></a>
<FONT color="green">360</FONT>         * &lt;strong&gt;Preconditions&lt;/strong&gt;: &lt;ul&gt;<a name="line.360"></a>
<FONT color="green">361</FONT>         * &lt;li&gt;The datasets described by the two Univariates must each contain<a name="line.361"></a>
<FONT color="green">362</FONT>         * at least 2 observations.<a name="line.362"></a>
<FONT color="green">363</FONT>         * &lt;/li&gt;&lt;/ul&gt;&lt;/p&gt;<a name="line.363"></a>
<FONT color="green">364</FONT>         *<a name="line.364"></a>
<FONT color="green">365</FONT>         * @param sampleStats1 StatisticalSummary describing data from the first sample<a name="line.365"></a>
<FONT color="green">366</FONT>         * @param sampleStats2 StatisticalSummary describing data from the second sample<a name="line.366"></a>
<FONT color="green">367</FONT>         * @return t statistic<a name="line.367"></a>
<FONT color="green">368</FONT>         * @throws IllegalArgumentException if the precondition is not met<a name="line.368"></a>
<FONT color="green">369</FONT>         */<a name="line.369"></a>
<FONT color="green">370</FONT>        public double homoscedasticT(StatisticalSummary sampleStats1,<a name="line.370"></a>
<FONT color="green">371</FONT>                StatisticalSummary sampleStats2)<a name="line.371"></a>
<FONT color="green">372</FONT>        throws IllegalArgumentException {<a name="line.372"></a>
<FONT color="green">373</FONT>            checkSampleData(sampleStats1);<a name="line.373"></a>
<FONT color="green">374</FONT>            checkSampleData(sampleStats2);<a name="line.374"></a>
<FONT color="green">375</FONT>            return homoscedasticT(sampleStats1.getMean(), sampleStats2.getMean(),<a name="line.375"></a>
<FONT color="green">376</FONT>                    sampleStats1.getVariance(), sampleStats2.getVariance(),<a name="line.376"></a>
<FONT color="green">377</FONT>                    sampleStats1.getN(), sampleStats2.getN());<a name="line.377"></a>
<FONT color="green">378</FONT>        }<a name="line.378"></a>
<FONT color="green">379</FONT>    <a name="line.379"></a>
<FONT color="green">380</FONT>         /**<a name="line.380"></a>
<FONT color="green">381</FONT>         * Returns the &lt;i&gt;observed significance level&lt;/i&gt;, or<a name="line.381"></a>
<FONT color="green">382</FONT>         * &lt;i&gt;p-value&lt;/i&gt;, associated with a one-sample, two-tailed t-test<a name="line.382"></a>
<FONT color="green">383</FONT>         * comparing the mean of the input array with the constant &lt;code&gt;mu&lt;/code&gt;.<a name="line.383"></a>
<FONT color="green">384</FONT>         * &lt;p&gt;<a name="line.384"></a>
<FONT color="green">385</FONT>         * The number returned is the smallest significance level<a name="line.385"></a>
<FONT color="green">386</FONT>         * at which one can reject the null hypothesis that the mean equals<a name="line.386"></a>
<FONT color="green">387</FONT>         * &lt;code&gt;mu&lt;/code&gt; in favor of the two-sided alternative that the mean<a name="line.387"></a>
<FONT color="green">388</FONT>         * is different from &lt;code&gt;mu&lt;/code&gt;. For a one-sided test, divide the<a name="line.388"></a>
<FONT color="green">389</FONT>         * returned value by 2.&lt;/p&gt;<a name="line.389"></a>
<FONT color="green">390</FONT>         * &lt;p&gt;<a name="line.390"></a>
<FONT color="green">391</FONT>         * &lt;strong&gt;Usage Note:&lt;/strong&gt;&lt;br&gt;<a name="line.391"></a>
<FONT color="green">392</FONT>         * The validity of the test depends on the assumptions of the parametric<a name="line.392"></a>
<FONT color="green">393</FONT>         * t-test procedure, as discussed<a name="line.393"></a>
<FONT color="green">394</FONT>         * &lt;a href="http://www.basic.nwu.edu/statguidefiles/ttest_unpaired_ass_viol.html"&gt;here&lt;/a&gt;<a name="line.394"></a>
<FONT color="green">395</FONT>         * &lt;/p&gt;&lt;p&gt;<a name="line.395"></a>
<FONT color="green">396</FONT>         * &lt;strong&gt;Preconditions&lt;/strong&gt;: &lt;ul&gt;<a name="line.396"></a>
<FONT color="green">397</FONT>         * &lt;li&gt;The observed array length must be at least 2.<a name="line.397"></a>
<FONT color="green">398</FONT>         * &lt;/li&gt;&lt;/ul&gt;&lt;/p&gt;<a name="line.398"></a>
<FONT color="green">399</FONT>         *<a name="line.399"></a>
<FONT color="green">400</FONT>         * @param mu constant value to compare sample mean against<a name="line.400"></a>
<FONT color="green">401</FONT>         * @param sample array of sample data values<a name="line.401"></a>
<FONT color="green">402</FONT>         * @return p-value<a name="line.402"></a>
<FONT color="green">403</FONT>         * @throws IllegalArgumentException if the precondition is not met<a name="line.403"></a>
<FONT color="green">404</FONT>         * @throws MathException if an error occurs computing the p-value<a name="line.404"></a>
<FONT color="green">405</FONT>         */<a name="line.405"></a>
<FONT color="green">406</FONT>        public double tTest(double mu, double[] sample)<a name="line.406"></a>
<FONT color="green">407</FONT>        throws IllegalArgumentException, MathException {<a name="line.407"></a>
<FONT color="green">408</FONT>            checkSampleData(sample);<a name="line.408"></a>
<FONT color="green">409</FONT>            return tTest( StatUtils.mean(sample), mu, StatUtils.variance(sample),<a name="line.409"></a>
<FONT color="green">410</FONT>                    sample.length);<a name="line.410"></a>
<FONT color="green">411</FONT>        }<a name="line.411"></a>
<FONT color="green">412</FONT>    <a name="line.412"></a>
<FONT color="green">413</FONT>        /**<a name="line.413"></a>
<FONT color="green">414</FONT>         * Performs a &lt;a href="http://www.itl.nist.gov/div898/handbook/eda/section3/eda353.htm"&gt;<a name="line.414"></a>
<FONT color="green">415</FONT>         * two-sided t-test&lt;/a&gt; evaluating the null hypothesis that the mean of the population from<a name="line.415"></a>
<FONT color="green">416</FONT>         * which &lt;code&gt;sample&lt;/code&gt; is drawn equals &lt;code&gt;mu&lt;/code&gt;.<a name="line.416"></a>
<FONT color="green">417</FONT>         * &lt;p&gt;<a name="line.417"></a>
<FONT color="green">418</FONT>         * Returns &lt;code&gt;true&lt;/code&gt; iff the null hypothesis can be<a name="line.418"></a>
<FONT color="green">419</FONT>         * rejected with confidence &lt;code&gt;1 - alpha&lt;/code&gt;.  To<a name="line.419"></a>
<FONT color="green">420</FONT>         * perform a 1-sided test, use &lt;code&gt;alpha * 2&lt;/code&gt;<a name="line.420"></a>
<FONT color="green">421</FONT>         * &lt;/p&gt;&lt;p&gt;<a name="line.421"></a>
<FONT color="green">422</FONT>         * &lt;strong&gt;Examples:&lt;/strong&gt;&lt;br&gt;&lt;ol&gt;<a name="line.422"></a>
<FONT color="green">423</FONT>         * &lt;li&gt;To test the (2-sided) hypothesis &lt;code&gt;sample mean = mu &lt;/code&gt; at<a name="line.423"></a>
<FONT color="green">424</FONT>         * the 95% level, use &lt;br&gt;&lt;code&gt;tTest(mu, sample, 0.05) &lt;/code&gt;<a name="line.424"></a>
<FONT color="green">425</FONT>         * &lt;/li&gt;<a name="line.425"></a>
<FONT color="green">426</FONT>         * &lt;li&gt;To test the (one-sided) hypothesis &lt;code&gt; sample mean &lt; mu &lt;/code&gt;<a name="line.426"></a>
<FONT color="green">427</FONT>         * at the 99% level, first verify that the measured sample mean is less<a name="line.427"></a>
<FONT color="green">428</FONT>         * than &lt;code&gt;mu&lt;/code&gt; and then use<a name="line.428"></a>
<FONT color="green">429</FONT>         * &lt;br&gt;&lt;code&gt;tTest(mu, sample, 0.02) &lt;/code&gt;<a name="line.429"></a>
<FONT color="green">430</FONT>         * &lt;/li&gt;&lt;/ol&gt;&lt;/p&gt;<a name="line.430"></a>
<FONT color="green">431</FONT>         * &lt;p&gt;<a name="line.431"></a>
<FONT color="green">432</FONT>         * &lt;strong&gt;Usage Note:&lt;/strong&gt;&lt;br&gt;<a name="line.432"></a>
<FONT color="green">433</FONT>         * The validity of the test depends on the assumptions of the one-sample<a name="line.433"></a>
<FONT color="green">434</FONT>         * parametric t-test procedure, as discussed<a name="line.434"></a>
<FONT color="green">435</FONT>         * &lt;a href="http://www.basic.nwu.edu/statguidefiles/sg_glos.html#one-sample"&gt;here&lt;/a&gt;<a name="line.435"></a>
<FONT color="green">436</FONT>         * &lt;/p&gt;&lt;p&gt;<a name="line.436"></a>
<FONT color="green">437</FONT>         * &lt;strong&gt;Preconditions&lt;/strong&gt;: &lt;ul&gt;<a name="line.437"></a>
<FONT color="green">438</FONT>         * &lt;li&gt;The observed array length must be at least 2.<a name="line.438"></a>
<FONT color="green">439</FONT>         * &lt;/li&gt;&lt;/ul&gt;&lt;/p&gt;<a name="line.439"></a>
<FONT color="green">440</FONT>         *<a name="line.440"></a>
<FONT color="green">441</FONT>         * @param mu constant value to compare sample mean against<a name="line.441"></a>
<FONT color="green">442</FONT>         * @param sample array of sample data values<a name="line.442"></a>
<FONT color="green">443</FONT>         * @param alpha significance level of the test<a name="line.443"></a>
<FONT color="green">444</FONT>         * @return p-value<a name="line.444"></a>
<FONT color="green">445</FONT>         * @throws IllegalArgumentException if the precondition is not met<a name="line.445"></a>
<FONT color="green">446</FONT>         * @throws MathException if an error computing the p-value<a name="line.446"></a>
<FONT color="green">447</FONT>         */<a name="line.447"></a>
<FONT color="green">448</FONT>        public boolean tTest(double mu, double[] sample, double alpha)<a name="line.448"></a>
<FONT color="green">449</FONT>        throws IllegalArgumentException, MathException {<a name="line.449"></a>
<FONT color="green">450</FONT>            checkSignificanceLevel(alpha);<a name="line.450"></a>
<FONT color="green">451</FONT>            return tTest(mu, sample) &lt; alpha;<a name="line.451"></a>
<FONT color="green">452</FONT>        }<a name="line.452"></a>
<FONT color="green">453</FONT>    <a name="line.453"></a>
<FONT color="green">454</FONT>        /**<a name="line.454"></a>
<FONT color="green">455</FONT>         * Returns the &lt;i&gt;observed significance level&lt;/i&gt;, or<a name="line.455"></a>
<FONT color="green">456</FONT>         * &lt;i&gt;p-value&lt;/i&gt;, associated with a one-sample, two-tailed t-test<a name="line.456"></a>
<FONT color="green">457</FONT>         * comparing the mean of the dataset described by &lt;code&gt;sampleStats&lt;/code&gt;<a name="line.457"></a>
<FONT color="green">458</FONT>         * with the constant &lt;code&gt;mu&lt;/code&gt;.<a name="line.458"></a>
<FONT color="green">459</FONT>         * &lt;p&gt;<a name="line.459"></a>
<FONT color="green">460</FONT>         * The number returned is the smallest significance level<a name="line.460"></a>
<FONT color="green">461</FONT>         * at which one can reject the null hypothesis that the mean equals<a name="line.461"></a>
<FONT color="green">462</FONT>         * &lt;code&gt;mu&lt;/code&gt; in favor of the two-sided alternative that the mean<a name="line.462"></a>
<FONT color="green">463</FONT>         * is different from &lt;code&gt;mu&lt;/code&gt;. For a one-sided test, divide the<a name="line.463"></a>
<FONT color="green">464</FONT>         * returned value by 2.&lt;/p&gt;<a name="line.464"></a>
<FONT color="green">465</FONT>         * &lt;p&gt;<a name="line.465"></a>
<FONT color="green">466</FONT>         * &lt;strong&gt;Usage Note:&lt;/strong&gt;&lt;br&gt;<a name="line.466"></a>
<FONT color="green">467</FONT>         * The validity of the test depends on the assumptions of the parametric<a name="line.467"></a>
<FONT color="green">468</FONT>         * t-test procedure, as discussed<a name="line.468"></a>
<FONT color="green">469</FONT>         * &lt;a href="http://www.basic.nwu.edu/statguidefiles/ttest_unpaired_ass_viol.html"&gt;<a name="line.469"></a>
<FONT color="green">470</FONT>         * here&lt;/a&gt;&lt;/p&gt;<a name="line.470"></a>
<FONT color="green">471</FONT>         * &lt;p&gt;<a name="line.471"></a>
<FONT color="green">472</FONT>         * &lt;strong&gt;Preconditions&lt;/strong&gt;: &lt;ul&gt;<a name="line.472"></a>
<FONT color="green">473</FONT>         * &lt;li&gt;The sample must contain at least 2 observations.<a name="line.473"></a>
<FONT color="green">474</FONT>         * &lt;/li&gt;&lt;/ul&gt;&lt;/p&gt;<a name="line.474"></a>
<FONT color="green">475</FONT>         *<a name="line.475"></a>
<FONT color="green">476</FONT>         * @param mu constant value to compare sample mean against<a name="line.476"></a>
<FONT color="green">477</FONT>         * @param sampleStats StatisticalSummary describing sample data<a name="line.477"></a>
<FONT color="green">478</FONT>         * @return p-value<a name="line.478"></a>
<FONT color="green">479</FONT>         * @throws IllegalArgumentException if the precondition is not met<a name="line.479"></a>
<FONT color="green">480</FONT>         * @throws MathException if an error occurs computing the p-value<a name="line.480"></a>
<FONT color="green">481</FONT>         */<a name="line.481"></a>
<FONT color="green">482</FONT>        public double tTest(double mu, StatisticalSummary sampleStats)<a name="line.482"></a>
<FONT color="green">483</FONT>        throws IllegalArgumentException, MathException {<a name="line.483"></a>
<FONT color="green">484</FONT>            checkSampleData(sampleStats);<a name="line.484"></a>
<FONT color="green">485</FONT>            return tTest(sampleStats.getMean(), mu, sampleStats.getVariance(),<a name="line.485"></a>
<FONT color="green">486</FONT>                    sampleStats.getN());<a name="line.486"></a>
<FONT color="green">487</FONT>        }<a name="line.487"></a>
<FONT color="green">488</FONT>    <a name="line.488"></a>
<FONT color="green">489</FONT>         /**<a name="line.489"></a>
<FONT color="green">490</FONT>         * Performs a &lt;a href="http://www.itl.nist.gov/div898/handbook/eda/section3/eda353.htm"&gt;<a name="line.490"></a>
<FONT color="green">491</FONT>         * two-sided t-test&lt;/a&gt; evaluating the null hypothesis that the mean of the<a name="line.491"></a>
<FONT color="green">492</FONT>         * population from which the dataset described by &lt;code&gt;stats&lt;/code&gt; is<a name="line.492"></a>
<FONT color="green">493</FONT>         * drawn equals &lt;code&gt;mu&lt;/code&gt;.<a name="line.493"></a>
<FONT color="green">494</FONT>         * &lt;p&gt;<a name="line.494"></a>
<FONT color="green">495</FONT>         * Returns &lt;code&gt;true&lt;/code&gt; iff the null hypothesis can be rejected with<a name="line.495"></a>
<FONT color="green">496</FONT>         * confidence &lt;code&gt;1 - alpha&lt;/code&gt;.  To  perform a 1-sided test, use<a name="line.496"></a>
<FONT color="green">497</FONT>         * &lt;code&gt;alpha * 2.&lt;/code&gt;&lt;/p&gt;<a name="line.497"></a>
<FONT color="green">498</FONT>         * &lt;p&gt;<a name="line.498"></a>
<FONT color="green">499</FONT>         * &lt;strong&gt;Examples:&lt;/strong&gt;&lt;br&gt;&lt;ol&gt;<a name="line.499"></a>
<FONT color="green">500</FONT>         * &lt;li&gt;To test the (2-sided) hypothesis &lt;code&gt;sample mean = mu &lt;/code&gt; at<a name="line.500"></a>
<FONT color="green">501</FONT>         * the 95% level, use &lt;br&gt;&lt;code&gt;tTest(mu, sampleStats, 0.05) &lt;/code&gt;<a name="line.501"></a>
<FONT color="green">502</FONT>         * &lt;/li&gt;<a name="line.502"></a>
<FONT color="green">503</FONT>         * &lt;li&gt;To test the (one-sided) hypothesis &lt;code&gt; sample mean &lt; mu &lt;/code&gt;<a name="line.503"></a>
<FONT color="green">504</FONT>         * at the 99% level, first verify that the measured sample mean is less<a name="line.504"></a>
<FONT color="green">505</FONT>         * than &lt;code&gt;mu&lt;/code&gt; and then use<a name="line.505"></a>
<FONT color="green">506</FONT>         * &lt;br&gt;&lt;code&gt;tTest(mu, sampleStats, 0.02) &lt;/code&gt;<a name="line.506"></a>
<FONT color="green">507</FONT>         * &lt;/li&gt;&lt;/ol&gt;&lt;/p&gt;<a name="line.507"></a>
<FONT color="green">508</FONT>         * &lt;p&gt;<a name="line.508"></a>
<FONT color="green">509</FONT>         * &lt;strong&gt;Usage Note:&lt;/strong&gt;&lt;br&gt;<a name="line.509"></a>
<FONT color="green">510</FONT>         * The validity of the test depends on the assumptions of the one-sample<a name="line.510"></a>
<FONT color="green">511</FONT>         * parametric t-test procedure, as discussed<a name="line.511"></a>
<FONT color="green">512</FONT>         * &lt;a href="http://www.basic.nwu.edu/statguidefiles/sg_glos.html#one-sample"&gt;here&lt;/a&gt;<a name="line.512"></a>
<FONT color="green">513</FONT>         * &lt;/p&gt;&lt;p&gt;<a name="line.513"></a>
<FONT color="green">514</FONT>         * &lt;strong&gt;Preconditions&lt;/strong&gt;: &lt;ul&gt;<a name="line.514"></a>
<FONT color="green">515</FONT>         * &lt;li&gt;The sample must include at least 2 observations.<a name="line.515"></a>
<FONT color="green">516</FONT>         * &lt;/li&gt;&lt;/ul&gt;&lt;/p&gt;<a name="line.516"></a>
<FONT color="green">517</FONT>         *<a name="line.517"></a>
<FONT color="green">518</FONT>         * @param mu constant value to compare sample mean against<a name="line.518"></a>
<FONT color="green">519</FONT>         * @param sampleStats StatisticalSummary describing sample data values<a name="line.519"></a>
<FONT color="green">520</FONT>         * @param alpha significance level of the test<a name="line.520"></a>
<FONT color="green">521</FONT>         * @return p-value<a name="line.521"></a>
<FONT color="green">522</FONT>         * @throws IllegalArgumentException if the precondition is not met<a name="line.522"></a>
<FONT color="green">523</FONT>         * @throws MathException if an error occurs computing the p-value<a name="line.523"></a>
<FONT color="green">524</FONT>         */<a name="line.524"></a>
<FONT color="green">525</FONT>        public boolean tTest( double mu, StatisticalSummary sampleStats,<a name="line.525"></a>
<FONT color="green">526</FONT>                double alpha)<a name="line.526"></a>
<FONT color="green">527</FONT>        throws IllegalArgumentException, MathException {<a name="line.527"></a>
<FONT color="green">528</FONT>            checkSignificanceLevel(alpha);<a name="line.528"></a>
<FONT color="green">529</FONT>            return tTest(mu, sampleStats) &lt; alpha;<a name="line.529"></a>
<FONT color="green">530</FONT>        }<a name="line.530"></a>
<FONT color="green">531</FONT>    <a name="line.531"></a>
<FONT color="green">532</FONT>        /**<a name="line.532"></a>
<FONT color="green">533</FONT>         * Returns the &lt;i&gt;observed significance level&lt;/i&gt;, or<a name="line.533"></a>
<FONT color="green">534</FONT>         * &lt;i&gt;p-value&lt;/i&gt;, associated with a two-sample, two-tailed t-test<a name="line.534"></a>
<FONT color="green">535</FONT>         * comparing the means of the input arrays.<a name="line.535"></a>
<FONT color="green">536</FONT>         * &lt;p&gt;<a name="line.536"></a>
<FONT color="green">537</FONT>         * The number returned is the smallest significance level<a name="line.537"></a>
<FONT color="green">538</FONT>         * at which one can reject the null hypothesis that the two means are<a name="line.538"></a>
<FONT color="green">539</FONT>         * equal in favor of the two-sided alternative that they are different.<a name="line.539"></a>
<FONT color="green">540</FONT>         * For a one-sided test, divide the returned value by 2.&lt;/p&gt;<a name="line.540"></a>
<FONT color="green">541</FONT>         * &lt;p&gt;<a name="line.541"></a>
<FONT color="green">542</FONT>         * The test does not assume that the underlying popuation variances are<a name="line.542"></a>
<FONT color="green">543</FONT>         * equal  and it uses approximated degrees of freedom computed from the<a name="line.543"></a>
<FONT color="green">544</FONT>         * sample data to compute the p-value.  The t-statistic used is as defined in<a name="line.544"></a>
<FONT color="green">545</FONT>         * {@link #t(double[], double[])} and the Welch-Satterthwaite approximation<a name="line.545"></a>
<FONT color="green">546</FONT>         * to the degrees of freedom is used,<a name="line.546"></a>
<FONT color="green">547</FONT>         * as described<a name="line.547"></a>
<FONT color="green">548</FONT>         * &lt;a href="http://www.itl.nist.gov/div898/handbook/prc/section3/prc31.htm"&gt;<a name="line.548"></a>
<FONT color="green">549</FONT>         * here.&lt;/a&gt;  To perform the test under the assumption of equal subpopulation<a name="line.549"></a>
<FONT color="green">550</FONT>         * variances, use {@link #homoscedasticTTest(double[], double[])}.&lt;/p&gt;<a name="line.550"></a>
<FONT color="green">551</FONT>         * &lt;p&gt;<a name="line.551"></a>
<FONT color="green">552</FONT>         * &lt;strong&gt;Usage Note:&lt;/strong&gt;&lt;br&gt;<a name="line.552"></a>
<FONT color="green">553</FONT>         * The validity of the p-value depends on the assumptions of the parametric<a name="line.553"></a>
<FONT color="green">554</FONT>         * t-test procedure, as discussed<a name="line.554"></a>
<FONT color="green">555</FONT>         * &lt;a href="http://www.basic.nwu.edu/statguidefiles/ttest_unpaired_ass_viol.html"&gt;<a name="line.555"></a>
<FONT color="green">556</FONT>         * here&lt;/a&gt;&lt;/p&gt;<a name="line.556"></a>
<FONT color="green">557</FONT>         * &lt;p&gt;<a name="line.557"></a>
<FONT color="green">558</FONT>         * &lt;strong&gt;Preconditions&lt;/strong&gt;: &lt;ul&gt;<a name="line.558"></a>
<FONT color="green">559</FONT>         * &lt;li&gt;The observed array lengths must both be at least 2.<a name="line.559"></a>
<FONT color="green">560</FONT>         * &lt;/li&gt;&lt;/ul&gt;&lt;/p&gt;<a name="line.560"></a>
<FONT color="green">561</FONT>         *<a name="line.561"></a>
<FONT color="green">562</FONT>         * @param sample1 array of sample data values<a name="line.562"></a>
<FONT color="green">563</FONT>         * @param sample2 array of sample data values<a name="line.563"></a>
<FONT color="green">564</FONT>         * @return p-value for t-test<a name="line.564"></a>
<FONT color="green">565</FONT>         * @throws IllegalArgumentException if the precondition is not met<a name="line.565"></a>
<FONT color="green">566</FONT>         * @throws MathException if an error occurs computing the p-value<a name="line.566"></a>
<FONT color="green">567</FONT>         */<a name="line.567"></a>
<FONT color="green">568</FONT>        public double tTest(double[] sample1, double[] sample2)<a name="line.568"></a>
<FONT color="green">569</FONT>        throws IllegalArgumentException, MathException {<a name="line.569"></a>
<FONT color="green">570</FONT>            checkSampleData(sample1);<a name="line.570"></a>
<FONT color="green">571</FONT>            checkSampleData(sample2);<a name="line.571"></a>
<FONT color="green">572</FONT>            return tTest(StatUtils.mean(sample1), StatUtils.mean(sample2),<a name="line.572"></a>
<FONT color="green">573</FONT>                    StatUtils.variance(sample1), StatUtils.variance(sample2),<a name="line.573"></a>
<FONT color="green">574</FONT>                    sample1.length, sample2.length);<a name="line.574"></a>
<FONT color="green">575</FONT>        }<a name="line.575"></a>
<FONT color="green">576</FONT>    <a name="line.576"></a>
<FONT color="green">577</FONT>        /**<a name="line.577"></a>
<FONT color="green">578</FONT>         * Returns the &lt;i&gt;observed significance level&lt;/i&gt;, or<a name="line.578"></a>
<FONT color="green">579</FONT>         * &lt;i&gt;p-value&lt;/i&gt;, associated with a two-sample, two-tailed t-test<a name="line.579"></a>
<FONT color="green">580</FONT>         * comparing the means of the input arrays, under the assumption that<a name="line.580"></a>
<FONT color="green">581</FONT>         * the two samples are drawn from subpopulations with equal variances.<a name="line.581"></a>
<FONT color="green">582</FONT>         * To perform the test without the equal variances assumption, use<a name="line.582"></a>
<FONT color="green">583</FONT>         * {@link #tTest(double[], double[])}.<a name="line.583"></a>
<FONT color="green">584</FONT>         * &lt;p&gt;<a name="line.584"></a>
<FONT color="green">585</FONT>         * The number returned is the smallest significance level<a name="line.585"></a>
<FONT color="green">586</FONT>         * at which one can reject the null hypothesis that the two means are<a name="line.586"></a>
<FONT color="green">587</FONT>         * equal in favor of the two-sided alternative that they are different.<a name="line.587"></a>
<FONT color="green">588</FONT>         * For a one-sided test, divide the returned value by 2.&lt;/p&gt;<a name="line.588"></a>
<FONT color="green">589</FONT>         * &lt;p&gt;<a name="line.589"></a>
<FONT color="green">590</FONT>         * A pooled variance estimate is used to compute the t-statistic.  See<a name="line.590"></a>
<FONT color="green">591</FONT>         * {@link #homoscedasticT(double[], double[])}. The sum of the sample sizes<a name="line.591"></a>
<FONT color="green">592</FONT>         * minus 2 is used as the degrees of freedom.&lt;/p&gt;<a name="line.592"></a>
<FONT color="green">593</FONT>         * &lt;p&gt;<a name="line.593"></a>
<FONT color="green">594</FONT>         * &lt;strong&gt;Usage Note:&lt;/strong&gt;&lt;br&gt;<a name="line.594"></a>
<FONT color="green">595</FONT>         * The validity of the p-value depends on the assumptions of the parametric<a name="line.595"></a>
<FONT color="green">596</FONT>         * t-test procedure, as discussed<a name="line.596"></a>
<FONT color="green">597</FONT>         * &lt;a href="http://www.basic.nwu.edu/statguidefiles/ttest_unpaired_ass_viol.html"&gt;<a name="line.597"></a>
<FONT color="green">598</FONT>         * here&lt;/a&gt;&lt;/p&gt;<a name="line.598"></a>
<FONT color="green">599</FONT>         * &lt;p&gt;<a name="line.599"></a>
<FONT color="green">600</FONT>         * &lt;strong&gt;Preconditions&lt;/strong&gt;: &lt;ul&gt;<a name="line.600"></a>
<FONT color="green">601</FONT>         * &lt;li&gt;The observed array lengths must both be at least 2.<a name="line.601"></a>
<FONT color="green">602</FONT>         * &lt;/li&gt;&lt;/ul&gt;&lt;/p&gt;<a name="line.602"></a>
<FONT color="green">603</FONT>         *<a name="line.603"></a>
<FONT color="green">604</FONT>         * @param sample1 array of sample data values<a name="line.604"></a>
<FONT color="green">605</FONT>         * @param sample2 array of sample data values<a name="line.605"></a>
<FONT color="green">606</FONT>         * @return p-value for t-test<a name="line.606"></a>
<FONT color="green">607</FONT>         * @throws IllegalArgumentException if the precondition is not met<a name="line.607"></a>
<FONT color="green">608</FONT>         * @throws MathException if an error occurs computing the p-value<a name="line.608"></a>
<FONT color="green">609</FONT>         */<a name="line.609"></a>
<FONT color="green">610</FONT>        public double homoscedasticTTest(double[] sample1, double[] sample2)<a name="line.610"></a>
<FONT color="green">611</FONT>        throws IllegalArgumentException, MathException {<a name="line.611"></a>
<FONT color="green">612</FONT>            checkSampleData(sample1);<a name="line.612"></a>
<FONT color="green">613</FONT>            checkSampleData(sample2);<a name="line.613"></a>
<FONT color="green">614</FONT>            return homoscedasticTTest(StatUtils.mean(sample1),<a name="line.614"></a>
<FONT color="green">615</FONT>                    StatUtils.mean(sample2), StatUtils.variance(sample1),<a name="line.615"></a>
<FONT color="green">616</FONT>                    StatUtils.variance(sample2), sample1.length,<a name="line.616"></a>
<FONT color="green">617</FONT>                    sample2.length);<a name="line.617"></a>
<FONT color="green">618</FONT>        }<a name="line.618"></a>
<FONT color="green">619</FONT>    <a name="line.619"></a>
<FONT color="green">620</FONT>    <a name="line.620"></a>
<FONT color="green">621</FONT>         /**<a name="line.621"></a>
<FONT color="green">622</FONT>         * Performs a<a name="line.622"></a>
<FONT color="green">623</FONT>         * &lt;a href="http://www.itl.nist.gov/div898/handbook/eda/section3/eda353.htm"&gt;<a name="line.623"></a>
<FONT color="green">624</FONT>         * two-sided t-test&lt;/a&gt; evaluating the null hypothesis that &lt;code&gt;sample1&lt;/code&gt;<a name="line.624"></a>
<FONT color="green">625</FONT>         * and &lt;code&gt;sample2&lt;/code&gt; are drawn from populations with the same mean,<a name="line.625"></a>
<FONT color="green">626</FONT>         * with significance level &lt;code&gt;alpha&lt;/code&gt;.  This test does not assume<a name="line.626"></a>
<FONT color="green">627</FONT>         * that the subpopulation variances are equal.  To perform the test assuming<a name="line.627"></a>
<FONT color="green">628</FONT>         * equal variances, use<a name="line.628"></a>
<FONT color="green">629</FONT>         * {@link #homoscedasticTTest(double[], double[], double)}.<a name="line.629"></a>
<FONT color="green">630</FONT>         * &lt;p&gt;<a name="line.630"></a>
<FONT color="green">631</FONT>         * Returns &lt;code&gt;true&lt;/code&gt; iff the null hypothesis that the means are<a name="line.631"></a>
<FONT color="green">632</FONT>         * equal can be rejected with confidence &lt;code&gt;1 - alpha&lt;/code&gt;.  To<a name="line.632"></a>
<FONT color="green">633</FONT>         * perform a 1-sided test, use &lt;code&gt;alpha / 2&lt;/code&gt;&lt;/p&gt;<a name="line.633"></a>
<FONT color="green">634</FONT>         * &lt;p&gt;<a name="line.634"></a>
<FONT color="green">635</FONT>         * See {@link #t(double[], double[])} for the formula used to compute the<a name="line.635"></a>
<FONT color="green">636</FONT>         * t-statistic.  Degrees of freedom are approximated using the<a name="line.636"></a>
<FONT color="green">637</FONT>         * &lt;a href="http://www.itl.nist.gov/div898/handbook/prc/section3/prc31.htm"&gt;<a name="line.637"></a>
<FONT color="green">638</FONT>         * Welch-Satterthwaite approximation.&lt;/a&gt;&lt;/p&gt;<a name="line.638"></a>
<FONT color="green">639</FONT>    <a name="line.639"></a>
<FONT color="green">640</FONT>         * &lt;p&gt;<a name="line.640"></a>
<FONT color="green">641</FONT>         * &lt;strong&gt;Examples:&lt;/strong&gt;&lt;br&gt;&lt;ol&gt;<a name="line.641"></a>
<FONT color="green">642</FONT>         * &lt;li&gt;To test the (2-sided) hypothesis &lt;code&gt;mean 1 = mean 2 &lt;/code&gt; at<a name="line.642"></a>
<FONT color="green">643</FONT>         * the 95% level,  use<a name="line.643"></a>
<FONT color="green">644</FONT>         * &lt;br&gt;&lt;code&gt;tTest(sample1, sample2, 0.05). &lt;/code&gt;<a name="line.644"></a>
<FONT color="green">645</FONT>         * &lt;/li&gt;<a name="line.645"></a>
<FONT color="green">646</FONT>         * &lt;li&gt;To test the (one-sided) hypothesis &lt;code&gt; mean 1 &lt; mean 2 &lt;/code&gt; at<a name="line.646"></a>
<FONT color="green">647</FONT>         * the 99% level, first verify that the measured  mean of &lt;code&gt;sample 1&lt;/code&gt;<a name="line.647"></a>
<FONT color="green">648</FONT>         * is less than the mean of &lt;code&gt;sample 2&lt;/code&gt; and then use<a name="line.648"></a>
<FONT color="green">649</FONT>         * &lt;br&gt;&lt;code&gt;tTest(sample1, sample2, 0.02) &lt;/code&gt;<a name="line.649"></a>
<FONT color="green">650</FONT>         * &lt;/li&gt;&lt;/ol&gt;&lt;/p&gt;<a name="line.650"></a>
<FONT color="green">651</FONT>         * &lt;p&gt;<a name="line.651"></a>
<FONT color="green">652</FONT>         * &lt;strong&gt;Usage Note:&lt;/strong&gt;&lt;br&gt;<a name="line.652"></a>
<FONT color="green">653</FONT>         * The validity of the test depends on the assumptions of the parametric<a name="line.653"></a>
<FONT color="green">654</FONT>         * t-test procedure, as discussed<a name="line.654"></a>
<FONT color="green">655</FONT>         * &lt;a href="http://www.basic.nwu.edu/statguidefiles/ttest_unpaired_ass_viol.html"&gt;<a name="line.655"></a>
<FONT color="green">656</FONT>         * here&lt;/a&gt;&lt;/p&gt;<a name="line.656"></a>
<FONT color="green">657</FONT>         * &lt;p&gt;<a name="line.657"></a>
<FONT color="green">658</FONT>         * &lt;strong&gt;Preconditions&lt;/strong&gt;: &lt;ul&gt;<a name="line.658"></a>
<FONT color="green">659</FONT>         * &lt;li&gt;The observed array lengths must both be at least 2.<a name="line.659"></a>
<FONT color="green">660</FONT>         * &lt;/li&gt;<a name="line.660"></a>
<FONT color="green">661</FONT>         * &lt;li&gt; &lt;code&gt; 0 &lt; alpha &lt; 0.5 &lt;/code&gt;<a name="line.661"></a>
<FONT color="green">662</FONT>         * &lt;/li&gt;&lt;/ul&gt;&lt;/p&gt;<a name="line.662"></a>
<FONT color="green">663</FONT>         *<a name="line.663"></a>
<FONT color="green">664</FONT>         * @param sample1 array of sample data values<a name="line.664"></a>
<FONT color="green">665</FONT>         * @param sample2 array of sample data values<a name="line.665"></a>
<FONT color="green">666</FONT>         * @param alpha significance level of the test<a name="line.666"></a>
<FONT color="green">667</FONT>         * @return true if the null hypothesis can be rejected with<a name="line.667"></a>
<FONT color="green">668</FONT>         * confidence 1 - alpha<a name="line.668"></a>
<FONT color="green">669</FONT>         * @throws IllegalArgumentException if the preconditions are not met<a name="line.669"></a>
<FONT color="green">670</FONT>         * @throws MathException if an error occurs performing the test<a name="line.670"></a>
<FONT color="green">671</FONT>         */<a name="line.671"></a>
<FONT color="green">672</FONT>        public boolean tTest(double[] sample1, double[] sample2,<a name="line.672"></a>
<FONT color="green">673</FONT>                double alpha)<a name="line.673"></a>
<FONT color="green">674</FONT>        throws IllegalArgumentException, MathException {<a name="line.674"></a>
<FONT color="green">675</FONT>            checkSignificanceLevel(alpha);<a name="line.675"></a>
<FONT color="green">676</FONT>            return tTest(sample1, sample2) &lt; alpha;<a name="line.676"></a>
<FONT color="green">677</FONT>        }<a name="line.677"></a>
<FONT color="green">678</FONT>    <a name="line.678"></a>
<FONT color="green">679</FONT>        /**<a name="line.679"></a>
<FONT color="green">680</FONT>         * Performs a<a name="line.680"></a>
<FONT color="green">681</FONT>         * &lt;a href="http://www.itl.nist.gov/div898/handbook/eda/section3/eda353.htm"&gt;<a name="line.681"></a>
<FONT color="green">682</FONT>         * two-sided t-test&lt;/a&gt; evaluating the null hypothesis that &lt;code&gt;sample1&lt;/code&gt;<a name="line.682"></a>
<FONT color="green">683</FONT>         * and &lt;code&gt;sample2&lt;/code&gt; are drawn from populations with the same mean,<a name="line.683"></a>
<FONT color="green">684</FONT>         * with significance level &lt;code&gt;alpha&lt;/code&gt;,  assuming that the<a name="line.684"></a>
<FONT color="green">685</FONT>         * subpopulation variances are equal.  Use<a name="line.685"></a>
<FONT color="green">686</FONT>         * {@link #tTest(double[], double[], double)} to perform the test without<a name="line.686"></a>
<FONT color="green">687</FONT>         * the assumption of equal variances.<a name="line.687"></a>
<FONT color="green">688</FONT>         * &lt;p&gt;<a name="line.688"></a>
<FONT color="green">689</FONT>         * Returns &lt;code&gt;true&lt;/code&gt; iff the null hypothesis that the means are<a name="line.689"></a>
<FONT color="green">690</FONT>         * equal can be rejected with confidence &lt;code&gt;1 - alpha&lt;/code&gt;.  To<a name="line.690"></a>
<FONT color="green">691</FONT>         * perform a 1-sided test, use &lt;code&gt;alpha * 2.&lt;/code&gt;  To perform the test<a name="line.691"></a>
<FONT color="green">692</FONT>         * without the assumption of equal subpopulation variances, use<a name="line.692"></a>
<FONT color="green">693</FONT>         * {@link #tTest(double[], double[], double)}.&lt;/p&gt;<a name="line.693"></a>
<FONT color="green">694</FONT>         * &lt;p&gt;<a name="line.694"></a>
<FONT color="green">695</FONT>         * A pooled variance estimate is used to compute the t-statistic. See<a name="line.695"></a>
<FONT color="green">696</FONT>         * {@link #t(double[], double[])} for the formula. The sum of the sample<a name="line.696"></a>
<FONT color="green">697</FONT>         * sizes minus 2 is used as the degrees of freedom.&lt;/p&gt;<a name="line.697"></a>
<FONT color="green">698</FONT>         * &lt;p&gt;<a name="line.698"></a>
<FONT color="green">699</FONT>         * &lt;strong&gt;Examples:&lt;/strong&gt;&lt;br&gt;&lt;ol&gt;<a name="line.699"></a>
<FONT color="green">700</FONT>         * &lt;li&gt;To test the (2-sided) hypothesis &lt;code&gt;mean 1 = mean 2 &lt;/code&gt; at<a name="line.700"></a>
<FONT color="green">701</FONT>         * the 95% level, use &lt;br&gt;&lt;code&gt;tTest(sample1, sample2, 0.05). &lt;/code&gt;<a name="line.701"></a>
<FONT color="green">702</FONT>         * &lt;/li&gt;<a name="line.702"></a>
<FONT color="green">703</FONT>         * &lt;li&gt;To test the (one-sided) hypothesis &lt;code&gt; mean 1 &lt; mean 2, &lt;/code&gt;<a name="line.703"></a>
<FONT color="green">704</FONT>         * at the 99% level, first verify that the measured mean of<a name="line.704"></a>
<FONT color="green">705</FONT>         * &lt;code&gt;sample 1&lt;/code&gt; is less than the mean of &lt;code&gt;sample 2&lt;/code&gt;<a name="line.705"></a>
<FONT color="green">706</FONT>         * and then use<a name="line.706"></a>
<FONT color="green">707</FONT>         * &lt;br&gt;&lt;code&gt;tTest(sample1, sample2, 0.02) &lt;/code&gt;<a name="line.707"></a>
<FONT color="green">708</FONT>         * &lt;/li&gt;&lt;/ol&gt;&lt;/p&gt;<a name="line.708"></a>
<FONT color="green">709</FONT>         * &lt;p&gt;<a name="line.709"></a>
<FONT color="green">710</FONT>         * &lt;strong&gt;Usage Note:&lt;/strong&gt;&lt;br&gt;<a name="line.710"></a>
<FONT color="green">711</FONT>         * The validity of the test depends on the assumptions of the parametric<a name="line.711"></a>
<FONT color="green">712</FONT>         * t-test procedure, as discussed<a name="line.712"></a>
<FONT color="green">713</FONT>         * &lt;a href="http://www.basic.nwu.edu/statguidefiles/ttest_unpaired_ass_viol.html"&gt;<a name="line.713"></a>
<FONT color="green">714</FONT>         * here&lt;/a&gt;&lt;/p&gt;<a name="line.714"></a>
<FONT color="green">715</FONT>         * &lt;p&gt;<a name="line.715"></a>
<FONT color="green">716</FONT>         * &lt;strong&gt;Preconditions&lt;/strong&gt;: &lt;ul&gt;<a name="line.716"></a>
<FONT color="green">717</FONT>         * &lt;li&gt;The observed array lengths must both be at least 2.<a name="line.717"></a>
<FONT color="green">718</FONT>         * &lt;/li&gt;<a name="line.718"></a>
<FONT color="green">719</FONT>         * &lt;li&gt; &lt;code&gt; 0 &lt; alpha &lt; 0.5 &lt;/code&gt;<a name="line.719"></a>
<FONT color="green">720</FONT>         * &lt;/li&gt;&lt;/ul&gt;&lt;/p&gt;<a name="line.720"></a>
<FONT color="green">721</FONT>         *<a name="line.721"></a>
<FONT color="green">722</FONT>         * @param sample1 array of sample data values<a name="line.722"></a>
<FONT color="green">723</FONT>         * @param sample2 array of sample data values<a name="line.723"></a>
<FONT color="green">724</FONT>         * @param alpha significance level of the test<a name="line.724"></a>
<FONT color="green">725</FONT>         * @return true if the null hypothesis can be rejected with<a name="line.725"></a>
<FONT color="green">726</FONT>         * confidence 1 - alpha<a name="line.726"></a>
<FONT color="green">727</FONT>         * @throws IllegalArgumentException if the preconditions are not met<a name="line.727"></a>
<FONT color="green">728</FONT>         * @throws MathException if an error occurs performing the test<a name="line.728"></a>
<FONT color="green">729</FONT>         */<a name="line.729"></a>
<FONT color="green">730</FONT>        public boolean homoscedasticTTest(double[] sample1, double[] sample2,<a name="line.730"></a>
<FONT color="green">731</FONT>                double alpha)<a name="line.731"></a>
<FONT color="green">732</FONT>        throws IllegalArgumentException, MathException {<a name="line.732"></a>
<FONT color="green">733</FONT>            checkSignificanceLevel(alpha);<a name="line.733"></a>
<FONT color="green">734</FONT>            return homoscedasticTTest(sample1, sample2) &lt; alpha;<a name="line.734"></a>
<FONT color="green">735</FONT>        }<a name="line.735"></a>
<FONT color="green">736</FONT>    <a name="line.736"></a>
<FONT color="green">737</FONT>         /**<a name="line.737"></a>
<FONT color="green">738</FONT>         * Returns the &lt;i&gt;observed significance level&lt;/i&gt;, or<a name="line.738"></a>
<FONT color="green">739</FONT>         * &lt;i&gt;p-value&lt;/i&gt;, associated with a two-sample, two-tailed t-test<a name="line.739"></a>
<FONT color="green">740</FONT>         * comparing the means of the datasets described by two StatisticalSummary<a name="line.740"></a>
<FONT color="green">741</FONT>         * instances.<a name="line.741"></a>
<FONT color="green">742</FONT>         * &lt;p&gt;<a name="line.742"></a>
<FONT color="green">743</FONT>         * The number returned is the smallest significance level<a name="line.743"></a>
<FONT color="green">744</FONT>         * at which one can reject the null hypothesis that the two means are<a name="line.744"></a>
<FONT color="green">745</FONT>         * equal in favor of the two-sided alternative that they are different.<a name="line.745"></a>
<FONT color="green">746</FONT>         * For a one-sided test, divide the returned value by 2.&lt;/p&gt;<a name="line.746"></a>
<FONT color="green">747</FONT>         * &lt;p&gt;<a name="line.747"></a>
<FONT color="green">748</FONT>         * The test does not assume that the underlying popuation variances are<a name="line.748"></a>
<FONT color="green">749</FONT>         * equal  and it uses approximated degrees of freedom computed from the<a name="line.749"></a>
<FONT color="green">750</FONT>         * sample data to compute the p-value.   To perform the test assuming<a name="line.750"></a>
<FONT color="green">751</FONT>         * equal variances, use<a name="line.751"></a>
<FONT color="green">752</FONT>         * {@link #homoscedasticTTest(StatisticalSummary, StatisticalSummary)}.&lt;/p&gt;<a name="line.752"></a>
<FONT color="green">753</FONT>         * &lt;p&gt;<a name="line.753"></a>
<FONT color="green">754</FONT>         * &lt;strong&gt;Usage Note:&lt;/strong&gt;&lt;br&gt;<a name="line.754"></a>
<FONT color="green">755</FONT>         * The validity of the p-value depends on the assumptions of the parametric<a name="line.755"></a>
<FONT color="green">756</FONT>         * t-test procedure, as discussed<a name="line.756"></a>
<FONT color="green">757</FONT>         * &lt;a href="http://www.basic.nwu.edu/statguidefiles/ttest_unpaired_ass_viol.html"&gt;<a name="line.757"></a>
<FONT color="green">758</FONT>         * here&lt;/a&gt;&lt;/p&gt;<a name="line.758"></a>
<FONT color="green">759</FONT>         * &lt;p&gt;<a name="line.759"></a>
<FONT color="green">760</FONT>         * &lt;strong&gt;Preconditions&lt;/strong&gt;: &lt;ul&gt;<a name="line.760"></a>
<FONT color="green">761</FONT>         * &lt;li&gt;The datasets described by the two Univariates must each contain<a name="line.761"></a>
<FONT color="green">762</FONT>         * at least 2 observations.<a name="line.762"></a>
<FONT color="green">763</FONT>         * &lt;/li&gt;&lt;/ul&gt;&lt;/p&gt;<a name="line.763"></a>
<FONT color="green">764</FONT>         *<a name="line.764"></a>
<FONT color="green">765</FONT>         * @param sampleStats1  StatisticalSummary describing data from the first sample<a name="line.765"></a>
<FONT color="green">766</FONT>         * @param sampleStats2  StatisticalSummary describing data from the second sample<a name="line.766"></a>
<FONT color="green">767</FONT>         * @return p-value for t-test<a name="line.767"></a>
<FONT color="green">768</FONT>         * @throws IllegalArgumentException if the precondition is not met<a name="line.768"></a>
<FONT color="green">769</FONT>         * @throws MathException if an error occurs computing the p-value<a name="line.769"></a>
<FONT color="green">770</FONT>         */<a name="line.770"></a>
<FONT color="green">771</FONT>        public double tTest(StatisticalSummary sampleStats1, StatisticalSummary sampleStats2)<a name="line.771"></a>
<FONT color="green">772</FONT>        throws IllegalArgumentException, MathException {<a name="line.772"></a>
<FONT color="green">773</FONT>            checkSampleData(sampleStats1);<a name="line.773"></a>
<FONT color="green">774</FONT>            checkSampleData(sampleStats2);<a name="line.774"></a>
<FONT color="green">775</FONT>            return tTest(sampleStats1.getMean(), sampleStats2.getMean(), sampleStats1.getVariance(),<a name="line.775"></a>
<FONT color="green">776</FONT>                    sampleStats2.getVariance(), sampleStats1.getN(),<a name="line.776"></a>
<FONT color="green">777</FONT>                    sampleStats2.getN());<a name="line.777"></a>
<FONT color="green">778</FONT>        }<a name="line.778"></a>
<FONT color="green">779</FONT>    <a name="line.779"></a>
<FONT color="green">780</FONT>        /**<a name="line.780"></a>
<FONT color="green">781</FONT>         * Returns the &lt;i&gt;observed significance level&lt;/i&gt;, or<a name="line.781"></a>
<FONT color="green">782</FONT>         * &lt;i&gt;p-value&lt;/i&gt;, associated with a two-sample, two-tailed t-test<a name="line.782"></a>
<FONT color="green">783</FONT>         * comparing the means of the datasets described by two StatisticalSummary<a name="line.783"></a>
<FONT color="green">784</FONT>         * instances, under the hypothesis of equal subpopulation variances. To<a name="line.784"></a>
<FONT color="green">785</FONT>         * perform a test without the equal variances assumption, use<a name="line.785"></a>
<FONT color="green">786</FONT>         * {@link #tTest(StatisticalSummary, StatisticalSummary)}.<a name="line.786"></a>
<FONT color="green">787</FONT>         * &lt;p&gt;<a name="line.787"></a>
<FONT color="green">788</FONT>         * The number returned is the smallest significance level<a name="line.788"></a>
<FONT color="green">789</FONT>         * at which one can reject the null hypothesis that the two means are<a name="line.789"></a>
<FONT color="green">790</FONT>         * equal in favor of the two-sided alternative that they are different.<a name="line.790"></a>
<FONT color="green">791</FONT>         * For a one-sided test, divide the returned value by 2.&lt;/p&gt;<a name="line.791"></a>
<FONT color="green">792</FONT>         * &lt;p&gt;<a name="line.792"></a>
<FONT color="green">793</FONT>         * See {@link #homoscedasticT(double[], double[])} for the formula used to<a name="line.793"></a>
<FONT color="green">794</FONT>         * compute the t-statistic. The sum of the  sample sizes minus 2 is used as<a name="line.794"></a>
<FONT color="green">795</FONT>         * the degrees of freedom.&lt;/p&gt;<a name="line.795"></a>
<FONT color="green">796</FONT>         * &lt;p&gt;<a name="line.796"></a>
<FONT color="green">797</FONT>         * &lt;strong&gt;Usage Note:&lt;/strong&gt;&lt;br&gt;<a name="line.797"></a>
<FONT color="green">798</FONT>         * The validity of the p-value depends on the assumptions of the parametric<a name="line.798"></a>
<FONT color="green">799</FONT>         * t-test procedure, as discussed<a name="line.799"></a>
<FONT color="green">800</FONT>         * &lt;a href="http://www.basic.nwu.edu/statguidefiles/ttest_unpaired_ass_viol.html"&gt;here&lt;/a&gt;<a name="line.800"></a>
<FONT color="green">801</FONT>         * &lt;/p&gt;&lt;p&gt;<a name="line.801"></a>
<FONT color="green">802</FONT>         * &lt;strong&gt;Preconditions&lt;/strong&gt;: &lt;ul&gt;<a name="line.802"></a>
<FONT color="green">803</FONT>         * &lt;li&gt;The datasets described by the two Univariates must each contain<a name="line.803"></a>
<FONT color="green">804</FONT>         * at least 2 observations.<a name="line.804"></a>
<FONT color="green">805</FONT>         * &lt;/li&gt;&lt;/ul&gt;&lt;/p&gt;<a name="line.805"></a>
<FONT color="green">806</FONT>         *<a name="line.806"></a>
<FONT color="green">807</FONT>         * @param sampleStats1  StatisticalSummary describing data from the first sample<a name="line.807"></a>
<FONT color="green">808</FONT>         * @param sampleStats2  StatisticalSummary describing data from the second sample<a name="line.808"></a>
<FONT color="green">809</FONT>         * @return p-value for t-test<a name="line.809"></a>
<FONT color="green">810</FONT>         * @throws IllegalArgumentException if the precondition is not met<a name="line.810"></a>
<FONT color="green">811</FONT>         * @throws MathException if an error occurs computing the p-value<a name="line.811"></a>
<FONT color="green">812</FONT>         */<a name="line.812"></a>
<FONT color="green">813</FONT>        public double homoscedasticTTest(StatisticalSummary sampleStats1,<a name="line.813"></a>
<FONT color="green">814</FONT>                                         StatisticalSummary sampleStats2)<a name="line.814"></a>
<FONT color="green">815</FONT>        throws IllegalArgumentException, MathException {<a name="line.815"></a>
<FONT color="green">816</FONT>            checkSampleData(sampleStats1);<a name="line.816"></a>
<FONT color="green">817</FONT>            checkSampleData(sampleStats2);<a name="line.817"></a>
<FONT color="green">818</FONT>            return homoscedasticTTest(sampleStats1.getMean(),<a name="line.818"></a>
<FONT color="green">819</FONT>                    sampleStats2.getMean(), sampleStats1.getVariance(),<a name="line.819"></a>
<FONT color="green">820</FONT>                    sampleStats2.getVariance(), sampleStats1.getN(),<a name="line.820"></a>
<FONT color="green">821</FONT>                    sampleStats2.getN());<a name="line.821"></a>
<FONT color="green">822</FONT>        }<a name="line.822"></a>
<FONT color="green">823</FONT>    <a name="line.823"></a>
<FONT color="green">824</FONT>        /**<a name="line.824"></a>
<FONT color="green">825</FONT>         * Performs a<a name="line.825"></a>
<FONT color="green">826</FONT>         * &lt;a href="http://www.itl.nist.gov/div898/handbook/eda/section3/eda353.htm"&gt;<a name="line.826"></a>
<FONT color="green">827</FONT>         * two-sided t-test&lt;/a&gt; evaluating the null hypothesis that<a name="line.827"></a>
<FONT color="green">828</FONT>         * &lt;code&gt;sampleStats1&lt;/code&gt; and &lt;code&gt;sampleStats2&lt;/code&gt; describe<a name="line.828"></a>
<FONT color="green">829</FONT>         * datasets drawn from populations with the same mean, with significance<a name="line.829"></a>
<FONT color="green">830</FONT>         * level &lt;code&gt;alpha&lt;/code&gt;.   This test does not assume that the<a name="line.830"></a>
<FONT color="green">831</FONT>         * subpopulation variances are equal.  To perform the test under the equal<a name="line.831"></a>
<FONT color="green">832</FONT>         * variances assumption, use<a name="line.832"></a>
<FONT color="green">833</FONT>         * {@link #homoscedasticTTest(StatisticalSummary, StatisticalSummary)}.<a name="line.833"></a>
<FONT color="green">834</FONT>         * &lt;p&gt;<a name="line.834"></a>
<FONT color="green">835</FONT>         * Returns &lt;code&gt;true&lt;/code&gt; iff the null hypothesis that the means are<a name="line.835"></a>
<FONT color="green">836</FONT>         * equal can be rejected with confidence &lt;code&gt;1 - alpha&lt;/code&gt;.  To<a name="line.836"></a>
<FONT color="green">837</FONT>         * perform a 1-sided test, use &lt;code&gt;alpha * 2&lt;/code&gt;&lt;/p&gt;<a name="line.837"></a>
<FONT color="green">838</FONT>         * &lt;p&gt;<a name="line.838"></a>
<FONT color="green">839</FONT>         * See {@link #t(double[], double[])} for the formula used to compute the<a name="line.839"></a>
<FONT color="green">840</FONT>         * t-statistic.  Degrees of freedom are approximated using the<a name="line.840"></a>
<FONT color="green">841</FONT>         * &lt;a href="http://www.itl.nist.gov/div898/handbook/prc/section3/prc31.htm"&gt;<a name="line.841"></a>
<FONT color="green">842</FONT>         * Welch-Satterthwaite approximation.&lt;/a&gt;&lt;/p&gt;<a name="line.842"></a>
<FONT color="green">843</FONT>         * &lt;p&gt;<a name="line.843"></a>
<FONT color="green">844</FONT>         * &lt;strong&gt;Examples:&lt;/strong&gt;&lt;br&gt;&lt;ol&gt;<a name="line.844"></a>
<FONT color="green">845</FONT>         * &lt;li&gt;To test the (2-sided) hypothesis &lt;code&gt;mean 1 = mean 2 &lt;/code&gt; at<a name="line.845"></a>
<FONT color="green">846</FONT>         * the 95%, use<a name="line.846"></a>
<FONT color="green">847</FONT>         * &lt;br&gt;&lt;code&gt;tTest(sampleStats1, sampleStats2, 0.05) &lt;/code&gt;<a name="line.847"></a>
<FONT color="green">848</FONT>         * &lt;/li&gt;<a name="line.848"></a>
<FONT color="green">849</FONT>         * &lt;li&gt;To test the (one-sided) hypothesis &lt;code&gt; mean 1 &lt; mean 2 &lt;/code&gt;<a name="line.849"></a>
<FONT color="green">850</FONT>         * at the 99% level,  first verify that the measured mean of<a name="line.850"></a>
<FONT color="green">851</FONT>         * &lt;code&gt;sample 1&lt;/code&gt; is less than  the mean of &lt;code&gt;sample 2&lt;/code&gt;<a name="line.851"></a>
<FONT color="green">852</FONT>         * and then use<a name="line.852"></a>
<FONT color="green">853</FONT>         * &lt;br&gt;&lt;code&gt;tTest(sampleStats1, sampleStats2, 0.02) &lt;/code&gt;<a name="line.853"></a>
<FONT color="green">854</FONT>         * &lt;/li&gt;&lt;/ol&gt;&lt;/p&gt;<a name="line.854"></a>
<FONT color="green">855</FONT>         * &lt;p&gt;<a name="line.855"></a>
<FONT color="green">856</FONT>         * &lt;strong&gt;Usage Note:&lt;/strong&gt;&lt;br&gt;<a name="line.856"></a>
<FONT color="green">857</FONT>         * The validity of the test depends on the assumptions of the parametric<a name="line.857"></a>
<FONT color="green">858</FONT>         * t-test procedure, as discussed<a name="line.858"></a>
<FONT color="green">859</FONT>         * &lt;a href="http://www.basic.nwu.edu/statguidefiles/ttest_unpaired_ass_viol.html"&gt;<a name="line.859"></a>
<FONT color="green">860</FONT>         * here&lt;/a&gt;&lt;/p&gt;<a name="line.860"></a>
<FONT color="green">861</FONT>         * &lt;p&gt;<a name="line.861"></a>
<FONT color="green">862</FONT>         * &lt;strong&gt;Preconditions&lt;/strong&gt;: &lt;ul&gt;<a name="line.862"></a>
<FONT color="green">863</FONT>         * &lt;li&gt;The datasets described by the two Univariates must each contain<a name="line.863"></a>
<FONT color="green">864</FONT>         * at least 2 observations.<a name="line.864"></a>
<FONT color="green">865</FONT>         * &lt;/li&gt;<a name="line.865"></a>
<FONT color="green">866</FONT>         * &lt;li&gt; &lt;code&gt; 0 &lt; alpha &lt; 0.5 &lt;/code&gt;<a name="line.866"></a>
<FONT color="green">867</FONT>         * &lt;/li&gt;&lt;/ul&gt;&lt;/p&gt;<a name="line.867"></a>
<FONT color="green">868</FONT>         *<a name="line.868"></a>
<FONT color="green">869</FONT>         * @param sampleStats1 StatisticalSummary describing sample data values<a name="line.869"></a>
<FONT color="green">870</FONT>         * @param sampleStats2 StatisticalSummary describing sample data values<a name="line.870"></a>
<FONT color="green">871</FONT>         * @param alpha significance level of the test<a name="line.871"></a>
<FONT color="green">872</FONT>         * @return true if the null hypothesis can be rejected with<a name="line.872"></a>
<FONT color="green">873</FONT>         * confidence 1 - alpha<a name="line.873"></a>
<FONT color="green">874</FONT>         * @throws IllegalArgumentException if the preconditions are not met<a name="line.874"></a>
<FONT color="green">875</FONT>         * @throws MathException if an error occurs performing the test<a name="line.875"></a>
<FONT color="green">876</FONT>         */<a name="line.876"></a>
<FONT color="green">877</FONT>        public boolean tTest(StatisticalSummary sampleStats1,<a name="line.877"></a>
<FONT color="green">878</FONT>                StatisticalSummary sampleStats2, double alpha)<a name="line.878"></a>
<FONT color="green">879</FONT>        throws IllegalArgumentException, MathException {<a name="line.879"></a>
<FONT color="green">880</FONT>            checkSignificanceLevel(alpha);<a name="line.880"></a>
<FONT color="green">881</FONT>            return tTest(sampleStats1, sampleStats2) &lt; alpha;<a name="line.881"></a>
<FONT color="green">882</FONT>        }<a name="line.882"></a>
<FONT color="green">883</FONT>    <a name="line.883"></a>
<FONT color="green">884</FONT>        //----------------------------------------------- Protected methods<a name="line.884"></a>
<FONT color="green">885</FONT>    <a name="line.885"></a>
<FONT color="green">886</FONT>        /**<a name="line.886"></a>
<FONT color="green">887</FONT>         * Computes approximate degrees of freedom for 2-sample t-test.<a name="line.887"></a>
<FONT color="green">888</FONT>         *<a name="line.888"></a>
<FONT color="green">889</FONT>         * @param v1 first sample variance<a name="line.889"></a>
<FONT color="green">890</FONT>         * @param v2 second sample variance<a name="line.890"></a>
<FONT color="green">891</FONT>         * @param n1 first sample n<a name="line.891"></a>
<FONT color="green">892</FONT>         * @param n2 second sample n<a name="line.892"></a>
<FONT color="green">893</FONT>         * @return approximate degrees of freedom<a name="line.893"></a>
<FONT color="green">894</FONT>         */<a name="line.894"></a>
<FONT color="green">895</FONT>        protected double df(double v1, double v2, double n1, double n2) {<a name="line.895"></a>
<FONT color="green">896</FONT>            return (((v1 / n1) + (v2 / n2)) * ((v1 / n1) + (v2 / n2))) /<a name="line.896"></a>
<FONT color="green">897</FONT>            ((v1 * v1) / (n1 * n1 * (n1 - 1d)) + (v2 * v2) /<a name="line.897"></a>
<FONT color="green">898</FONT>                    (n2 * n2 * (n2 - 1d)));<a name="line.898"></a>
<FONT color="green">899</FONT>        }<a name="line.899"></a>
<FONT color="green">900</FONT>    <a name="line.900"></a>
<FONT color="green">901</FONT>        /**<a name="line.901"></a>
<FONT color="green">902</FONT>         * Computes t test statistic for 1-sample t-test.<a name="line.902"></a>
<FONT color="green">903</FONT>         *<a name="line.903"></a>
<FONT color="green">904</FONT>         * @param m sample mean<a name="line.904"></a>
<FONT color="green">905</FONT>         * @param mu constant to test against<a name="line.905"></a>
<FONT color="green">906</FONT>         * @param v sample variance<a name="line.906"></a>
<FONT color="green">907</FONT>         * @param n sample n<a name="line.907"></a>
<FONT color="green">908</FONT>         * @return t test statistic<a name="line.908"></a>
<FONT color="green">909</FONT>         */<a name="line.909"></a>
<FONT color="green">910</FONT>        protected double t(double m, double mu, double v, double n) {<a name="line.910"></a>
<FONT color="green">911</FONT>            return (m - mu) / Math.sqrt(v / n);<a name="line.911"></a>
<FONT color="green">912</FONT>        }<a name="line.912"></a>
<FONT color="green">913</FONT>    <a name="line.913"></a>
<FONT color="green">914</FONT>        /**<a name="line.914"></a>
<FONT color="green">915</FONT>         * Computes t test statistic for 2-sample t-test.<a name="line.915"></a>
<FONT color="green">916</FONT>         * &lt;p&gt;<a name="line.916"></a>
<FONT color="green">917</FONT>         * Does not assume that subpopulation variances are equal.&lt;/p&gt;<a name="line.917"></a>
<FONT color="green">918</FONT>         *<a name="line.918"></a>
<FONT color="green">919</FONT>         * @param m1 first sample mean<a name="line.919"></a>
<FONT color="green">920</FONT>         * @param m2 second sample mean<a name="line.920"></a>
<FONT color="green">921</FONT>         * @param v1 first sample variance<a name="line.921"></a>
<FONT color="green">922</FONT>         * @param v2 second sample variance<a name="line.922"></a>
<FONT color="green">923</FONT>         * @param n1 first sample n<a name="line.923"></a>
<FONT color="green">924</FONT>         * @param n2 second sample n<a name="line.924"></a>
<FONT color="green">925</FONT>         * @return t test statistic<a name="line.925"></a>
<FONT color="green">926</FONT>         */<a name="line.926"></a>
<FONT color="green">927</FONT>        protected double t(double m1, double m2,  double v1, double v2, double n1,<a name="line.927"></a>
<FONT color="green">928</FONT>                double n2)  {<a name="line.928"></a>
<FONT color="green">929</FONT>                return (m1 - m2) / Math.sqrt((v1 / n1) + (v2 / n2));<a name="line.929"></a>
<FONT color="green">930</FONT>        }<a name="line.930"></a>
<FONT color="green">931</FONT>    <a name="line.931"></a>
<FONT color="green">932</FONT>        /**<a name="line.932"></a>
<FONT color="green">933</FONT>         * Computes t test statistic for 2-sample t-test under the hypothesis<a name="line.933"></a>
<FONT color="green">934</FONT>         * of equal subpopulation variances.<a name="line.934"></a>
<FONT color="green">935</FONT>         *<a name="line.935"></a>
<FONT color="green">936</FONT>         * @param m1 first sample mean<a name="line.936"></a>
<FONT color="green">937</FONT>         * @param m2 second sample mean<a name="line.937"></a>
<FONT color="green">938</FONT>         * @param v1 first sample variance<a name="line.938"></a>
<FONT color="green">939</FONT>         * @param v2 second sample variance<a name="line.939"></a>
<FONT color="green">940</FONT>         * @param n1 first sample n<a name="line.940"></a>
<FONT color="green">941</FONT>         * @param n2 second sample n<a name="line.941"></a>
<FONT color="green">942</FONT>         * @return t test statistic<a name="line.942"></a>
<FONT color="green">943</FONT>         */<a name="line.943"></a>
<FONT color="green">944</FONT>        protected double homoscedasticT(double m1, double m2,  double v1,<a name="line.944"></a>
<FONT color="green">945</FONT>                double v2, double n1, double n2)  {<a name="line.945"></a>
<FONT color="green">946</FONT>                double pooledVariance = ((n1  - 1) * v1 + (n2 -1) * v2 ) / (n1 + n2 - 2);<a name="line.946"></a>
<FONT color="green">947</FONT>                return (m1 - m2) / Math.sqrt(pooledVariance * (1d / n1 + 1d / n2));<a name="line.947"></a>
<FONT color="green">948</FONT>        }<a name="line.948"></a>
<FONT color="green">949</FONT>    <a name="line.949"></a>
<FONT color="green">950</FONT>        /**<a name="line.950"></a>
<FONT color="green">951</FONT>         * Computes p-value for 2-sided, 1-sample t-test.<a name="line.951"></a>
<FONT color="green">952</FONT>         *<a name="line.952"></a>
<FONT color="green">953</FONT>         * @param m sample mean<a name="line.953"></a>
<FONT color="green">954</FONT>         * @param mu constant to test against<a name="line.954"></a>
<FONT color="green">955</FONT>         * @param v sample variance<a name="line.955"></a>
<FONT color="green">956</FONT>         * @param n sample n<a name="line.956"></a>
<FONT color="green">957</FONT>         * @return p-value<a name="line.957"></a>
<FONT color="green">958</FONT>         * @throws MathException if an error occurs computing the p-value<a name="line.958"></a>
<FONT color="green">959</FONT>         */<a name="line.959"></a>
<FONT color="green">960</FONT>        protected double tTest(double m, double mu, double v, double n)<a name="line.960"></a>
<FONT color="green">961</FONT>        throws MathException {<a name="line.961"></a>
<FONT color="green">962</FONT>            double t = Math.abs(t(m, mu, v, n));<a name="line.962"></a>
<FONT color="green">963</FONT>            distribution.setDegreesOfFreedom(n - 1);<a name="line.963"></a>
<FONT color="green">964</FONT>            return 2.0 * distribution.cumulativeProbability(-t);<a name="line.964"></a>
<FONT color="green">965</FONT>        }<a name="line.965"></a>
<FONT color="green">966</FONT>    <a name="line.966"></a>
<FONT color="green">967</FONT>        /**<a name="line.967"></a>
<FONT color="green">968</FONT>         * Computes p-value for 2-sided, 2-sample t-test.<a name="line.968"></a>
<FONT color="green">969</FONT>         * &lt;p&gt;<a name="line.969"></a>
<FONT color="green">970</FONT>         * Does not assume subpopulation variances are equal. Degrees of freedom<a name="line.970"></a>
<FONT color="green">971</FONT>         * are estimated from the data.&lt;/p&gt;<a name="line.971"></a>
<FONT color="green">972</FONT>         *<a name="line.972"></a>
<FONT color="green">973</FONT>         * @param m1 first sample mean<a name="line.973"></a>
<FONT color="green">974</FONT>         * @param m2 second sample mean<a name="line.974"></a>
<FONT color="green">975</FONT>         * @param v1 first sample variance<a name="line.975"></a>
<FONT color="green">976</FONT>         * @param v2 second sample variance<a name="line.976"></a>
<FONT color="green">977</FONT>         * @param n1 first sample n<a name="line.977"></a>
<FONT color="green">978</FONT>         * @param n2 second sample n<a name="line.978"></a>
<FONT color="green">979</FONT>         * @return p-value<a name="line.979"></a>
<FONT color="green">980</FONT>         * @throws MathException if an error occurs computing the p-value<a name="line.980"></a>
<FONT color="green">981</FONT>         */<a name="line.981"></a>
<FONT color="green">982</FONT>        protected double tTest(double m1, double m2, double v1, double v2,<a name="line.982"></a>
<FONT color="green">983</FONT>                double n1, double n2)<a name="line.983"></a>
<FONT color="green">984</FONT>        throws MathException {<a name="line.984"></a>
<FONT color="green">985</FONT>            double t = Math.abs(t(m1, m2, v1, v2, n1, n2));<a name="line.985"></a>
<FONT color="green">986</FONT>            double degreesOfFreedom = 0;<a name="line.986"></a>
<FONT color="green">987</FONT>            degreesOfFreedom = df(v1, v2, n1, n2);<a name="line.987"></a>
<FONT color="green">988</FONT>            distribution.setDegreesOfFreedom(degreesOfFreedom);<a name="line.988"></a>
<FONT color="green">989</FONT>            return 2.0 * distribution.cumulativeProbability(-t);<a name="line.989"></a>
<FONT color="green">990</FONT>        }<a name="line.990"></a>
<FONT color="green">991</FONT>    <a name="line.991"></a>
<FONT color="green">992</FONT>        /**<a name="line.992"></a>
<FONT color="green">993</FONT>         * Computes p-value for 2-sided, 2-sample t-test, under the assumption<a name="line.993"></a>
<FONT color="green">994</FONT>         * of equal subpopulation variances.<a name="line.994"></a>
<FONT color="green">995</FONT>         * &lt;p&gt;<a name="line.995"></a>
<FONT color="green">996</FONT>         * The sum of the sample sizes minus 2 is used as degrees of freedom.&lt;/p&gt;<a name="line.996"></a>
<FONT color="green">997</FONT>         *<a name="line.997"></a>
<FONT color="green">998</FONT>         * @param m1 first sample mean<a name="line.998"></a>
<FONT color="green">999</FONT>         * @param m2 second sample mean<a name="line.999"></a>
<FONT color="green">1000</FONT>         * @param v1 first sample variance<a name="line.1000"></a>
<FONT color="green">1001</FONT>         * @param v2 second sample variance<a name="line.1001"></a>
<FONT color="green">1002</FONT>         * @param n1 first sample n<a name="line.1002"></a>
<FONT color="green">1003</FONT>         * @param n2 second sample n<a name="line.1003"></a>
<FONT color="green">1004</FONT>         * @return p-value<a name="line.1004"></a>
<FONT color="green">1005</FONT>         * @throws MathException if an error occurs computing the p-value<a name="line.1005"></a>
<FONT color="green">1006</FONT>         */<a name="line.1006"></a>
<FONT color="green">1007</FONT>        protected double homoscedasticTTest(double m1, double m2, double v1,<a name="line.1007"></a>
<FONT color="green">1008</FONT>                double v2, double n1, double n2)<a name="line.1008"></a>
<FONT color="green">1009</FONT>        throws MathException {<a name="line.1009"></a>
<FONT color="green">1010</FONT>            double t = Math.abs(homoscedasticT(m1, m2, v1, v2, n1, n2));<a name="line.1010"></a>
<FONT color="green">1011</FONT>            double degreesOfFreedom = n1 + n2 - 2;<a name="line.1011"></a>
<FONT color="green">1012</FONT>            distribution.setDegreesOfFreedom(degreesOfFreedom);<a name="line.1012"></a>
<FONT color="green">1013</FONT>            return 2.0 * distribution.cumulativeProbability(-t);<a name="line.1013"></a>
<FONT color="green">1014</FONT>        }<a name="line.1014"></a>
<FONT color="green">1015</FONT>    <a name="line.1015"></a>
<FONT color="green">1016</FONT>        /**<a name="line.1016"></a>
<FONT color="green">1017</FONT>         * Modify the distribution used to compute inference statistics.<a name="line.1017"></a>
<FONT color="green">1018</FONT>         * @param value the new distribution<a name="line.1018"></a>
<FONT color="green">1019</FONT>         * @since 1.2<a name="line.1019"></a>
<FONT color="green">1020</FONT>         */<a name="line.1020"></a>
<FONT color="green">1021</FONT>        public void setDistribution(TDistribution value) {<a name="line.1021"></a>
<FONT color="green">1022</FONT>            distribution = value;<a name="line.1022"></a>
<FONT color="green">1023</FONT>        }<a name="line.1023"></a>
<FONT color="green">1024</FONT>    <a name="line.1024"></a>
<FONT color="green">1025</FONT>        /** Check significance level.<a name="line.1025"></a>
<FONT color="green">1026</FONT>         * @param alpha significance level<a name="line.1026"></a>
<FONT color="green">1027</FONT>         * @exception IllegalArgumentException if significance level is out of bounds<a name="line.1027"></a>
<FONT color="green">1028</FONT>         */<a name="line.1028"></a>
<FONT color="green">1029</FONT>        private void checkSignificanceLevel(final double alpha)<a name="line.1029"></a>
<FONT color="green">1030</FONT>            throws IllegalArgumentException {<a name="line.1030"></a>
<FONT color="green">1031</FONT>            if ((alpha &lt;= 0) || (alpha &gt; 0.5)) {<a name="line.1031"></a>
<FONT color="green">1032</FONT>                throw MathRuntimeException.createIllegalArgumentException(<a name="line.1032"></a>
<FONT color="green">1033</FONT>                      "out of bounds significance level {0}, must be between {1} and {2}",<a name="line.1033"></a>
<FONT color="green">1034</FONT>                      alpha, 0.0, 0.5);<a name="line.1034"></a>
<FONT color="green">1035</FONT>            }<a name="line.1035"></a>
<FONT color="green">1036</FONT>        }<a name="line.1036"></a>
<FONT color="green">1037</FONT>    <a name="line.1037"></a>
<FONT color="green">1038</FONT>        /** Check sample data.<a name="line.1038"></a>
<FONT color="green">1039</FONT>         * @param data sample data<a name="line.1039"></a>
<FONT color="green">1040</FONT>         * @exception IllegalArgumentException if there is not enough sample data<a name="line.1040"></a>
<FONT color="green">1041</FONT>         */<a name="line.1041"></a>
<FONT color="green">1042</FONT>        private void checkSampleData(final double[] data)<a name="line.1042"></a>
<FONT color="green">1043</FONT>            throws IllegalArgumentException {<a name="line.1043"></a>
<FONT color="green">1044</FONT>            if ((data == null) || (data.length &lt; 2)) {<a name="line.1044"></a>
<FONT color="green">1045</FONT>                throw MathRuntimeException.createIllegalArgumentException(<a name="line.1045"></a>
<FONT color="green">1046</FONT>                      INSUFFICIENT_DATA_MESSAGE,<a name="line.1046"></a>
<FONT color="green">1047</FONT>                      (data == null) ? 0 : data.length);<a name="line.1047"></a>
<FONT color="green">1048</FONT>            }<a name="line.1048"></a>
<FONT color="green">1049</FONT>        }<a name="line.1049"></a>
<FONT color="green">1050</FONT>    <a name="line.1050"></a>
<FONT color="green">1051</FONT>        /** Check sample data.<a name="line.1051"></a>
<FONT color="green">1052</FONT>         * @param stat statistical summary<a name="line.1052"></a>
<FONT color="green">1053</FONT>         * @exception IllegalArgumentException if there is not enough sample data<a name="line.1053"></a>
<FONT color="green">1054</FONT>         */<a name="line.1054"></a>
<FONT color="green">1055</FONT>        private void checkSampleData(final StatisticalSummary stat)<a name="line.1055"></a>
<FONT color="green">1056</FONT>            throws IllegalArgumentException {<a name="line.1056"></a>
<FONT color="green">1057</FONT>            if ((stat == null) || (stat.getN() &lt; 2)) {<a name="line.1057"></a>
<FONT color="green">1058</FONT>                throw MathRuntimeException.createIllegalArgumentException(<a name="line.1058"></a>
<FONT color="green">1059</FONT>                      INSUFFICIENT_DATA_MESSAGE,<a name="line.1059"></a>
<FONT color="green">1060</FONT>                      (stat == null) ? 0 : stat.getN());<a name="line.1060"></a>
<FONT color="green">1061</FONT>            }<a name="line.1061"></a>
<FONT color="green">1062</FONT>        }<a name="line.1062"></a>
<FONT color="green">1063</FONT>    <a name="line.1063"></a>
<FONT color="green">1064</FONT>    }<a name="line.1064"></a>


</PRE>
</BODY>
</HTML>
author	dwinter
date	Tue, 04 Jan 2011 10:02:07 +0100
parents
children