mirror of
				https://github.com/saitohirga/WSJT-X.git
				synced 2025-10-26 02:20:20 -04:00 
			
		
		
		
	
		
			
	
	
		
			425 lines
		
	
	
		
			16 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
		
		
			
		
	
	
			425 lines
		
	
	
		
			16 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
|  | // Copyright John Maddock 2006
 | ||
|  | // Copyright Paul A. Bristow 2007, 2010
 | ||
|  | 
 | ||
|  | // Use, modification and distribution are subject to the
 | ||
|  | // Boost Software License, Version 1.0.
 | ||
|  | // (See accompanying file LICENSE_1_0.txt
 | ||
|  | // or copy at http://www.boost.org/LICENSE_1_0.txt)
 | ||
|  | 
 | ||
|  | #ifdef _MSC_VER
 | ||
|  | #  pragma warning(disable: 4512) // assignment operator could not be generated.
 | ||
|  | #  pragma warning(disable: 4510) // default constructor could not be generated.
 | ||
|  | #  pragma warning(disable: 4610) // can never be instantiated - user defined constructor required.
 | ||
|  | #endif
 | ||
|  | 
 | ||
|  | #include <boost/math/distributions/students_t.hpp>
 | ||
|  | 
 | ||
|  | // avoid "using namespace std;" and "using namespace boost::math;"
 | ||
|  | // to avoid potential ambiguity with names in std random.
 | ||
|  | #include <iostream>
 | ||
|  | using std::cout; using std::endl; | ||
|  | using std::left; using std::fixed; using std::right; using std::scientific; | ||
|  | #include <iomanip>
 | ||
|  | using std::setw; | ||
|  | using std::setprecision; | ||
|  | 
 | ||
|  | void confidence_limits_on_mean(double Sm, double Sd, unsigned Sn) | ||
|  | { | ||
|  |    //
 | ||
|  |    // Sm = Sample Mean.
 | ||
|  |    // Sd = Sample Standard Deviation.
 | ||
|  |    // Sn = Sample Size.
 | ||
|  |    //
 | ||
|  |    // Calculate confidence intervals for the mean.
 | ||
|  |    // For example if we set the confidence limit to
 | ||
|  |    // 0.95, we know that if we repeat the sampling
 | ||
|  |    // 100 times, then we expect that the true mean
 | ||
|  |    // will be between out limits on 95 occations.
 | ||
|  |    // Note: this is not the same as saying a 95%
 | ||
|  |    // confidence interval means that there is a 95%
 | ||
|  |    // probability that the interval contains the true mean.
 | ||
|  |    // The interval computed from a given sample either
 | ||
|  |    // contains the true mean or it does not.
 | ||
|  |    // See http://www.itl.nist.gov/div898/handbook/eda/section3/eda352.htm
 | ||
|  | 
 | ||
|  |    using boost::math::students_t; | ||
|  | 
 | ||
|  |    // Print out general info:
 | ||
|  |    cout << | ||
|  |       "__________________________________\n" | ||
|  |       "2-Sided Confidence Limits For Mean\n" | ||
|  |       "__________________________________\n\n"; | ||
|  |    cout << setprecision(7); | ||
|  |    cout << setw(40) << left << "Number of Observations" << "=  " << Sn << "\n"; | ||
|  |    cout << setw(40) << left << "Mean" << "=  " << Sm << "\n"; | ||
|  |    cout << setw(40) << left << "Standard Deviation" << "=  " << Sd << "\n"; | ||
|  |    //
 | ||
|  |    // Define a table of significance/risk levels:
 | ||
|  |    //
 | ||
|  |    double alpha[] = { 0.5, 0.25, 0.1, 0.05, 0.01, 0.001, 0.0001, 0.00001 }; | ||
|  |    //
 | ||
|  |    // Start by declaring the distribution we'll need:
 | ||
|  |    //
 | ||
|  |    students_t dist(Sn - 1); | ||
|  |    //
 | ||
|  |    // Print table header:
 | ||
|  |    //
 | ||
|  |    cout << "\n\n" | ||
|  |            "_______________________________________________________________\n" | ||
|  |            "Confidence       T           Interval          Lower          Upper\n" | ||
|  |            " Value (%)     Value          Width            Limit          Limit\n" | ||
|  |            "_______________________________________________________________\n"; | ||
|  |    //
 | ||
|  |    // Now print out the data for the table rows.
 | ||
|  |    //
 | ||
|  |    for(unsigned i = 0; i < sizeof(alpha)/sizeof(alpha[0]); ++i) | ||
|  |    { | ||
|  |       // Confidence value:
 | ||
|  |       cout << fixed << setprecision(3) << setw(10) << right << 100 * (1-alpha[i]); | ||
|  |       // calculate T:
 | ||
|  |       double T = quantile(complement(dist, alpha[i] / 2)); | ||
|  |       // Print T:
 | ||
|  |       cout << fixed << setprecision(3) << setw(10) << right << T; | ||
|  |       // Calculate width of interval (one sided):
 | ||
|  |       double w = T * Sd / sqrt(double(Sn)); | ||
|  |       // Print width:
 | ||
|  |       if(w < 0.01) | ||
|  |          cout << scientific << setprecision(3) << setw(17) << right << w; | ||
|  |       else | ||
|  |          cout << fixed << setprecision(3) << setw(17) << right << w; | ||
|  |       // Print Limits:
 | ||
|  |       cout << fixed << setprecision(5) << setw(15) << right << Sm - w; | ||
|  |       cout << fixed << setprecision(5) << setw(15) << right << Sm + w << endl; | ||
|  |    } | ||
|  |    cout << endl; | ||
|  | } // void confidence_limits_on_mean
 | ||
|  | 
 | ||
|  | void single_sample_t_test(double M, double Sm, double Sd, unsigned Sn, double alpha) | ||
|  | { | ||
|  |    //
 | ||
|  |    // M = true mean.
 | ||
|  |    // Sm = Sample Mean.
 | ||
|  |    // Sd = Sample Standard Deviation.
 | ||
|  |    // Sn = Sample Size.
 | ||
|  |    // alpha = Significance Level.
 | ||
|  |    //
 | ||
|  |    // A Students t test applied to a single set of data.
 | ||
|  |    // We are testing the null hypothesis that the true
 | ||
|  |    // mean of the sample is M, and that any variation is down
 | ||
|  |    // to chance.  We can also test the alternative hypothesis
 | ||
|  |    // that any difference is not down to chance.
 | ||
|  |    // See http://www.itl.nist.gov/div898/handbook/eda/section3/eda352.htm
 | ||
|  |     | ||
|  |    using boost::math::students_t; | ||
|  | 
 | ||
|  |    // Print header:
 | ||
|  |    cout << | ||
|  |       "__________________________________\n" | ||
|  |       "Student t test for a single sample\n" | ||
|  |       "__________________________________\n\n"; | ||
|  |    cout << setprecision(5); | ||
|  |    cout << setw(55) << left << "Number of Observations" << "=  " << Sn << "\n"; | ||
|  |    cout << setw(55) << left << "Sample Mean" << "=  " << Sm << "\n"; | ||
|  |    cout << setw(55) << left << "Sample Standard Deviation" << "=  " << Sd << "\n"; | ||
|  |    cout << setw(55) << left << "Expected True Mean" << "=  " << M << "\n\n"; | ||
|  |    //
 | ||
|  |    // Now we can calculate and output some stats:
 | ||
|  |    //
 | ||
|  |    // Difference in means:
 | ||
|  |    double diff = Sm - M; | ||
|  |    cout << setw(55) << left << "Sample Mean - Expected Test Mean" << "=  " << diff << "\n"; | ||
|  |    // Degrees of freedom:
 | ||
|  |    unsigned v = Sn - 1; | ||
|  |    cout << setw(55) << left << "Degrees of Freedom" << "=  " << v << "\n"; | ||
|  |    // t-statistic:
 | ||
|  |    double t_stat = diff * sqrt(double(Sn)) / Sd; | ||
|  |    cout << setw(55) << left << "T Statistic" << "=  " << t_stat << "\n"; | ||
|  |    //
 | ||
|  |    // Finally define our distribution, and get the probability:
 | ||
|  |    //
 | ||
|  |    students_t dist(v); | ||
|  |    double q = cdf(complement(dist, fabs(t_stat))); | ||
|  |    cout << setw(55) << left << "Probability that difference is due to chance" << "=  " | ||
|  |       << setprecision(3) << scientific << 2 * q << "\n\n"; | ||
|  |    //
 | ||
|  |    // Finally print out results of alternative hypothesis:
 | ||
|  |    //
 | ||
|  |    cout << setw(55) << left << | ||
|  |       "Results for Alternative Hypothesis and alpha" << "=  " | ||
|  |       << setprecision(4) << fixed << alpha << "\n\n"; | ||
|  |    cout << "Alternative Hypothesis     Conclusion\n"; | ||
|  |    cout << "Mean != " << setprecision(3) << fixed << M << "            "; | ||
|  |    if(q < alpha / 2) | ||
|  |       cout << "NOT REJECTED\n"; | ||
|  |    else | ||
|  |       cout << "REJECTED\n"; | ||
|  |    cout << "Mean  < " << setprecision(3) << fixed << M << "            "; | ||
|  |    if(cdf(complement(dist, t_stat)) > alpha) | ||
|  |       cout << "NOT REJECTED\n"; | ||
|  |    else | ||
|  |       cout << "REJECTED\n"; | ||
|  |    cout << "Mean  > " << setprecision(3) << fixed << M << "            "; | ||
|  |    if(cdf(dist, t_stat) > alpha) | ||
|  |       cout << "NOT REJECTED\n"; | ||
|  |    else | ||
|  |       cout << "REJECTED\n"; | ||
|  |    cout << endl << endl; | ||
|  | } // void single_sample_t_test(
 | ||
|  | 
 | ||
|  | void single_sample_find_df(double M, double Sm, double Sd) | ||
|  | { | ||
|  |    //
 | ||
|  |    // M = true mean.
 | ||
|  |    // Sm = Sample Mean.
 | ||
|  |    // Sd = Sample Standard Deviation.
 | ||
|  |    //
 | ||
|  |   | ||
|  |    using boost::math::students_t; | ||
|  | 
 | ||
|  |    // Print out general info:
 | ||
|  |    cout << | ||
|  |       "_____________________________________________________________\n" | ||
|  |       "Estimated sample sizes required for various confidence levels\n" | ||
|  |       "_____________________________________________________________\n\n"; | ||
|  |    cout << setprecision(5); | ||
|  |    cout << setw(40) << left << "True Mean" << "=  " << M << "\n"; | ||
|  |    cout << setw(40) << left << "Sample Mean" << "=  " << Sm << "\n"; | ||
|  |    cout << setw(40) << left << "Sample Standard Deviation" << "=  " << Sd << "\n"; | ||
|  |    //
 | ||
|  |    // Define a table of significance intervals:
 | ||
|  |    //
 | ||
|  |    double alpha[] = { 0.5, 0.25, 0.1, 0.05, 0.01, 0.001, 0.0001, 0.00001 }; | ||
|  |    //
 | ||
|  |    // Print table header:
 | ||
|  |    //
 | ||
|  |    cout << "\n\n" | ||
|  |            "_______________________________________________________________\n" | ||
|  |            "Confidence       Estimated          Estimated\n" | ||
|  |            " Value (%)      Sample Size        Sample Size\n" | ||
|  |            "              (one sided test)    (two sided test)\n" | ||
|  |            "_______________________________________________________________\n"; | ||
|  |    //
 | ||
|  |    // Now print out the data for the table rows.
 | ||
|  |    //
 | ||
|  |    for(unsigned i = 1; i < sizeof(alpha)/sizeof(alpha[0]); ++i) | ||
|  |    { | ||
|  |       // Confidence value:
 | ||
|  |       cout << fixed << setprecision(3) << setw(10) << right << 100 * (1-alpha[i]); | ||
|  |       // calculate df for single sided test:
 | ||
|  |       double df = students_t::find_degrees_of_freedom( | ||
|  |          fabs(M - Sm), alpha[i], alpha[i], Sd); | ||
|  |       // convert to sample size, always one more than the degrees of freedom:
 | ||
|  |       double size = ceil(df) + 1; | ||
|  |       // Print size:
 | ||
|  |       cout << fixed << setprecision(0) << setw(16) << right << size; | ||
|  |       // calculate df for two sided test:
 | ||
|  |       df = students_t::find_degrees_of_freedom( | ||
|  |          fabs(M - Sm), alpha[i]/2, alpha[i], Sd); | ||
|  |       // convert to sample size:
 | ||
|  |       size = ceil(df) + 1; | ||
|  |       // Print size:
 | ||
|  |       cout << fixed << setprecision(0) << setw(16) << right << size << endl; | ||
|  |    } | ||
|  |    cout << endl; | ||
|  | } // void single_sample_find_df
 | ||
|  | 
 | ||
|  | int main() | ||
|  | { | ||
|  |    //
 | ||
|  |    // Run tests for Heat Flow Meter data
 | ||
|  |    // see http://www.itl.nist.gov/div898/handbook/eda/section4/eda428.htm
 | ||
|  |    // The data was collected while calibrating a heat flow meter
 | ||
|  |    // against a known value.
 | ||
|  |    //
 | ||
|  |    confidence_limits_on_mean(9.261460, 0.2278881e-01, 195); | ||
|  |    single_sample_t_test(5, 9.261460, 0.2278881e-01, 195, 0.05); | ||
|  |    single_sample_find_df(5, 9.261460, 0.2278881e-01); | ||
|  | 
 | ||
|  |    //
 | ||
|  |    // Data for this example from:
 | ||
|  |    // P.K.Hou, O. W. Lau & M.C. Wong, Analyst (1983) vol. 108, p 64.
 | ||
|  |    // from Statistics for Analytical Chemistry, 3rd ed. (1994), pp 54-55
 | ||
|  |    // J. C. Miller and J. N. Miller, Ellis Horwood ISBN 0 13 0309907
 | ||
|  |    //
 | ||
|  |    // Determination of mercury by cold-vapour atomic absorption,
 | ||
|  |    // the following values were obtained fusing a trusted
 | ||
|  |    // Standard Reference Material containing 38.9% mercury,
 | ||
|  |    // which we assume is correct or 'true'.
 | ||
|  |    //
 | ||
|  |    confidence_limits_on_mean(37.8, 0.964365, 3); | ||
|  |    // 95% test:
 | ||
|  |    single_sample_t_test(38.9, 37.8, 0.964365, 3, 0.05); | ||
|  |    // 90% test:
 | ||
|  |    single_sample_t_test(38.9, 37.8, 0.964365, 3, 0.1); | ||
|  |    // parameter estimate:
 | ||
|  |    single_sample_find_df(38.9, 37.8, 0.964365); | ||
|  | 
 | ||
|  |    return 0; | ||
|  | } // int main()
 | ||
|  | 
 | ||
|  | /*
 | ||
|  | 
 | ||
|  | Output: | ||
|  | 
 | ||
|  | ------ Rebuild All started: Project: students_t_single_sample, Configuration: Release Win32 ------ | ||
|  |   students_t_single_sample.cpp | ||
|  |   Generating code | ||
|  |   Finished generating code | ||
|  |   students_t_single_sample.vcxproj -> J:\Cpp\MathToolkit\test\Math_test\Release\students_t_single_sample.exe | ||
|  | __________________________________ | ||
|  | 2-Sided Confidence Limits For Mean | ||
|  | __________________________________ | ||
|  | 
 | ||
|  | Number of Observations                  =  195 | ||
|  | Mean                                    =  9.26146 | ||
|  | Standard Deviation                      =  0.02278881 | ||
|  | 
 | ||
|  | 
 | ||
|  | _______________________________________________________________ | ||
|  | Confidence       T           Interval          Lower          Upper | ||
|  |  Value (%)     Value          Width            Limit          Limit | ||
|  | _______________________________________________________________ | ||
|  |     50.000     0.676       1.103e-003        9.26036        9.26256 | ||
|  |     75.000     1.154       1.883e-003        9.25958        9.26334 | ||
|  |     90.000     1.653       2.697e-003        9.25876        9.26416 | ||
|  |     95.000     1.972       3.219e-003        9.25824        9.26468 | ||
|  |     99.000     2.601       4.245e-003        9.25721        9.26571 | ||
|  |     99.900     3.341       5.453e-003        9.25601        9.26691 | ||
|  |     99.990     3.973       6.484e-003        9.25498        9.26794 | ||
|  |     99.999     4.537       7.404e-003        9.25406        9.26886 | ||
|  | 
 | ||
|  | __________________________________ | ||
|  | Student t test for a single sample | ||
|  | __________________________________ | ||
|  | 
 | ||
|  | Number of Observations                                 =  195 | ||
|  | Sample Mean                                            =  9.26146 | ||
|  | Sample Standard Deviation                              =  0.02279 | ||
|  | Expected True Mean                                     =  5.00000 | ||
|  | 
 | ||
|  | Sample Mean - Expected Test Mean                       =  4.26146 | ||
|  | Degrees of Freedom                                     =  194 | ||
|  | T Statistic                                            =  2611.28380 | ||
|  | Probability that difference is due to chance           =  0.000e+000 | ||
|  | 
 | ||
|  | Results for Alternative Hypothesis and alpha           =  0.0500 | ||
|  | 
 | ||
|  | Alternative Hypothesis     Conclusion | ||
|  | Mean != 5.000            NOT REJECTED | ||
|  | Mean  < 5.000            REJECTED | ||
|  | Mean  > 5.000            NOT REJECTED | ||
|  | 
 | ||
|  | 
 | ||
|  | _____________________________________________________________ | ||
|  | Estimated sample sizes required for various confidence levels | ||
|  | _____________________________________________________________ | ||
|  | 
 | ||
|  | True Mean                               =  5.00000 | ||
|  | Sample Mean                             =  9.26146 | ||
|  | Sample Standard Deviation               =  0.02279 | ||
|  | 
 | ||
|  | 
 | ||
|  | _______________________________________________________________ | ||
|  | Confidence       Estimated          Estimated | ||
|  |  Value (%)      Sample Size        Sample Size | ||
|  |               (one sided test)    (two sided test) | ||
|  | _______________________________________________________________ | ||
|  |     75.000               2               2 | ||
|  |     90.000               2               2 | ||
|  |     95.000               2               2 | ||
|  |     99.000               2               2 | ||
|  |     99.900               3               3 | ||
|  |     99.990               3               3 | ||
|  |     99.999               4               4 | ||
|  | 
 | ||
|  | __________________________________ | ||
|  | 2-Sided Confidence Limits For Mean | ||
|  | __________________________________ | ||
|  | 
 | ||
|  | Number of Observations                  =  3 | ||
|  | Mean                                    =  37.8000000 | ||
|  | Standard Deviation                      =  0.9643650 | ||
|  | 
 | ||
|  | 
 | ||
|  | _______________________________________________________________ | ||
|  | Confidence       T           Interval          Lower          Upper | ||
|  |  Value (%)     Value          Width            Limit          Limit | ||
|  | _______________________________________________________________ | ||
|  |     50.000     0.816            0.455       37.34539       38.25461 | ||
|  |     75.000     1.604            0.893       36.90717       38.69283 | ||
|  |     90.000     2.920            1.626       36.17422       39.42578 | ||
|  |     95.000     4.303            2.396       35.40438       40.19562 | ||
|  |     99.000     9.925            5.526       32.27408       43.32592 | ||
|  |     99.900    31.599           17.594       20.20639       55.39361 | ||
|  |     99.990    99.992           55.673      -17.87346       93.47346 | ||
|  |     99.999   316.225          176.067     -138.26683      213.86683 | ||
|  | 
 | ||
|  | __________________________________ | ||
|  | Student t test for a single sample | ||
|  | __________________________________ | ||
|  | 
 | ||
|  | Number of Observations                                 =  3 | ||
|  | Sample Mean                                            =  37.80000 | ||
|  | Sample Standard Deviation                              =  0.96437 | ||
|  | Expected True Mean                                     =  38.90000 | ||
|  | 
 | ||
|  | Sample Mean - Expected Test Mean                       =  -1.10000 | ||
|  | Degrees of Freedom                                     =  2 | ||
|  | T Statistic                                            =  -1.97566 | ||
|  | Probability that difference is due to chance           =  1.869e-001 | ||
|  | 
 | ||
|  | Results for Alternative Hypothesis and alpha           =  0.0500 | ||
|  | 
 | ||
|  | Alternative Hypothesis     Conclusion | ||
|  | Mean != 38.900            REJECTED | ||
|  | Mean  < 38.900            NOT REJECTED | ||
|  | Mean  > 38.900            NOT REJECTED | ||
|  | 
 | ||
|  | 
 | ||
|  | __________________________________ | ||
|  | Student t test for a single sample | ||
|  | __________________________________ | ||
|  | 
 | ||
|  | Number of Observations                                 =  3 | ||
|  | Sample Mean                                            =  37.80000 | ||
|  | Sample Standard Deviation                              =  0.96437 | ||
|  | Expected True Mean                                     =  38.90000 | ||
|  | 
 | ||
|  | Sample Mean - Expected Test Mean                       =  -1.10000 | ||
|  | Degrees of Freedom                                     =  2 | ||
|  | T Statistic                                            =  -1.97566 | ||
|  | Probability that difference is due to chance           =  1.869e-001 | ||
|  | 
 | ||
|  | Results for Alternative Hypothesis and alpha           =  0.1000 | ||
|  | 
 | ||
|  | Alternative Hypothesis     Conclusion | ||
|  | Mean != 38.900            REJECTED | ||
|  | Mean  < 38.900            NOT REJECTED | ||
|  | Mean  > 38.900            REJECTED | ||
|  | 
 | ||
|  | 
 | ||
|  | _____________________________________________________________ | ||
|  | Estimated sample sizes required for various confidence levels | ||
|  | _____________________________________________________________ | ||
|  | 
 | ||
|  | True Mean                               =  38.90000 | ||
|  | Sample Mean                             =  37.80000 | ||
|  | Sample Standard Deviation               =  0.96437 | ||
|  | 
 | ||
|  | 
 | ||
|  | _______________________________________________________________ | ||
|  | Confidence       Estimated          Estimated | ||
|  |  Value (%)      Sample Size        Sample Size | ||
|  |               (one sided test)    (two sided test) | ||
|  | _______________________________________________________________ | ||
|  |     75.000               3               4 | ||
|  |     90.000               7               9 | ||
|  |     95.000              11              13 | ||
|  |     99.000              20              22 | ||
|  |     99.900              35              37 | ||
|  |     99.990              50              53 | ||
|  |     99.999              66              68 | ||
|  | 
 | ||
|  | */ | ||
|  | 
 |