X-Git-Url: https://pintos-os.org/cgi-bin/gitweb.cgi?a=blobdiff_plain;f=tests%2Flanguage%2Fstats%2Fregression.at;h=2547fd6529943ae1498a3bad81f323d1630080b4;hb=899e0af5a1de32d108cb27fdca2c8c105f5bdd45;hp=7548160079b2e14d195c16dbe841dd55759fdcdf;hpb=0df9cdd3df66caf4353128feff3008289cda8115;p=pspp diff --git a/tests/language/stats/regression.at b/tests/language/stats/regression.at index 7548160079..2547fd6529 100644 --- a/tests/language/stats/regression.at +++ b/tests/language/stats/regression.at @@ -1,9 +1,26 @@ +dnl PSPP - a program for statistical analysis. +dnl Copyright (C) 2017 Free Software Foundation, Inc. +dnl +dnl This program is free software: you can redistribute it and/or modify +dnl it under the terms of the GNU General Public License as published by +dnl the Free Software Foundation, either version 3 of the License, or +dnl (at your option) any later version. +dnl +dnl This program is distributed in the hope that it will be useful, +dnl but WITHOUT ANY WARRANTY; without even the implied warranty of +dnl MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +dnl GNU General Public License for more details. +dnl +dnl You should have received a copy of the GNU General Public License +dnl along with this program. If not, see . +dnl AT_BANNER([LINEAR REGRESSION]) AT_SETUP([LINEAR REGRESSION - basic]) AT_DATA([regression.sps], [dnl set format = F22.3. data list notable list / v0 to v2. +filter by v0. begin data 0.65377128 7.735648 -23.97588 -0.13087553 6.142625 -19.63854 @@ -21,22 +38,24 @@ list. ]) AT_CHECK([pspp -O format=csv regression.sps], [0], [dnl +regression.sps:16: warning: REGRESSION: REGRESSION with SAVE ignores FILTER. All cases will be processed. + Table: Model Summary (v2) -,R,R Square,Adjusted R Square,Std. Error of the Estimate -,.971,.942,.925,1.337 +R,R Square,Adjusted R Square,Std. Error of the Estimate +.971,.942,.925,1.337 Table: ANOVA (v2) -,,Sum of Squares,df,Mean Square,F,Sig. -,Regression,202.753,2,101.376,56.754,.000 -,Residual,12.504,7,1.786,, -,Total,215.256,9,,, +,Sum of Squares,df,Mean Square,F,Sig. +Regression,202.753,2,101.376,56.754,.000 +Residual,12.504,7,1.786,, +Total,215.256,9,,, Table: Coefficients (v2) -,,Unstandardized Coefficients,,Standardized Coefficients,, -,,B,Std. Error,Beta,t,Sig. -,(Constant),2.191,2.357,.000,.930,.380 -,v0,1.813,1.053,.171,1.722,.129 -,v1,-3.427,.332,-1.026,-10.334,.000 +,Unstandardized Coefficients,,Standardized Coefficients,t,Sig. +,B,Std. Error,Beta,, +(Constant),2.191,2.357,.000,.930,.380 +v0,1.813,1.053,.171,1.722,.129 +v1,-3.427,.332,-1.026,-10.334,.000 Table: Data List v0,v1,v2,RES1,PRED1 @@ -77,38 +96,38 @@ list. AT_CHECK([pspp -O format=csv regression.sps], [0], [dnl Table: Model Summary (v2) -,R,R Square,Adjusted R Square,Std. Error of the Estimate -,.971,.942,.925,1.337 +R,R Square,Adjusted R Square,Std. Error of the Estimate +.971,.942,.925,1.337 Table: ANOVA (v2) -,,Sum of Squares,df,Mean Square,F,Sig. -,Regression,202.753,2,101.376,56.754,.000 -,Residual,12.504,7,1.786,, -,Total,215.256,9,,, +,Sum of Squares,df,Mean Square,F,Sig. +Regression,202.753,2,101.376,56.754,.000 +Residual,12.504,7,1.786,, +Total,215.256,9,,, Table: Coefficients (v2) -,,Unstandardized Coefficients,,Standardized Coefficients,, -,,B,Std. Error,Beta,t,Sig. -,(Constant),2.191,2.357,.000,.930,.380 -,v0,1.813,1.053,.171,1.722,.129 -,v1,-3.427,.332,-1.026,-10.334,.000 +,Unstandardized Coefficients,,Standardized Coefficients,t,Sig. +,B,Std. Error,Beta,, +(Constant),2.191,2.357,.000,.930,.380 +v0,1.813,1.053,.171,1.722,.129 +v1,-3.427,.332,-1.026,-10.334,.000 Table: Model Summary (v2) -,R,R Square,Adjusted R Square,Std. Error of the Estimate -,.971,.942,.925,1.337 +R,R Square,Adjusted R Square,Std. Error of the Estimate +.971,.942,.925,1.337 Table: ANOVA (v2) -,,Sum of Squares,df,Mean Square,F,Sig. -,Regression,202.753,2,101.376,56.754,.000 -,Residual,12.504,7,1.786,, -,Total,215.256,9,,, +,Sum of Squares,df,Mean Square,F,Sig. +Regression,202.753,2,101.376,56.754,.000 +Residual,12.504,7,1.786,, +Total,215.256,9,,, Table: Coefficients (v2) -,,Unstandardized Coefficients,,Standardized Coefficients,, -,,B,Std. Error,Beta,t,Sig. -,(Constant),2.191,2.357,.000,.930,.380 -,v0,1.813,1.053,.171,1.722,.129 -,v1,-3.427,.332,-1.026,-10.334,.000 +,Unstandardized Coefficients,,Standardized Coefficients,t,Sig. +,B,Std. Error,Beta,, +(Constant),2.191,2.357,.000,.930,.380 +v0,1.813,1.053,.171,1.722,.129 +v1,-3.427,.332,-1.026,-10.334,.000 Table: Data List v0,v1,v2,RES1,PRED1 @@ -1767,20 +1786,20 @@ v0,F8.0 v1,F8.0 Table: Model Summary (v0) -,R,R Square,Adjusted R Square,Std. Error of the Estimate -,.05,.00,.00,8.11 +R,R Square,Adjusted R Square,Std. Error of the Estimate +.05,.00,.00,8.11 Table: ANOVA (v0) -,,Sum of Squares,df,Mean Square,F,Sig. -,Regression,235.23,1,235.23,3.58,.059 -,Residual,98438.40,1498,65.71,, -,Total,98673.63,1499,,, +,Sum of Squares,df,Mean Square,F,Sig. +Regression,235.23,1,235.23,3.58,.059 +Residual,98438.40,1498,65.71,, +Total,98673.63,1499,,, Table: Coefficients (v0) -,,Unstandardized Coefficients,,Standardized Coefficients,, -,,B,Std. Error,Beta,t,Sig. -,(Constant),1.24,.42,.00,2.95,.003 -,v1,1.37,.72,.05,1.89,.059 +,Unstandardized Coefficients,,Standardized Coefficients,t,Sig. +,B,Std. Error,Beta,, +(Constant),1.24,.42,.00,2.95,.003 +v1,1.37,.72,.05,1.89,.059 ]) AT_CLEANUP @@ -2106,24 +2125,335 @@ regression AT_CHECK([pspp -O format=csv conf.sps], [0], [dnl Table: Model Summary (science) -,R,R Square,Adjusted R Square,Std. Error of the Estimate -,.699,.489,.479,7.148 +R,R Square,Adjusted R Square,Std. Error of the Estimate +.699,.489,.479,7.148 Table: ANOVA (science) -,,Sum of Squares,df,Mean Square,F,Sig. -,Regression,9543.721,4,2385.930,46.695,.000 -,Residual,9963.779,195,51.096,, -,Total,19507.500,199,,, +,Sum of Squares,df,Mean Square,F,Sig. +Regression,9543.721,4,2385.930,46.695,.000 +Residual,9963.779,195,51.096,, +Total,19507.500,199,,, Table: Coefficients (science) -,,Unstandardized Coefficients,,Standardized Coefficients,,,95% Confidence Interval for B, -,,B,Std. Error,Beta,t,Sig.,Lower Bound,Upper Bound -,(Constant),12.325,3.194,.000,3.859,.000,6.027,18.624 -,math,.389,.074,.368,5.252,.000,.243,.535 -,female,-2.010,1.023,-.101,-1.965,.051,-4.027,.007 -,socst,.050,.062,.054,.801,.424,-.073,.173 -,read,.335,.073,.347,4.607,.000,.192,.479 +,Unstandardized Coefficients,,Standardized Coefficients,t,Sig.,95% Confidence Interval for B, +,B,Std. Error,Beta,,,Lower Bound,Upper Bound +(Constant),12.325,3.194,.000,3.859,.000,6.027,18.624 +math,.389,.074,.368,5.252,.000,.243,.535 +female,-2.010,1.023,-.101,-1.965,.051,-4.027,.007 +socst,.050,.062,.054,.801,.424,-.073,.173 +read,.335,.073,.347,4.607,.000,.192,.479 +]) + + +AT_CLEANUP + + +dnl Checks for regression against bug #44877. +AT_SETUP([LINEAR REGRESSION crash with long string variables]) +AT_DATA([regression.sps], [dnl +SET DECIMAL=DOT. + +DATA LIST notable LIST /text (A24) Y * X1 * +BEGIN DATA. +V00276601 0.00 90.00 +V00292909 10.00 30.00 +V00291204 20.00 20.00 +V00300070 0.00 90.00 +END DATA. + +REGRESSION +/VARIABLES= Y +/DEPENDENT= X1 +/METHOD=ENTER +/STATISTICS=COEFF R ANOVA +/SAVE= RESID. + +LIST. +]) +AT_CHECK([pspp -o pspp.csv regression.sps]) +AT_CHECK([cat pspp.csv], [0], [dnl +Table: Model Summary (X1) +R,R Square,Adjusted R Square,Std. Error of the Estimate +.95,.89,.84,15.08 + +Table: ANOVA (X1) +,Sum of Squares,df,Mean Square,F,Sig. +Regression,3820.45,1,3820.45,16.81,.055 +Residual,454.55,2,227.27,, +Total,4275.00,3,,, + +Table: Coefficients (X1) +,Unstandardized Coefficients,,Standardized Coefficients,t,Sig. +,B,Std. Error,Beta,, +(Constant),85.45,10.16,.00,8.41,.004 +Y,-3.73,.91,-.95,-4.10,.055 + +Table: Data List +text,Y,X1,RES1 +V00276601,.00,90.00,4.55 +V00292909,10.00,30.00,-18.18 +V00291204,20.00,20.00,9.09 +V00300070,.00,90.00,4.55 +]) +AT_CLEANUP + + +dnl Test for a crash which happened on bad input syntax +AT_SETUP([LINEAR REGRESSION -- Empty Parentheses]) + +AT_DATA([empty-parens.sps], [dnl +set format = F22.3. + +data list notable list /math female socst read science * +begin data. + 58.00 1.00 61.00 55.00 58.00 + 65.00 1.00 61.00 63.00 53.00 +end data. + +regression + /variables = math female socst read + /statistics = coeff r anova ci () + /dependent = science + /method = enter ]) +AT_CHECK([pspp -o pspp.csv empty-parens.sps], [1], [ignore]) + +AT_CLEANUP + + + + +AT_SETUP([LINEAR REGRESSION varibles on ENTER subcommand]) +AT_DATA([regression.sps], [dnl +SET FORMAT=F10.3. + +DATA LIST notable LIST /number * value *. +BEGIN DATA + 16 7.25 + 0 .00 + 1 .10 + 9 27.9 + 0 .00 + 7 3.65 + 14 16.8 + 24 9.15 + 0 .00 + 24 19.0 + 7 4.05 + 12 7.90 + 6 .75 + 11 1.40 + 0 .00 + 3 2.30 + 12 7.60 + 11 6.80 + 16 8.65 +END DATA. + +REGRESSION + /STATISTICS COEFF R ANOVA + /DEPENDENT value + /METHOD=ENTER number. +]) + + +AT_CHECK([pspp -O format=csv regression.sps], [0], [dnl +Table: Model Summary (value) +R,R Square,Adjusted R Square,Std. Error of the Estimate +.612,.374,.338,6.176 + +Table: ANOVA (value) +,Sum of Squares,df,Mean Square,F,Sig. +Regression,388.065,1,388.065,10.173,.005 +Residual,648.498,17,38.147,, +Total,1036.563,18,,, + +Table: Coefficients (value) +,Unstandardized Coefficients,,Standardized Coefficients,t,Sig. +,B,Std. Error,Beta,, +(Constant),.927,2.247,.000,.413,.685 +number,.611,.192,.612,3.189,.005 +]) + +AT_CLEANUP + + + +AT_SETUP([LINEAR REGRESSION /ORIGIN]) +AT_DATA([regression-origin.sps], [dnl +SET FORMAT=F10.3. + +DATA LIST notable LIST /number * value *. +BEGIN DATA + 16 7.25 + 0 .00 + 1 .10 + 9 27.9 + 0 .00 + 7 3.65 + 14 16.8 + 24 9.15 + 0 .00 + 24 19.0 + 7 4.05 + 12 7.90 + 6 .75 + 11 1.40 + 0 .00 + 3 2.30 + 12 7.60 + 11 6.80 + 16 8.65 +END DATA. + +REGRESSION + /STATISTICS COEFF R ANOVA + /DEPENDENT value + /ORIGIN + /METHOD=ENTER number. +]) + + +AT_CHECK([pspp -O format=csv regression-origin.sps], [0], [dnl +Table: Model Summary (value) +R,R Square,Adjusted R Square,Std. Error of the Estimate +.802,.643,.622,6.032 + +Table: ANOVA (value) +,Sum of Squares,df,Mean Square,F,Sig. +Regression,1181.726,1,1181.726,32.475,.000 +Residual,654.989,18,36.388,, +Total,1836.715,19,,, + +Table: Coefficients (value) +,Unstandardized Coefficients,,Standardized Coefficients,t,Sig. +,B,Std. Error,Beta,, +number,.672,.118,.802,5.699,.000 +]) + +AT_CLEANUP + +dnl This is an example from doc/tutorial.texi +dnl So if the results of this have to be changed in any way, +dnl make sure to update that file. +AT_SETUP([REGRESSION tutorial example]) +cp $top_srcdir/examples/repairs.sav . +AT_DATA([regression.sps], [dnl +GET FILE='repairs.sav'. +REGRESSION /VARIABLES=mtbf duty_cycle /DEPENDENT=mttr. +REGRESSION /VARIABLES=mtbf /DEPENDENT=mttr. +]) +AT_CHECK([pspp -o pspp.csv -o pspp.txt regression.sps]) +AT_CHECK([cat pspp.csv], [0], [dnl +Table: Model Summary (Mean time to repair (hours) ) +R,R Square,Adjusted R Square,Std. Error of the Estimate +.99,.99,.99,2.24 + +Table: ANOVA (Mean time to repair (hours) ) +,Sum of Squares,df,Mean Square,F,Sig. +Regression,5308.87,2,2654.44,530.75,.000 +Residual,60.02,12,5.00,, +Total,5368.89,14,,, + +Table: Coefficients (Mean time to repair (hours) ) +,Unstandardized Coefficients,,Standardized Coefficients,t,Sig. +,B,Std. Error,Beta,, +(Constant),9.81,1.50,.00,6.54,.000 +Mean time between failures (months) ,3.10,.10,.99,32.43,.000 +Ratio of working to non-working time,1.09,1.78,.02,.61,.552 + +Table: Model Summary (Mean time to repair (hours) ) +R,R Square,Adjusted R Square,Std. Error of the Estimate +.99,.99,.99,2.18 + +Table: ANOVA (Mean time to repair (hours) ) +,Sum of Squares,df,Mean Square,F,Sig. +Regression,5307.00,1,5307.00,1114.73,.000 +Residual,61.89,13,4.76,, +Total,5368.89,14,,, + +Table: Coefficients (Mean time to repair (hours) ) +,Unstandardized Coefficients,,Standardized Coefficients,t,Sig. +,B,Std. Error,Beta,, +(Constant),10.50,.96,.00,10.96,.000 +Mean time between failures (months) ,3.11,.09,.99,33.39,.000 +]) +AT_CLEANUP + + +AT_SETUP([LINEAR REGRESSION vif]) +AT_DATA([regression-vif.sps], [dnl +SET FORMAT=F10.3. + +data list notable list /competence_x1 motivation_x2 performance_y. +begin data +32 34 36 +35 37 39 +38 45 49 +31 41 41 +36 40 38 +32 38 36 +33 39 37 +31 40 41 +30 37 40 +35 37 43 +31 34 36 +34 32 35 +31 42 34 +25 36 40 +35 42 40 +36 41 44 +30 38 32 +34 41 41 +34 41 44 +22 27 26 +27 26 33 +30 30 35 +30 35 37 +37 39 44 +29 35 36 +31 35 29 +31 45 41 +29 30 32 +29 35 36 +31 37 37 +36 45 42 +32 44 39 +27 26 31 +33 39 35 +20 25 28 +30 36 39 +27 37 39 +25 39 36 +32 38 38 +32 38 35 +end data. + +regression /variables=competence_x1 motivation_x2 + /statistics=defaults tol + /dependent=performance_y + . +]) + + +AT_CHECK([pspp -O format=csv regression-vif.sps], [0], [dnl +Table: Model Summary (performance_y) +R,R Square,Adjusted R Square,Std. Error of the Estimate +.785,.616,.595,2.980 + +Table: ANOVA (performance_y) +,Sum of Squares,df,Mean Square,F,Sig. +Regression,526.494,2,263.247,29.641,.000 +Residual,328.606,37,8.881,, +Total,855.100,39,,, + +Table: Coefficients (performance_y) +,Unstandardized Coefficients,,Standardized Coefficients,t,Sig.,Collinearity Statistics, +,B,Std. Error,Beta,,,Tolerance,VIF +(Constant),7.220,4.020,.000,1.796,.080,, +competence_x1,.432,.166,.358,2.609,.013,.552,1.812 +motivation_x2,.453,.125,.499,3.636,.001,.552,1.812 +]) AT_CLEANUP