multicolinearity [2018/12/26 02:45]
Line 217: Line 217:
 > </code> > </code>
 +====== regression test with factors ======
 <code> <code>
 +> cps$sex <- factor(cps$sex)
 +> cps$union <- factor(cps$union)
 +> cps$race <- factor(cps$race)
 +> cps$sector <- factor(cps$sector)
 +> cps$occupation <- factor(cps$occupation)
 +> cps$marr <- factor(cps$marr)
 +> str(cps)
 +'data.frame': 534 obs. of  11 variables:
 + $ education : int  8 9 12 12 12 13 10 12 16 12 ...
 + $ south     : int  0 0 0 0 0 0 1 0 0 0 ...
 + $ sex       : Factor w/ 2 levels "0","1": 2 2 1 1 1 1 1 1 1 1 ...
 + $ experience: int  21 42 1 4 17 9 27 9 11 9 ...
 + $ union     : Factor w/ 2 levels "0","1": 1 1 1 1 1 2 1 1 1 1 ...
 + $ wage      : num  5.1 4.95 6.67 4 7.5 ...
 + $ age       : int  35 57 19 22 35 28 43 27 33 27 ...
 + $ race      : Factor w/ 3 levels "1","2","3": 2 3 3 3 3 3 3 3 3 3 ...
 + $ occupation: Factor w/ 6 levels "1","2","3","4",..: 6 6 6 6 6 6 6 6 6 6 ...
 + $ sector    : Factor w/ 3 levels "0","1","2": 2 2 2 1 1 1 1 1 2 1 ...
 + $ marr      : Factor w/ 2 levels "0","1": 2 2 1 1 2 1 1 1 2 1 ...
 </code> </code>
 <code> <code>
 +> lm4 = lm(log(cps$wage) ~ . -age, data = cps)
 +> summary(lm4)
 +Call:
 +lm(formula = log(cps$wage) ~ . - age, data = cps)
 +Residuals:
 +     Min       1Q   Median       3Q      Max 
 +-2.36103 -0.28080  0.00362  0.27793  1.79594 
 +Coefficients:
 +             Estimate Std. Error t value Pr(>|t|)    
 +(Intercept)  1.194821   0.181804   6.572 1.21e-10 ***
 +education    0.066603   0.010060   6.621 8.96e-11 ***
 +south       -0.093384   0.041931  -2.227  0.02637 *  
 +sex1        -0.216934   0.041844  -5.184 3.11e-07 ***
 +experience   0.009371   0.001725   5.431 8.63e-08 ***
 +union1       0.211506   0.051218   4.129 4.24e-05 ***
 +race2       -0.033928   0.099051  -0.343  0.73209    
 +race3        0.079851   0.057392   1.391  0.16472    
 +occupation2 -0.364444   0.091500  -3.983 7.78e-05 ***
 +occupation3 -0.210295   0.076175  -2.761  0.00597 ** 
 +occupation4 -0.383882   0.080990  -4.740 2.77e-06 ***
 +occupation5 -0.050664   0.072717  -0.697  0.48628    
 +occupation6 -0.265348   0.079969  -3.318  0.00097 ***
 +sector1      0.114857   0.054862   2.094  0.03678 *  
 +sector2      0.093138   0.096514   0.965  0.33499    
 +marr1        0.062211   0.041025   1.516  0.13002    
 +---
 +Signif. codes:  0 ‘***’ 0.001 ‘**’ 0.01 ‘*’ 0.05 ‘.’ 0.1 ‘ ’ 1
 +Residual standard error: 0.4278 on 518 degrees of freedom
 +Multiple R-squared:  0.3614, Adjusted R-squared:  0.3429 
 +F-statistic: 19.54 on 15 and 518 DF,  p-value: < 2.2e-16
 </code> </code>
multicolinearity.txt · Last modified: 2018/12/26 02:49

