sampling_distribution_in_r
Differences
This shows you the differences between two versions of the page.
Both sides previous revisionPrevious revisionNext revision | Previous revisionLast revisionBoth sides next revision | ||
sampling_distribution_in_r [2024/03/20 08:23] – hkimscil | sampling_distribution_in_r [2024/03/20 13:57] – [Sampling distribution in R e.g. 1] hkimscil | ||
---|---|---|---|
Line 1: | Line 1: | ||
====== Sampling distribution in R e.g. 1 ====== | ====== Sampling distribution in R e.g. 1 ====== | ||
< | < | ||
- | n.ajstu <- 1000000 | + | n.ajstu <- 100000 |
- | mean.ajstu <- 70 | + | mean.ajstu <- 100 |
sd.ajstu <- 10 | sd.ajstu <- 10 | ||
+ | |||
set.seed(1024) | set.seed(1024) | ||
ajstu <- rnorm2(n.ajstu, | ajstu <- rnorm2(n.ajstu, | ||
Line 9: | Line 10: | ||
mean(ajstu) | mean(ajstu) | ||
sd(ajstu) | sd(ajstu) | ||
- | iter <- 10000 | + | var(ajstu) |
+ | |||
+ | iter <- 10000 # # of sampling | ||
- | n <- 4 | + | n.4 <- 4 |
means4 <- rep (NA, iter) | means4 <- rep (NA, iter) | ||
for(i in 1:iter){ | for(i in 1:iter){ | ||
- | means4[i] = mean(sample(ajstu, | + | means4[i] = mean(sample(ajstu, |
} | } | ||
- | n <- 25 | + | n.25 <- 25 |
means25 <- rep (NA, iter) | means25 <- rep (NA, iter) | ||
for(i in 1:iter){ | for(i in 1:iter){ | ||
- | means25[i] = mean(sample(ajstu, | + | means25[i] = mean(sample(ajstu, |
} | } | ||
- | n <- 100 | + | n.100 <- 100 |
means100 <- rep (NA, iter) | means100 <- rep (NA, iter) | ||
for(i in 1:iter){ | for(i in 1:iter){ | ||
- | means100[i] = mean(sample(ajstu, | + | means100[i] = mean(sample(ajstu, |
} | } | ||
- | n <- 400 | + | n.400 <- 400 |
means400 <- rep (NA, iter) | means400 <- rep (NA, iter) | ||
for(i in 1:iter){ | for(i in 1:iter){ | ||
- | means400[i] = mean(sample(ajstu, | + | means400[i] = mean(sample(ajstu, |
} | } | ||
- | n <- 900 | + | n.900 <- 900 |
means900 <- rep (NA, iter) | means900 <- rep (NA, iter) | ||
for(i in 1:iter){ | for(i in 1:iter){ | ||
- | means900[i] = mean(sample(ajstu, | + | means900[i] = mean(sample(ajstu, |
} | } | ||
- | n <- 1600 | + | n.1600 <- 1600 |
means1600 <- rep (NA, iter) | means1600 <- rep (NA, iter) | ||
for(i in 1:iter){ | for(i in 1:iter){ | ||
- | means1600[i] = mean(sample(ajstu, | + | means1600[i] = mean(sample(ajstu, |
} | } | ||
- | n <- 2500 | + | n.2500 <- 2500 |
means2500 <- rep (NA, iter) | means2500 <- rep (NA, iter) | ||
for(i in 1:iter){ | for(i in 1:iter){ | ||
- | means2500[i] = mean(sample(ajstu, | + | means2500[i] = mean(sample(ajstu, |
} | } | ||
Line 68: | Line 71: | ||
plot(h900, add = T, col=" | plot(h900, add = T, col=" | ||
- | se4 <- sqrt(var(ajstu)/ | ||
- | se25 <- sqrt(var(ajstu)/ | ||
- | se100 <- sqrt(var(ajstu)/ | ||
- | se400 <- sqrt(var(ajstu)/ | ||
- | se900 <- sqrt(var(ajstu)/ | ||
- | se1600 <- sqrt(var(ajstu)/ | ||
- | se2500 <- sqrt(var(ajstu)/ | ||
- | sss <- c(4, | + | sss <- c(4, |
- | ses <- rep (NA, length(sss)) | + | ses <- rep (NA, length(sss)) |
for(i in 1: | for(i in 1: | ||
ses[i] = sqrt(var(ajstu)/ | ses[i] = sqrt(var(ajstu)/ | ||
} | } | ||
+ | |||
+ | ses | ||
se.1 <- ses | se.1 <- ses | ||
- | se.2 <- 2*ses | + | se.2 <- 2 * ses |
- | lower.part.2 <- mean(ajstu)-se.2 | + | |
- | upper.part.2 <- mean(ajstu)+se.2 | + | |
- | data.frame(cbind(lower.part.2, | + | |
+ | lower.s2 <- mean(ajstu)-se.2 | ||
+ | upper.s2 <- mean(ajstu)+se.2 | ||
+ | data.frame(cbind(sss, | ||
</ | </ | ||
+ | |||
+ | < | ||
+ | # n =1600 일 경우에 | ||
+ | # sample의 평균이 100.15보다 작을 | ||
+ | # 확률은 어떻게 구해야 할까? | ||
+ | |||
+ | # n = 1600 일 경우에 | ||
+ | # sampling distribution은 | ||
+ | # Xbar ~ N(100, var(ajstu)/ | ||
+ | # 그리고, 위에서 standard error값은 | ||
+ | # sqrt(var(ajstu)/ | ||
+ | # 이것을 standard error라고 부른다 | ||
+ | # 따라서 | ||
+ | pnorm(100.15, | ||
+ | </ | ||
+ | |||
{{: | {{: | ||
===== Sampling distribution in proportion in R ===== | ===== Sampling distribution in proportion in R ===== |
sampling_distribution_in_r.txt · Last modified: 2024/03/20 14:15 by hkimscil