> clientes <- 1:50 > clientes
[1] 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 [26] 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50
> set.seed(16) > amostra <- sample(clientes, 10, replace = FALSE) > amostra
[1] 35 12 22 11 40 15 4 36 37 6
> sort(amostra)
[1] 4 6 11 12 15 22 35 36 37 40
> arq <- 1:5000 > head(arq)
[1] 1 2 3 4 5 6
> N <- 5000 > n <- 1000
> k <- N/n > k
[1] 5
> amostra2 <- seq(2, 5000, k) > head(amostra2)
[1] 2 7 12 17 22 27
> vet1.8 <- c(9, 12, 8, 10, 14, 7, 10) > vet1.8
[1] 9 12 8 10 14 7 10
> media <- mean(vet1.8) > media
[1] 10
> dados <- c(1, 1, 0, 0, 0, 0, 0, 1, 0, 1) > dados
[1] 1 1 0 0 0 0 0 1 0 1
> media <- mean(dados) > media
[1] 0.4
> renda <- c(500, rep(550, 3), rep(600, 2), 700, 750) > renda
[1] 500 550 550 550 600 600 700 750
> mediana <- median(renda) > mediana
[1] 575
> media <- mean(renda) > media
[1] 600
> tab1.7 <- c(547, 441, 123, 25) > names(tab1.7) <- c("O", "A", "B", "AB") > tab1.7
O A B AB 547 441 123 25
> soma <- sum(tab1.7) > moda <- max(tab1.7) > moda
[1] 547
> A <- c(3, 4, 4, 5, 5, 6, 7, 8) > A
[1] 3 4 4 5 5 6 7 8
> require(dprep) > moda(A)
[1] 5 4
> B <- 3:9 > B
[1] 3 4 5 6 7 8 9
> moda(B)
[1] 9 8 7 6 5 4 3
> notasA <- data.frame(aluno = c(1:4), nota = rep(5, 4)) > notasA
aluno nota 1 1 5 2 2 5 3 3 5 4 4 5
> notasB <- data.frame(aluno = c(1:4), nota = c(10, 0, 10, 0)) > notasB
aluno nota 1 1 10 2 2 0 3 3 10 4 4 0
> media <- c(mean(notasA$nota), mean(notasB$nota)) > media
[1] 5 5
> names(media) <- c("A", "B") > media
A B 5 5
> mediana <- c(median(notasA$nota), median(notasB$nota)) > mediana
[1] 5 5
> names(mediana) <- c("A", "B") > mediana
A B 5 5
> require(dprep) > moda <- c(moda(notasA$nota), NA) > moda
[1] 5 NA
> names(moda) <- c("A", "B") > moda
A B 5 NA
> notas <- c(5, 6, 9, 10, 10) > notas
[1] 5 6 9 10 10
> m <- mean(notas) > m
[1] 8
> #Elevando ao quadrado e depois tirando a raíz, temos os mesmos números, porém positivos. Ou seja, o módulo! > dm <- sum(sqrt((notas-m)^2))/length(notas) > dm
[1] 2
> peso <- c(2.5, 2.45, 4.15, 3.3, 2.86, 3.45, 3.48, 2.33, 3.7, + 3.15) > peso
[1] 2.50 2.45 4.15 3.30 2.86 3.45 3.48 2.33 3.70 3.15
> desvios <- c(-0.63, -0.69, 1.01, 0.16, -0.28, 0.31, 0.34, -0.81, + 0.56, 0.01) > desvios
[1] -0.63 -0.69 1.01 0.16 -0.28 0.31 0.34 -0.81 0.56 0.01
> desvm <- sum(sqrt((desvios)^2))/length(peso) > desvm
[1] 0.48
> notas10 <- c(5, 6, 9, 10, 10) * 10 > notas10
[1] 50 60 90 100 100
> var <- var(notas) * 100 > var
[1] 550
> var10 <- var(notas10) > var10
[1] 550
> peso <- c(68, 70, 86, 55, 75, 90) > peso
[1] 68 70 86 55 75 90
> altura <- c(170, 160, 164, 164, 170, 180) > altura
[1] 170 160 164 164 170 180
> varpeso <- (mean(peso^2)-(mean(peso)^2)) > varaltura <- (mean(altura^2)-(mean(altura)^2)) > dp.peso <- sqrt(varpeso) > dp.peso
[1] 11.64760
> dp.altura <- sqrt(varaltura) > dp.altura
[1] 6.4291
> media.peso <- mean(peso) > media.peso
[1] 74
> media.altura <- mean(altura) > media.altura
[1] 168
> #OS coeficientes de variação estão em porcentagem (%). > coef.peso <- 100*dp.peso/media.peso > coef.peso
[1] 15.74000
> coef.altura <- 100*dp.altura/media.altura > coef.altura
[1] 3.826846
> amostra <- c(3, 1.5, 2.5, 3.5, 4, 2, 3.5, 2, 1.5) > amostra
[1] 3.0 1.5 2.5 3.5 4.0 2.0 3.5 2.0 1.5
> a.ord <- sort(amostra) > a.ord
[1] 1.5 1.5 2.0 2.0 2.5 3.0 3.5 3.5 4.0
> q1 <- quantile(a.ord, 0.25, t = 4) > q1
25% 1.625
> q3 <- quantile(a.ord, 0.75, t = 4) > q3
75% 3.375
> freqA <- c(40, 30, 20, 10) > names(freqA) <- c("A", "B", "C", "D") > freqA
A B C D 40 30 20 10
> freqR <- c(0.4, 0.3, 0.2, 0.1) > names(freqR) <- c("A", "B", "C", "D") > freqR
A B C D 0.4 0.3 0.2 0.1
> sum(freqA)
[1] 100
> sum(freqR)
[1] 1
> pie(freqA)
> freqA <- c(52, 38, 43, 22, 11, 6) > names(freqA) <- c("0", "1", "2", "3", "4", "5") > freqA
0 1 2 3 4 5 52 38 43 22 11 6
> freqR <- c(0.302, 0.221, 0.25, 0.128, 0.064, 0.035) > names(freqR) <- c("0", "1", "2", "3", "4", "5") > freqR
0 1 2 3 4 5 0.302 0.221 0.250 0.128 0.064 0.035
> x <- 0:5
> barplot(freqA, xlab = "numero de filhos", ylab = "frequencia")
> freqA <- c(5, 10, 13, 16, 11, 9, 6) > freqA
[1] 5 10 13 16 11 9 6
> pond <- c(rep(1, 5), rep(3, 10), rep(5, 13), rep(7, 16), rep(9, + 11), rep(11, 9), rep(13, 6)) > hist(pond, xlab = "estresse", ylab = "frequencia", main = "nivel de estresse")
> caixas <- c(22, 29, 33, 35, 35, 37, 38, 43, 43, 44, 48, 48, 52, + 53, 55, 57, 61, 62, 67, 69) > caixas
[1] 22 29 33 35 35 37 38 43 43 44 48 48 52 53 55 57 61 62 67 69
> w <- summary(caixas) > w
Min. 1st Qu. Median Mean 3rd Qu. Max. 22.00 36.50 46.00 46.55 55.50 69.00
> boxplot(caixas, ylab="laranjas")
> t1 <- matrix(c(1:12, 25, 23, 17, 14, 11, 13, 9, 10, 11, 9, 20, + 22), nrow = 2, b = T) > t1
[,1] [,2] [,3] [,4] [,5] [,6] [,7] [,8] [,9] [,10] [,11] [,12] [1,] 1 2 3 4 5 6 7 8 9 10 11 12 [2,] 25 23 17 14 11 13 9 10 11 9 20 22
> dimnames(t1) <- list(c("mes", "vendas"), c("jan", "fev", "mar", + "abr", "mai", "jun", "jul", "ago", "set", "out", "nov", "dez")) > t1
jan fev mar abr mai jun jul ago set out nov dez mes 1 2 3 4 5 6 7 8 9 10 11 12 vendas 25 23 17 14 11 13 9 10 11 9 20 22
> plot(t1[1, ], t1[2, ], ty = "l", xlab = "mes", ylab = "qtde vendida")