Professional Documents
Culture Documents
Grupo 9 - Melgar, L., Fiallos, B., Ladines, D., Rodríguez, D., Zambrano, J.
11/8/2021
## speed dist
## Min. : 4.0 Min. : 2.00
## 1st Qu.:12.0 1st Qu.: 26.00
## Median :15.0 Median : 36.00
## Mean :15.4 Mean : 42.98
## 3rd Qu.:19.0 3rd Qu.: 56.00
## Max. :25.0 Max. :120.00
# Draw a simple random sample of n rows (without replacement) from `cars`
# and print it.
# NOTE(review): no seed is set in this chunk, so the sampled rows change on
# every run; call set.seed() first if the report must be reproducible.
n = 20
# seq_len() is safe even for a zero-row table, and the sample size comes from
# n instead of being repeated as a literal.
indices = sample(seq_len(nrow(cars)), n)
carsMuestreado = cars[indices, ]
carsMuestreado
## speed dist
## 19 13 46
## 45 23 54
## 28 16 40
## 27 16 32
## 7 10 18
## 15 12 28
## 33 18 56
## 11 11 28
## 42 20 56
## 4 7 22
## 9 10 34
## 36 19 36
## 13 12 20
## 24 15 20
## 16 13 26
## 35 18 84
## 46 24 70
## 37 19 46
## 18 13 34
## 47 24 92
Variable Speed
muestraSpeed = carsMuestreado[,1]
library(fdth)
##
## Attaching package: 'fdth'
k = nclass.Sturges(muestraSpeed)
tablaS = fdt(muestraSpeed, breaks = "Sturges", right = FALSE)
tablaS
##
## Attaching package: 'modeest'
mean(muestraSpeed)
## [1] 15.65
median(muestraSpeed)
## [1] 15.5
## [1] 13
summary(muestraSpeed)
RI = IQR(muestraSpeed)
RI
## [1] 7
## [1] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
FALSE
## [13] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
sum(v_logico1)
## [1] 0
## [1] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
FALSE
## [13] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
sum(v_logico2)
## [1] 0
var(muestraSpeed)
## [1] 23.92368
sd(muestraSpeed)
## [1] 4.891184
cv = (sd(muestraSpeed)/mean(muestraSpeed)) * 100
cv
## [1] 31.25357
Variable Dist
muestraDist = carsMuestreado[,2]
library(fdth)
k = nclass.Sturges(muestraDist)
tablaD = fdt(muestraDist, breaks = "Sturges", right = FALSE)
tablaD
mean(muestraDist)
## [1] 42.1
median(muestraDist)
## [1] 35
## [1] 20 28 34 46 56
summary(muestraDist)
## 5% 95%
## 19.9 84.4
RI = IQR(muestraDist)
RI
## [1] 27
## [1] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
FALSE
## [13] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
sum(v_logico1)
## [1] 0
sum(v_logico2)
## [1] 0
var(muestraDist)
## [1] 446.0947
sd(muestraDist)
## [1] 21.12095
cv = (sd(muestraDist)/mean(muestraDist)) * 100
cv
## [1] 50.16854
Descriptivo Bivariado
corrMuestras = cor(muestraSpeed, muestraDist)
corrMuestras
## [1] 0.7839219
## [1] 80.98421
matrizMuestra = pairs(carsMuestreado)
Regresión Lineal con el data set “cars”
Supuestos:
• Linealidad
• Homogeneidad
• Homocedasticidad
• Normalidad
• Independencia
Modelo Lineal
modeloCars = lm(muestraDist ~ muestraSpeed, data = carsMuestreado)
summary(modeloCars)
##
## Call:
## lm(formula = muestraDist ~ muestraSpeed, data = carsMuestreado)
##
## Residuals:
## Min 1Q Median 3Q Max
## -19.900 -8.016 -1.285 6.754 33.945
##
## Coefficients:
## Estimate Std. Error t value Pr(>|t|)
## (Intercept) -10.8769 10.3381 -1.052 0.307
## muestraSpeed 3.3851 0.6319 5.357 4.32e-05 ***
## ---
## Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
##
## Residual standard error: 13.47 on 18 degrees of freedom
## Multiple R-squared: 0.6145, Adjusted R-squared: 0.5931
## F-statistic: 28.7 on 1 and 18 DF, p-value: 4.316e-05
shapiro.test(modeloCars$residuals)
##
## Shapiro-Wilk normality test
##
## data: modeloCars$residuals
## W = 0.95095, p-value = 0.3818
Según el test de normalidad de Shapiro-Wilk, el p-value (0.3818) es mayor que el
nivel de significancia de 0.05, por lo que no se rechaza la hipótesis nula de normalidad
de los residuos; entonces el modelo cumple con el supuesto de la normalidad.
# Scatter plot of stopping distance against speed for the sample, with the
# fitted line of modeloCars drawn on top.
# The y-axis label is kept on a single line so that no line break ends up
# inside the label text.
plot(muestraDist ~ muestraSpeed, xlab = "Velocidad",
     ylab = "Distancia de frenado")
abline(modeloCars)
Regresión lineal Simple - Bondad de Ajuste
Y: Distancia de frenado
Contraste de hipótesis:
H0: B1 = 0
H1: B1 ≠ 0
Se rechaza la hipótesis nula de que este coeficiente es cero debido a que el valor de
Pr(>|t|) es 4.32e-05, menor que 0.05. Esto significa que hay una probabilidad muy baja
de que el coeficiente estimado de speed en el modelo lineal esté dentro de una distribución
aleatoria de valores “nulos”, es decir, de coeficientes obtenidos aleatoriamente pero
que en realidad no son distintos de cero.
# Summarise the full state.x77 data set, then draw a simple random sample of
# n rows (states) without replacement and print it.
# NOTE(review): no seed is set in this chunk, so the sampled rows change on
# every run; call set.seed() first if the report must be reproducible.
summary(state.x77)
n = 20
# seq_len() is safe even for a zero-row table, and the sample size comes from
# n instead of being repeated as a literal.
indices = sample(seq_len(nrow(state.x77)), n)
stateMuestreado = state.x77[indices, ]
stateMuestreado
Variable Population
muestraPopu = stateMuestreado[,1]
library(fdth)
k = nclass.Sturges(muestraPopu)
tablaP = fdt(muestraPopu, breaks = "Sturges", right = FALSE)
tablaP
mean(muestraPopu)
## [1] 3966.2
median(muestraPopu)
## [1] 3329.5
## [1] 365 590 812 813 1144 1544 2110 2212 2280 3100 3559
3615
## [13] 3921 4122 4173 4981 8277 9111 10735 11860
summary(muestraPopu)
## 5% 95%
## 578.75 10791.25
RI = IQR(muestraPopu)
RI
## [1] 2931
sum(v_logico1)
## [1] 0
sum(v_logico2)
## [1] 3
## [1] 10735
var(muestraPopu)
## [1] 11725047
sd(muestraPopu)
## [1] 3424.186
cv = (sd(muestraPopu)/mean(muestraPopu)) * 100
cv
## [1] 86.33417
Variable Income
muestraIncome = stateMuestreado[,2]
library(fdth)
k = nclass.Sturges(muestraIncome)
tablaI = fdt(muestraIncome, breaks = "Sturges", right = FALSE)
tablaI
mean(muestraIncome)
## [1] 4572.9
median(muestraIncome)
## [1] 4615
## [1] 3378 3601 3624 3821 4119 4281 4449 4508 4530 4561 4669 4675 4701
4751 4815
## [16] 4864 5149 5299 5348 6315
summary(muestraIncome)
## 5% 95%
## 3589.85 5396.35
RI = IQR(muestraIncome)
RI
## [1] 586.75
sum(v_logico1)
## [1] 0
sum(v_logico2)
## [1] 1
## [1] 6315
var(muestraIncome)
## [1] 466150.6
sd(muestraIncome)
## [1] 682.7522
cv = (sd(muestraIncome)/mean(muestraIncome)) * 100
cv
## [1] 14.9304
Variable Area
muestraArea = stateMuestreado[,8]
library(fdth)
k = nclass.Sturges(muestraArea)
tablaA = fdt(muestraArea, breaks = "Sturges", right = FALSE)
tablaA
mean(muestraArea)
## [1] 85117.25
median(muestraArea)
## [1] 55453.5
## [1] 4862 9027 9891 39780 40975 41328 44966 50708 51945
54090
## [11] 56817 66570 76483 79289 81787 82677 109889 113417 121412
566432
summary(muestraArea)
## 5% 95%
## 8818.75 143663.00
RI = IQR(muestraArea)
RI
## [1] 40769.75
sum(v_logico1)
## [1] 0
sum(v_logico2)
## [1] 1
## [1] 566432
var(muestraArea)
## [1] 13912448017
sd(muestraArea)
## [1] 117951
cv = (sd(muestraArea)/mean(muestraArea)) * 100
cv
## [1] 138.5748
Supuestos:
• Linealidad
• Homogeneidad
• Homocedasticidad
• Normalidad
• Independencia
Modelo Lineal
# Fit a multiple linear regression of population on income and area for the
# sampled states and print the model summary.
# The three formula terms are workspace vectors extracted from
# stateMuestreado, so `data` is set to that same sample (converted to a data
# frame because it is a matrix subset) rather than to the unrelated cars
# sample. The estimates do not depend on `data` here, since none of the terms
# are looked up as columns.
modeloState = lm(muestraPopu ~ muestraIncome + muestraArea,
                 data = as.data.frame(stateMuestreado))
summary(modeloState)
##
## Call:
## lm(formula = muestraPopu ~ muestraIncome + muestraArea, data =
carsMuestreado)
##
## Residuals:
## Min 1Q Median 3Q Max
## -3807.4 -1995.3 -946.5 541.6 7514.3
##
## Coefficients:
## Estimate Std. Error t value Pr(>|t|)
## (Intercept) -2.056e+02 5.791e+03 -0.036 0.972
## muestraIncome 1.155e+00 1.326e+00 0.871 0.396
## muestraArea -1.301e-02 7.673e-03 -1.696 0.108
##
## Residual standard error: 3348 on 17 degrees of freedom
## Multiple R-squared: 0.1448, Adjusted R-squared: 0.04417
## F-statistic: 1.439 on 2 and 17 DF, p-value: 0.2646
shapiro.test(modeloState$residuals)
##
## Shapiro-Wilk normality test
##
## data: modeloState$residuals
## W = 0.87936, p-value = 0.01723
Según el test de normalidad de Shapiro-Wilk, el p-value (0.01723) es menor que el
nivel de significancia de 0.05, por lo que se rechaza la hipótesis nula de normalidad
de los residuos; entonces el modelo no cumple con el supuesto de la normalidad.
# Population is the response of modeloState, so it goes on the y axis; draw
# one scatter plot per predictor, each labelled with its own variable.
plot(muestraPopu ~ muestraIncome, xlab = "Income", ylab = "Population")
plot(muestraPopu ~ muestraArea, xlab = "Area", ylab = "Population")
# abline() draws a line from one intercept and one slope, so it cannot
# represent a fit with two predictors. Show the fit as observed against
# fitted values instead; points on the identity line are predicted exactly.
plot(fitted(modeloState), muestraPopu,
     xlab = "Fitted Population", ylab = "Observed Population")
abline(a = 0, b = 1)
#ANOVA
data = iris3
data
## , , Setosa
##
## Sepal L. Sepal W. Petal L. Petal W.
## [1,] 5.1 3.5 1.4 0.2
## [2,] 4.9 3.0 1.4 0.2
## [3,] 4.7 3.2 1.3 0.2
## [4,] 4.6 3.1 1.5 0.2
## [5,] 5.0 3.6 1.4 0.2
## [6,] 5.4 3.9 1.7 0.4
## [7,] 4.6 3.4 1.4 0.3
## [8,] 5.0 3.4 1.5 0.2
## [9,] 4.4 2.9 1.4 0.2
## [10,] 4.9 3.1 1.5 0.1
## [11,] 5.4 3.7 1.5 0.2
## [12,] 4.8 3.4 1.6 0.2
## [13,] 4.8 3.0 1.4 0.1
## [14,] 4.3 3.0 1.1 0.1
## [15,] 5.8 4.0 1.2 0.2
## [16,] 5.7 4.4 1.5 0.4
## [17,] 5.4 3.9 1.3 0.4
## [18,] 5.1 3.5 1.4 0.3
## [19,] 5.7 3.8 1.7 0.3
## [20,] 5.1 3.8 1.5 0.3
## [21,] 5.4 3.4 1.7 0.2
## [22,] 5.1 3.7 1.5 0.4
## [23,] 4.6 3.6 1.0 0.2
## [24,] 5.1 3.3 1.7 0.5
## [25,] 4.8 3.4 1.9 0.2
## [26,] 5.0 3.0 1.6 0.2
## [27,] 5.0 3.4 1.6 0.4
## [28,] 5.2 3.5 1.5 0.2
## [29,] 5.2 3.4 1.4 0.2
## [30,] 4.7 3.2 1.6 0.2
## [31,] 4.8 3.1 1.6 0.2
## [32,] 5.4 3.4 1.5 0.4
## [33,] 5.2 4.1 1.5 0.1
## [34,] 5.5 4.2 1.4 0.2
## [35,] 4.9 3.1 1.5 0.2
## [36,] 5.0 3.2 1.2 0.2
## [37,] 5.5 3.5 1.3 0.2
## [38,] 4.9 3.6 1.4 0.1
## [39,] 4.4 3.0 1.3 0.2
## [40,] 5.1 3.4 1.5 0.2
## [41,] 5.0 3.5 1.3 0.3
## [42,] 4.5 2.3 1.3 0.3
## [43,] 4.4 3.2 1.3 0.2
## [44,] 5.0 3.5 1.6 0.6
## [45,] 5.1 3.8 1.9 0.4
## [46,] 4.8 3.0 1.4 0.3
## [47,] 5.1 3.8 1.6 0.2
## [48,] 4.6 3.2 1.4 0.2
## [49,] 5.3 3.7 1.5 0.2
## [50,] 5.0 3.3 1.4 0.2
##
## , , Versicolor
##
## Sepal L. Sepal W. Petal L. Petal W.
## [1,] 7.0 3.2 4.7 1.4
## [2,] 6.4 3.2 4.5 1.5
## [3,] 6.9 3.1 4.9 1.5
## [4,] 5.5 2.3 4.0 1.3
## [5,] 6.5 2.8 4.6 1.5
## [6,] 5.7 2.8 4.5 1.3
## [7,] 6.3 3.3 4.7 1.6
## [8,] 4.9 2.4 3.3 1.0
## [9,] 6.6 2.9 4.6 1.3
## [10,] 5.2 2.7 3.9 1.4
## [11,] 5.0 2.0 3.5 1.0
## [12,] 5.9 3.0 4.2 1.5
## [13,] 6.0 2.2 4.0 1.0
## [14,] 6.1 2.9 4.7 1.4
## [15,] 5.6 2.9 3.6 1.3
## [16,] 6.7 3.1 4.4 1.4
## [17,] 5.6 3.0 4.5 1.5
## [18,] 5.8 2.7 4.1 1.0
## [19,] 6.2 2.2 4.5 1.5
## [20,] 5.6 2.5 3.9 1.1
## [21,] 5.9 3.2 4.8 1.8
## [22,] 6.1 2.8 4.0 1.3
## [23,] 6.3 2.5 4.9 1.5
## [24,] 6.1 2.8 4.7 1.2
## [25,] 6.4 2.9 4.3 1.3
## [26,] 6.6 3.0 4.4 1.4
## [27,] 6.8 2.8 4.8 1.4
## [28,] 6.7 3.0 5.0 1.7
## [29,] 6.0 2.9 4.5 1.5
## [30,] 5.7 2.6 3.5 1.0
## [31,] 5.5 2.4 3.8 1.1
## [32,] 5.5 2.4 3.7 1.0
## [33,] 5.8 2.7 3.9 1.2
## [34,] 6.0 2.7 5.1 1.6
## [35,] 5.4 3.0 4.5 1.5
## [36,] 6.0 3.4 4.5 1.6
## [37,] 6.7 3.1 4.7 1.5
## [38,] 6.3 2.3 4.4 1.3
## [39,] 5.6 3.0 4.1 1.3
## [40,] 5.5 2.5 4.0 1.3
## [41,] 5.5 2.6 4.4 1.2
## [42,] 6.1 3.0 4.6 1.4
## [43,] 5.8 2.6 4.0 1.2
## [44,] 5.0 2.3 3.3 1.0
## [45,] 5.6 2.7 4.2 1.3
## [46,] 5.7 3.0 4.2 1.2
## [47,] 5.7 2.9 4.2 1.3
## [48,] 6.2 2.9 4.3 1.3
## [49,] 5.1 2.5 3.0 1.1
## [50,] 5.7 2.8 4.1 1.3
##
## , , Virginica
##
## Sepal L. Sepal W. Petal L. Petal W.
## [1,] 6.3 3.3 6.0 2.5
## [2,] 5.8 2.7 5.1 1.9
## [3,] 7.1 3.0 5.9 2.1
## [4,] 6.3 2.9 5.6 1.8
## [5,] 6.5 3.0 5.8 2.2
## [6,] 7.6 3.0 6.6 2.1
## [7,] 4.9 2.5 4.5 1.7
## [8,] 7.3 2.9 6.3 1.8
## [9,] 6.7 2.5 5.8 1.8
## [10,] 7.2 3.6 6.1 2.5
## [11,] 6.5 3.2 5.1 2.0
## [12,] 6.4 2.7 5.3 1.9
## [13,] 6.8 3.0 5.5 2.1
## [14,] 5.7 2.5 5.0 2.0
## [15,] 5.8 2.8 5.1 2.4
## [16,] 6.4 3.2 5.3 2.3
## [17,] 6.5 3.0 5.5 1.8
## [18,] 7.7 3.8 6.7 2.2
## [19,] 7.7 2.6 6.9 2.3
## [20,] 6.0 2.2 5.0 1.5
## [21,] 6.9 3.2 5.7 2.3
## [22,] 5.6 2.8 4.9 2.0
## [23,] 7.7 2.8 6.7 2.0
## [24,] 6.3 2.7 4.9 1.8
## [25,] 6.7 3.3 5.7 2.1
## [26,] 7.2 3.2 6.0 1.8
## [27,] 6.2 2.8 4.8 1.8
## [28,] 6.1 3.0 4.9 1.8
## [29,] 6.4 2.8 5.6 2.1
## [30,] 7.2 3.0 5.8 1.6
## [31,] 7.4 2.8 6.1 1.9
## [32,] 7.9 3.8 6.4 2.0
## [33,] 6.4 2.8 5.6 2.2
## [34,] 6.3 2.8 5.1 1.5
## [35,] 6.1 2.6 5.6 1.4
## [36,] 7.7 3.0 6.1 2.3
## [37,] 6.3 3.4 5.6 2.4
## [38,] 6.4 3.1 5.5 1.8
## [39,] 6.0 3.0 4.8 1.8
## [40,] 6.9 3.1 5.4 2.1
## [41,] 6.7 3.1 5.6 2.4
## [42,] 6.9 3.1 5.1 2.3
## [43,] 5.8 2.7 5.1 1.9
## [44,] 6.8 3.2 5.9 2.3
## [45,] 6.7 3.3 5.7 2.5
## [46,] 6.7 3.0 5.2 2.3
## [47,] 6.3 2.5 5.0 1.9
## [48,] 6.5 3.0 5.2 2.0
## [49,] 6.2 3.4 5.4 2.3
## [50,] 5.9 3.0 5.1 1.8
## [1] 5.1 4.9 4.7 4.6 5.0 5.4 4.6 5.0 4.4 4.9 5.4 4.8 4.8 4.3 5.8
## , , Setosa
##
## Sepal L. Sepal W. Petal L. Petal W.
## [1,] 5.1 3.5 1.4 0.2
## [2,] 4.9 3.0 1.4 0.2
## [3,] 4.7 3.2 1.3 0.2
## [4,] 4.6 3.1 1.5 0.2
## [5,] 5.0 3.6 1.4 0.2
## [6,] 5.4 3.9 1.7 0.4
## [7,] 4.6 3.4 1.4 0.3
## [8,] 5.0 3.4 1.5 0.2
## [9,] 4.4 2.9 1.4 0.2
## [10,] 4.9 3.1 1.5 0.1
## [11,] 5.4 3.7 1.5 0.2
## [12,] 4.8 3.4 1.6 0.2
## [13,] 4.8 3.0 1.4 0.1
## [14,] 4.3 3.0 1.1 0.1
## [15,] 5.8 4.0 1.2 0.2
##
## , , Versicolor
##
## Sepal L. Sepal W. Petal L. Petal W.
## [1,] 7.0 3.2 4.7 1.4
## [2,] 6.4 3.2 4.5 1.5
## [3,] 6.9 3.1 4.9 1.5
## [4,] 5.5 2.3 4.0 1.3
## [5,] 6.5 2.8 4.6 1.5
## [6,] 5.7 2.8 4.5 1.3
## [7,] 6.3 3.3 4.7 1.6
## [8,] 4.9 2.4 3.3 1.0
## [9,] 6.6 2.9 4.6 1.3
## [10,] 5.2 2.7 3.9 1.4
## [11,] 5.0 2.0 3.5 1.0
## [12,] 5.9 3.0 4.2 1.5
## [13,] 6.0 2.2 4.0 1.0
## [14,] 6.1 2.9 4.7 1.4
## [15,] 5.6 2.9 3.6 1.3
##
## , , Virginica
##
## Sepal L. Sepal W. Petal L. Petal W.
## [1,] 6.3 3.3 6.0 2.5
## [2,] 5.8 2.7 5.1 1.9
## [3,] 7.1 3.0 5.9 2.1
## [4,] 6.3 2.9 5.6 1.8
## [5,] 6.5 3.0 5.8 2.2
## [6,] 7.6 3.0 6.6 2.1
## [7,] 4.9 2.5 4.5 1.7
## [8,] 7.3 2.9 6.3 1.8
## [9,] 6.7 2.5 5.8 1.8
## [10,] 7.2 3.6 6.1 2.5
## [11,] 6.5 3.2 5.1 2.0
## [12,] 6.4 2.7 5.3 1.9
## [13,] 6.8 3.0 5.5 2.1
## [14,] 5.7 2.5 5.0 2.0
## [15,] 5.8 2.8 5.1 2.4
sacm_datos[,,1]
sacm_datos[,,2]
sacm_datos[,,3]
# Build one data frame from `uni` and tag each row with its group, then
# print it.
# NOTE(review): `uni` is created outside this view; this assumes it holds 45
# rows ordered as three consecutive groups of 15 — confirm.
mat_uni = data.frame(uni)
# Rows 1-15, 16-30 and 31-45 get codes 1, 2 and 3. The code is stored as a
# factor so that model functions treat it as a categorical grouping (one
# level per group) rather than as a numeric covariate.
mat_uni$grupo = factor(rep(1:3, each = 15))
mat_uni
## Sepal.L. Sepal.W. Petal.L. Petal.W. grupo
## 1 5.1 3.5 1.4 0.2 1
## 2 4.9 3.0 1.4 0.2 1
## 3 4.7 3.2 1.3 0.2 1
## 4 4.6 3.1 1.5 0.2 1
## 5 5.0 3.6 1.4 0.2 1
## 6 5.4 3.9 1.7 0.4 1
## 7 4.6 3.4 1.4 0.3 1
## 8 5.0 3.4 1.5 0.2 1
## 9 4.4 2.9 1.4 0.2 1
## 10 4.9 3.1 1.5 0.1 1
## 11 5.4 3.7 1.5 0.2 1
## 12 4.8 3.4 1.6 0.2 1
## 13 4.8 3.0 1.4 0.1 1
## 14 4.3 3.0 1.1 0.1 1
## 15 5.8 4.0 1.2 0.2 1
## 16 7.0 3.2 4.7 1.4 2
## 17 6.4 3.2 4.5 1.5 2
## 18 6.9 3.1 4.9 1.5 2
## 19 5.5 2.3 4.0 1.3 2
## 20 6.5 2.8 4.6 1.5 2
## 21 5.7 2.8 4.5 1.3 2
## 22 6.3 3.3 4.7 1.6 2
## 23 4.9 2.4 3.3 1.0 2
## 24 6.6 2.9 4.6 1.3 2
## 25 5.2 2.7 3.9 1.4 2
## 26 5.0 2.0 3.5 1.0 2
## 27 5.9 3.0 4.2 1.5 2
## 28 6.0 2.2 4.0 1.0 2
## 29 6.1 2.9 4.7 1.4 2
## 30 5.6 2.9 3.6 1.3 2
## 31 6.3 3.3 6.0 2.5 3
## 32 5.8 2.7 5.1 1.9 3
## 33 7.1 3.0 5.9 2.1 3
## 34 6.3 2.9 5.6 1.8 3
## 35 6.5 3.0 5.8 2.2 3
## 36 7.6 3.0 6.6 2.1 3
## 37 4.9 2.5 4.5 1.7 3
## 38 7.3 2.9 6.3 1.8 3
## 39 6.7 2.5 5.8 1.8 3
## 40 7.2 3.6 6.1 2.5 3
## 41 6.5 3.2 5.1 2.0 3
## 42 6.4 2.7 5.3 1.9 3
## 43 6.8 3.0 5.5 2.1 3
## 44 5.7 2.5 5.0 2.0 3
## 45 5.8 2.8 5.1 2.4 3
Con el valor p no se rechaza la hipótesis nula de que las medias de los grupos son
iguales entre sí, es decir, que los factores no afectan a la variable de respuesta “Sepal. L.”