install.packages("openintro")Installing package into ‘/usr/local/lib/R/site-library’
(as ‘lib’ is unspecified)
also installing the dependencies ‘airports’, ‘cherryblossom’, ‘usdata’
install.packages("openintro")Installing package into ‘/usr/local/lib/R/site-library’
(as ‘lib’ is unspecified)
also installing the dependencies ‘airports’, ‘cherryblossom’, ‘usdata’
library(openintro)
library(dplyr)Loading required package: airports
Loading required package: cherryblossom
Loading required package: usdata
Attaching package: ‘dplyr’
The following objects are masked from ‘package:stats’:
filter, lag
The following objects are masked from ‘package:base’:
intersect, setdiff, setequal, union
Vamos a generar una muestra simulando un grupo de 9 estudiantes que tienen edades entre 20 y 25 años
set.seed(1234)
# x= población de la cuál se obtendrá la muestra
# size= cantidad de elementos que tendrá la muestra
# replace= establece sin en la muestra se pueden repetir elementos contenidos en x
muestra = sample(x=20:25,size = 9, replace= TRUE)
muestrahead(babies)| case | bwt | gestation | parity | age | height | weight | smoke |
|---|---|---|---|---|---|---|---|
| <int> | <int> | <int> | <int> | <int> | <int> | <int> | <int> |
| 1 | 120 | 284 | 0 | 27 | 62 | 100 | 0 |
| 2 | 113 | 282 | 0 | 33 | 64 | 135 | 0 |
| 3 | 128 | 279 | 0 | 28 | 64 | 115 | 1 |
| 4 | 123 | NA | 0 | 36 | 69 | 190 | 0 |
| 5 | 108 | 282 | 0 | 23 | 67 | 125 | 1 |
| 6 | 136 | 286 | 0 | 25 | 62 | 93 | 0 |
edad_madres= babies$age[!is.na(babies$age)]
edad_madresresultado <- hist(edad_madres, breaks = 5, plot=F)resultado$breaks
[1] 15 20 25 30 35 40 45
$counts
[1] 134 402 374 190 108 26
$density
[1] 0.021717990 0.065153971 0.060615883 0.030794165 0.017504052 0.004213938
$mids
[1] 17.5 22.5 27.5 32.5 37.5 42.5
$xname
[1] "edad_madres"
$equidist
[1] TRUE
attr(,"class")
[1] "histogram"
data.frame(Xi=resultado$mids,
fi=resultado$counts,
densidad= resultado$density)%>%
mutate(hi= (fi/sum(resultado$counts)*100))%>%
mutate(Fi= cumsum(fi))%>%
mutate(HI= cumsum(fi/sum(resultado$counts)*100))| Xi | fi | densidad | hi | Fi | HI |
|---|---|---|---|---|---|
| <dbl> | <int> | <dbl> | <dbl> | <int> | <dbl> |
| 17.5 | 134 | 0.021717990 | 10.858995 | 134 | 10.85900 |
| 22.5 | 402 | 0.065153971 | 32.576985 | 536 | 43.43598 |
| 27.5 | 374 | 0.060615883 | 30.307942 | 910 | 73.74392 |
| 32.5 | 190 | 0.030794165 | 15.397083 | 1100 | 89.14100 |
| 37.5 | 108 | 0.017504052 | 8.752026 | 1208 | 97.89303 |
| 42.5 | 26 | 0.004213938 | 2.106969 | 1234 | 100.00000 |
hist(classdata$m1)hist(babies$age)hist(babies$height)hist(babies$weight)hist(babies$gestation,breaks =20)hist(age_at_mar$age)hist(arbuthnot$year, breaks = 50)# frecuencia relativa
hist(gpa_iq$gpa, freq=FALSE)hist(gpa_iq$gpa)resultado2 <- hist(gpa_iq$gpa, breaks = 5, plot=F)
data.frame(Xi=resultado2$mids,
fi=resultado2$counts,
densidad= resultado2$density
)%>%
mutate(hi= (fi/sum(resultado2$counts)*100))%>%
mutate(Fi= cumsum(fi))%>%
mutate(HI= cumsum(fi/sum(resultado2$counts)*100))| Xi | fi | densidad | hi | Fi | HI |
|---|---|---|---|---|---|
| <dbl> | <int> | <dbl> | <dbl> | <int> | <dbl> |
| 1 | 2 | 0.01282051 | 2.564103 | 2 | 2.564103 |
| 3 | 6 | 0.03846154 | 7.692308 | 8 | 10.256410 |
| 5 | 8 | 0.05128205 | 10.256410 | 16 | 20.512821 |
| 7 | 30 | 0.19230769 | 38.461538 | 46 | 58.974359 |
| 9 | 28 | 0.17948718 | 35.897436 | 74 | 94.871795 |
| 11 | 4 | 0.02564103 | 5.128205 | 78 | 100.000000 |