Você está na página 1 de 15

R Notebook – CÁLCULOS Y ANÁLISIS PARA LA REALIZACIÓN DE LA

ESTADÍSTICA DESCRIPTIVA DE LA BASE DE DATOS CRIME1


A continuación se presenta una reducida muestra de la base de datos usada y cargada en el programa
informático.
# Read the CRIME1 data set (a Stata .dta file) directly from the Internet.
library(foreign)
datosCRIME1 <- read.dta(
  "http://fmwww.bc.edu/ec-p/data/wooldridge/crime1.dta"
)
# Show only the first 20 observations: the accompanying text presents a small
# sample, whereas printing the bare object would dump every row of the data
# frame into the report.
head(datosCRIME1, n = 20)

## narr86 nfarr86 nparr86 pcnv avgsen tottime ptime86 qemp86 inc86 durat
## 1 0 0 0 0.38 17.6 35.2 12 0.0 0.0 0.0
## 2 2 2 0 0.44 0.0 0.0 0 1.0 0.8 0.0
## 3 1 1 0 0.33 22.8 22.8 0 0.0 0.0 11.0
## 4 2 2 1 0.25 0.0 0.0 5 2.0 8.8 0.0
## 5 1 1 0 0.00 0.0 0.0 0 2.0 8.1 1.0
## 6 0 0 0 1.00 0.0 0.0 0 4.0 97.6 0.0
## 7 2 2 1 0.44 0.0 0.0 0 0.0 0.0 1.0
## 8 5 3 5 0.75 0.0 0.0 0 0.0 0.0 3.0
## 9 0 0 0 0.33 10.9 21.8 9 0.0 0.0 19.3
## 10 0 0 0 0.23 0.0 0.0 0 3.0 16.7 0.0
## 11 1 1 0 0.00 0.0 0.0 0 4.0 162.5 0.0
## 12 0 0 0 0.17 31.7 63.4 12 0.0 0.0 0.0
## 13 0 0 0 0.33 0.0 0.0 0 4.0 32.9 0.0
## 14 0 0 0 0.00 0.0 0.0 0 0.0 0.0 14.0
## 15 1 1 0 0.00 0.0 0.0 0 4.0 174.5 0.0
## 16 0 0 0 0.20 59.2 59.2 3 1.7 14.3 4.3
## 17 1 1 0 0.38 0.0 0.0 0 0.0 0.0 18.0
## 18 0 0 0 0.50 0.0 0.0 0 4.0 154.0 0.0
## 19 0 0 0 0.60 7.9 23.7 0 0.0 0.0 11.0
## 20 0 0 0 0.50 0.0 0.0 0 4.0 100.3 0.0

## black hispan born60 pcnvsq pt86sq inc86sq


## 1 0 0 1 0.1444 144 0.000000e+00
## 2 0 1 0 0.1936 0 6.400000e-01
## 3 1 0 1 0.1089 0 0.000000e+00
## 4 0 1 1 0.0625 25 7.744000e+01
## 5 0 0 0 0.0000 0 6.561001e+01
## 6 0 0 1 1.0000 0 9.525760e+03
## 7 1 0 1 0.1936 0 0.000000e+00
## 8 0 0 1 0.5625 0 0.000000e+00
## 9 1 0 1 0.1089 81 0.000000e+00
## 10 0 1 1 0.0529 0 2.788900e+02
ANÁLISIS ESTADÍSTICOS UNIVARIANTES
# Descriptive statistics (min, quartiles, mean, max) for every column of
# the "datosCRIME1" data set
summary(object = datosCRIME1)

## narr86 nfarr86 nparr86 pcnv


## Min. : 0.0000 Min. :0.0000 Min. :0.0000 Min. :0.0000
## 1st Qu.: 0.0000 1st Qu.:0.0000 1st Qu.:0.0000 1st Qu.:0.0000
## Median : 0.0000 Median :0.0000 Median :0.0000 Median :0.2500
## Mean : 0.4044 Mean :0.2334 Mean :0.1255 Mean :0.3578
## 3rd Qu.: 1.0000 3rd Qu.:0.0000 3rd Qu.:0.0000 3rd Qu.:0.6700
## Max. :12.0000 Max. :6.0000 Max. :8.0000 Max. :1.0000
## avgsen tottime ptime86 qemp86
## Min. : 0.0000 Min. : 0.0000 Min. : 0.0000 Min. :0.000
## 1st Qu.: 0.0000 1st Qu.: 0.0000 1st Qu.: 0.0000 1st Qu.:1.000
## Median : 0.0000 Median : 0.0000 Median : 0.0000 Median :3.000
## Mean : 0.6323 Mean : 0.8387 Mean : 0.3872 Mean :2.309
## 3rd Qu.: 0.0000 3rd Qu.: 0.0000 3rd Qu.: 0.0000 3rd Qu.:4.000
## Max. :59.2000 Max. :63.4000 Max. :12.0000 Max. :4.000
## inc86 durat black hispan
## Min. : 0.00 Min. : 0.000 Min. :0.0000 Min. :0.0000
## 1st Qu.: 0.40 1st Qu.: 0.000 1st Qu.:0.0000 1st Qu.:0.0000
## Median : 29.00 Median : 0.000 Median :0.0000 Median :0.0000
## Mean : 54.97 Mean : 2.251 Mean :0.1611 Mean :0.2176
## 3rd Qu.: 90.10 3rd Qu.: 2.000 3rd Qu.:0.0000 3rd Qu.:0.0000
## Max. :541.00 Max. :25.000 Max. :1.0000 Max. :1.0000
## born60 pcnvsq pt86sq inc86sq
## Min. :0.0000 Min. :0.0000 Min. : 0.000 Min. : 0.00
## 1st Qu.:0.0000 1st Qu.:0.0000 1st Qu.: 0.000 1st Qu.: 0.16
## Median :0.0000 Median :0.0625 Median : 0.000 Median : 841.00
## Mean :0.3626 Mean :0.2841 Mean : 3.951 Mean : 7458.93
## 3rd Qu.:1.0000 3rd Qu.:0.4489 3rd Qu.: 0.000 3rd Qu.: 8118.01
## Max. :1.0000 Max. :1.0000 Max. :144.000 Max. :292681.00

# Put the columns of the data frame on the search path. Kept as-is because
# other statements in this notebook may refer to columns by their bare names.
attach(datosCRIME1)

# Histogram of a single variable: narr86 (number of arrests in 1986).
# with() evaluates the call inside the data frame, so the axis label is
# still derived from the bare column name.
with(
  datosCRIME1,
  hist(narr86, main = "Histograma de la Variable narr86", col = "sky blue")
)

El histograma muestra la frecuencia de cada número de arrestos y revela que la gran mayoría de las personas
fue arrestada a lo sumo una vez durante el año 1986 (la mediana de narr86 es 0 y el tercer cuartil es 1).
# Histogram of every variable in the data set.
# Each entry holds, in order: the column name, the fill colour and the exact
# plot title to use for that column.
hist_specs <- list(
  c("narr86", "sky blue", "Histograma de la Variable narr86"),
  c("nfarr86", "red", "Histograma de la variable nfarr86"),
  c("nparr86", "blue", "Histograma de la Variable nparr86"),
  c("pcnv", "yellow", "Histograma de la variable pcnv"),
  c("avgsen", "black", "Histograma de la variable avgsen"),
  c("tottime", "pink", "Histograma de la Variable tottime"),
  c("ptime86", "brown", "Histograma de la variable ptime86"),
  c("qemp86", "green", "Histograma de la Variable qemp86"),
  c("inc86", "orange", "Histograma de la variable inc86"),
  c("durat", "purple", "Histograma de la Variable durat"),
  c("black", "maroon", "Histograma de la variable black"),
  c("hispan", "gray", "Histograma de la variable hispan"),
  c("born60", "violet", "Histograma de la Variable born60"),
  c("pcnvsq", "green yellow", "Histograma de la variable pcnvsq"),
  c("pt86sq", "gold", "Histograma de la Variable pt86sq"),
  c("inc86sq", "darkgreen", "Histograma de la variable inc86sq")
)

# Draw the histograms one after another, in the order listed above.
for (spec in hist_specs) {
  hist(
    datosCRIME1[[spec[1]]],
    col = spec[2],
    main = spec[3],
    # Label the x axis with the bare column name, as a direct call on the
    # column would.
    xlab = spec[1]
  )
}

# Bar chart of narr86.
# barplot() draws one bar per element of its input, so passing the raw column
# would produce one bar per observation. Tabulating first gives one bar per
# distinct arrest count, whose height is the number of observations.
barplot(
  table(datosCRIME1[["narr86"]]),
  col = "sky blue",
  main = "Diagrama de Barras de la Variable narr86"
)
# Box plot of a single variable (narr86).
boxplot(datosCRIME1[["narr86"]], col = "purple", main = "Diagrama de Cajas")

El diagrama de cajas muestra que el primer cuartil y la mediana de narr86 son 0 y que el tercer cuartil es 1,
es decir, al menos el 75 % de las personas fue arrestado a lo sumo una vez en el año 1986; también se observa
la presencia de algunos datos atípicos (hasta un máximo de 12 arrestos).

ANÁLISIS ESTADÍSTICOS BIVARIANTES


# Pearson correlation coefficients for every pair of variables
# (the matrix that the correlation plot is based on)
cor(x = datosCRIME1, method = "pearson")
## narr86 nfarr86 nparr86 pcnv avgsen
## narr86 1.00000000 0.80741555 0.660836101 -0.072460574 0.029297803
## nfarr86 0.80741555 1.00000000 0.634889922 -0.063637015 0.021534423
## nparr86 0.66083610 0.63488992 1.000000000 -0.017513357 -0.009805834
## pcnv -0.07246057 -0.06363701 -0.017513357 1.000000000 0.025832955
## avgsen 0.02929780 0.02153442 -0.009805834 0.025832955 1.000000000
## tottime 0.03448612 0.02605154 -0.002484245 0.029904743 0.928540437
## ptime86 -0.02994412 -0.01206333 -0.008736298 0.053936087 0.235280942
## qemp86 -0.17413566 -0.18622178 -0.129729439 -0.003704690 -0.106676748
## inc86 -0.18997653 -0.17876518 -0.140529313 -0.008890544 -0.095805958
## durat 0.08232769 0.10629126 0.062814689 -0.022945822 0.028431622
## black 0.14930289 0.16245659 0.101120535 -0.066061585 0.119399294
## hispan 0.05300297 0.01928596 -0.013677282 0.010201436 0.012767150
## born60 -0.02448522 -0.02049111 -0.012647417 0.047267356 0.012273553
## pcnvsq -0.10750092 -0.09631280 -0.045923607 0.962854147 -0.018978898
## pt86sq -0.06002315 -0.04582933 -0.029305953 0.049140378 0.214348189
## inc86sq -0.13095379 -0.11768424 -0.096646960 0.001867246 -0.059031815
## tottime ptime86 qemp86 inc86
## narr86 0.034486123 -0.0299441157 -0.1741356645 -0.1899765347
## nfarr86 0.026051545 -0.0120633287 -0.1862217751 -0.1787651819
## nparr86 -0.002484245 -0.0087362984 -0.1297294394 -0.1405293131
## pcnv 0.029904743 0.0539360868 -0.0037046904 -0.0088905436
## avgsen 0.928540437 0.2352809424 -0.1066767479 -0.0958059582
## tottime 1.000000000 0.2820839607 -0.1219436221 -0.0996803144
## ptime86 0.282083961 1.0000000000 -0.2659565140 -0.1600273709
## qemp86 -0.121943622 -0.2659565140 1.0000000000 0.7117812540
## inc86 -0.099680314 -0.1600273709 0.7117812540 1.0000000000
## durat 0.027841469 -0.0235857933 -0.4853196435 -0.3429295359
## black 0.113816143 0.0737466122 -0.1592463974 -0.1469572086
## hispan 0.020856548 0.0512793990 0.0331670117 0.0007708986
## born60 0.014933700 0.0064561501 0.0001805366 0.0811217774
## pcnvsq -0.016699734 0.0003593481 0.0504413071 0.0426943215
## pt86sq 0.262257518 0.9827637456 -0.2484045343 -0.1459995011
## inc86sq -0.059573348 -0.0901264610 0.4433382355 0.8876100113
## durat black hispan born60 pcnvsq
## narr86 0.082327695 0.14930289 0.0530029730 -0.0244852172 -0.1075009242
## nfarr86 0.106291261 0.16245659 0.0192859641 -0.0204911090 -0.0963128020
## nparr86 0.062814689 0.10112054 -0.0136772823 -0.0126474166 -0.0459236069
## pcnv -0.022945822 -0.06606159 0.0102014357 0.0472673557 0.9628541468
## avgsen 0.028431622 0.11939929 0.0127671500 0.0122735531 -0.0189788984
## tottime 0.027841469 0.11381614 0.0208565478 0.0149337000 -0.0166997343
## ptime86 -0.023585793 0.07374661 0.0512793990 0.0064561501 0.0003593481
## qemp86 -0.485319644 -0.15924640 0.0331670117 0.0001805366 0.0504413071
## inc86 -0.342929536 -0.14695721 0.0007708986 0.0811217774 0.0426943215
## durat 1.000000000 0.08871061 -0.0423549332 0.0040834226 -0.0514360593
## black 0.088710610 1.00000000 -0.2311148724 0.0100339299 -0.0850691277
## hispan -0.042354933 -0.23111487 1.0000000000 -0.0111059937 -0.0245856264
## born60 0.004083423 0.01003393 -0.0111059937 1.0000000000 0.0363751217
## pcnvsq -0.051436059 -0.08506913 -0.0245856264 0.0363751217 1.0000000000
## pt86sq -0.044771787 0.06045961 0.0519132792 -0.0007874258 0.0005918222
## inc86sq -0.210722054 -0.09735657 -0.0055170302 0.0909763436 0.0370840090
## pt86sq inc86sq
## narr86 -0.0600231515 -0.130953786
## nfarr86 -0.0458293293 -0.117684240
## nparr86 -0.0293059528 -0.096646960
## pcnv 0.0491403782 0.001867246
## avgsen 0.2143481886 -0.059031815
## tottime 0.2622575183 -0.059573348
## ptime86 0.9827637456 -0.090126461
## qemp86 -0.2484045343 0.443338236
## inc86 -0.1459995011 0.887610011
## durat -0.0447717870 -0.210722054
## black 0.0604596051 -0.097356566
## hispan 0.0519132792 -0.005517030
## born60 -0.0007874258 0.090976344
## pcnvsq 0.0005918222 0.037084009
## pt86sq 1.0000000000 -0.081426939
## inc86sq -0.0814269389 1.000000000

# Matrix of pairwise plots for all variables, drawn in red
pairs(x = datosCRIME1, main = "Matriz de Correlación", col = "red")

# There is a high positive correlation between inc86^2 (inc86sq) and legal
# income in 1986 (inc86). The cell is looked up by row and column name.
cor(datosCRIME1)["inc86sq", "inc86"]
[1] 0.88761

# There is a high positive correlation between the number of felony arrests
# in 1986 (nfarr86) and the number of times arrested in 1986 (narr86).
# The cell is looked up by row and column name rather than by position.
cor(datosCRIME1)["nfarr86", "narr86"]
[1] 0.8074156
# There is a high positive correlation between time in prison since 18, in
# months (tottime), and average sentence length (avgsen).
# The cell is looked up by row and column name rather than by position.
cor(datosCRIME1)["tottime", "avgsen"]
[1] 0.9285404

# There is a high positive correlation between ptime86^2 (pt86sq) and months
# in prison during 1986 (ptime86).
# The cell is looked up by row and column name rather than by position.
cor(datosCRIME1)["pt86sq", "ptime86"]
[1] 0.9827637

# There is a high positive correlation between pcnv^2 (pcnvsq) and the
# proportion of prior convictions (pcnv).
# The cell is looked up by row and column name rather than by position.
cor(datosCRIME1)["pcnvsq", "pcnv"]
[1] 0.9628541

# Covariances for every pair of variables in the data set
cov(x = datosCRIME1, method = "pearson")

## narr86 nfarr86 nparr86 pcnv


## narr86 7.380129e-01 4.030100e-01 2.741167e-01 -0.024600384
## nfarr86 4.030100e-01 3.375775e-01 1.781127e-01 -0.014611832
## nparr86 2.741167e-01 1.781127e-01 2.331415e-01 -0.003341853
## pcnv -2.460038e-02 -1.461183e-02 -3.341853e-03 0.156176710
## avgsen 8.829386e-02 4.389181e-02 -1.660955e-02 0.035813412
## tottime 1.364886e-01 6.973331e-02 -5.526170e-03 0.054446285
## ptime86 -5.016368e-02 -1.366784e-02 -8.225896e-03 0.041565548
## qemp86 -2.409135e-01 -1.742443e-01 -1.008764e-01 -0.002357770
## inc86 -1.087386e+01 -6.920243e+00 -4.520936e+00 -0.234092823
## durat 3.258383e-01 2.845172e-01 1.397318e-01 -0.041776873
## black 4.716108e-02 3.470625e-02 1.795282e-02 -0.009599325
## hispan 1.879171e-02 4.624473e-03 -2.725485e-03 0.001663809
## born60 -1.011411e-02 -5.724582e-03 -2.936319e-03 0.008981751
## pcnvsq -3.608492e-02 -2.186514e-02 -8.664177e-03 0.148679183
## pt86sq -1.138845e+00 -5.880905e-01 -3.125213e-01 0.428904448
## inc86sq -1.840629e+03 -1.118720e+03 -7.635090e+02 12.073298043
## avgsen tottime ptime86 qemp86
## narr86 8.829386e-02 1.364886e-01 -5.016368e-02 -2.409135e-01
## nfarr86 4.389181e-02 6.973331e-02 -1.366784e-02 -1.742443e-01
## nparr86 -1.660955e-02 -5.526170e-03 -8.225896e-03 -1.008764e-01
## pcnv 3.581341e-02 5.444629e-02 4.156555e-02 -2.357770e-03
## avgsen 1.230628e+01 1.500667e+01 1.609519e+00 -6.026632e-01
## tottime 1.500667e+01 2.122463e+01 2.534220e+00 -9.047332e-01
## ptime86 1.609519e+00 2.534220e+00 3.802698e+00 -8.352144e-01
## qemp86 -6.026632e-01 -9.047332e-01 -8.352144e-01 2.593479e+00
## inc86 -2.239276e+01 -3.059716e+01 -2.079179e+01 7.637296e+01
## durat 4.595040e-01 5.909305e-01 -2.118950e-01 -3.600754e+00
## black 1.540100e-01 1.928002e-01 5.287758e-02 -9.429629e-02
## hispan 1.848381e-02 3.965488e-02 4.126891e-02 2.204357e-02
## born60 2.070262e-02 3.308103e-02 6.053564e-03 1.397971e-04
## pcnvsq -2.601453e-02 -3.006153e-02 2.738059e-04 3.174017e-02
## pt86sq 1.660723e+01 2.668467e+01 4.232617e+01 -8.835169e+00
## inc86sq -3.388175e+03 -4.490433e+03 -2.875507e+03 1.168134e+04
## inc86 durat black hispan
## narr86 -1.087386e+01 3.258383e-01 4.716108e-02 0.018791712
## nfarr86 -6.920243e+00 2.845172e-01 3.470625e-02 0.004624473
## nparr86 -4.520936e+00 1.397318e-01 1.795282e-02 -0.002725485
## pcnv -2.340928e-01 -4.177687e-02 -9.599325e-03 0.001663809
## avgsen -2.239276e+01 4.595040e-01 1.540100e-01 0.018483813
## tottime -3.059716e+01 5.909305e-01 1.928002e-01 0.039654878
## ptime86 -2.079179e+01 -2.118950e-01 5.287758e-02 0.041268911
## qemp86 7.637296e+01 -3.600754e+00 -9.429629e-02 0.022043568
## inc86 4.439186e+03 -1.052642e+02 -3.600196e+00 0.021197421
## durat -1.052642e+02 2.122503e+01 1.502738e-01 -0.080530857
## black -3.600196e+00 1.502738e-01 1.351970e-01 -0.035070794
## hispan 2.119742e-02 -8.053086e-02 -3.507079e-02 0.170321034
## born60 2.598847e+00 9.045656e-03 1.773970e-03 -0.002203856
## pcnvsq 1.111484e+00 -9.259198e-02 -1.222185e-02 -0.003964578
## pt86sq -2.148409e+02 -4.555568e+00 4.909789e-01 0.473180159
## inc86sq 9.675870e+05 -1.588365e+04 -5.856862e+02 -37.252521778
## born60 pcnvsq pt86sq inc86sq
## narr86 -1.011411e-02 -3.608492e-02 -1.138845e+00 -1.840629e+03
## nfarr86 -5.724582e-03 -2.186514e-02 -5.880905e-01 -1.118720e+03
## nparr86 -2.936319e-03 -8.664177e-03 -3.125213e-01 -7.635090e+02
## pcnv 8.981751e-03 1.486792e-01 4.289044e-01 1.207330e+01
## avgsen 2.070262e-02 -2.601453e-02 1.660723e+01 -3.388175e+03
## tottime 3.308103e-02 -3.006153e-02 2.668467e+01 -4.490433e+03
## ptime86 6.053564e-03 2.738059e-04 4.232617e+01 -2.875507e+03
## qemp86 1.397971e-04 3.174017e-02 -8.835169e+00 1.168134e+04
## inc86 2.598847e+00 1.111484e+00 -2.148409e+02 9.675870e+05
## durat 9.045656e-03 -9.259198e-02 -4.555568e+00 -1.588365e+04
## black 1.773970e-03 -1.222185e-02 4.909789e-01 -5.856862e+02
## hispan -2.203856e-03 -3.964578e-03 4.731802e-01 -3.725252e+01
## born60 2.311975e-01 6.834041e-03 -8.362096e-03 7.157086e+02
## pcnvsq 6.834041e-03 1.526733e-01 5.107245e-03 2.370742e+02
## pt86sq -8.362096e-03 5.107245e-03 4.877843e+02 -2.942376e+04
## inc86sq 7.157086e+02 2.370742e+02 -2.942376e+04 2.676901e+08

Você também pode gostar