Lectura de datos

Se leen los datos saeraq.Rdata, que provienen del fichero raq.dat utilizado en (A. Field, Miles, and Field 2012) (disponible en la web del libro).

load( "saeraq.RData" )

Descriptivos con paquete `tables`

Se realizan descriptivos de cada variable según sexo y origen con el paquete tables (Murdoch (2016)).

# library( tables )
opt <- booktabs()  # booktabs para las tablas

# Función para imprimir tablas en latex
tablaLatex <- function( tabla, caption = NULL ){
  cat( '\\begin{table} \\centering\n' )
  if( !is.null( caption ) ) cat( paste0( '\\caption{', caption, '}\n' ) )
  latex( tt )
  cat( '\\end{table}' )
}

Variable `actividadS`

tt <- tabular( ( Sexo = sexo ) + ( Total = 1 ) ~ ( `Actividad S` = actividadS ) +
                 ( Total = 1 ), data = df )

# tablaLatex( tt, caption = "Variable \\texttt{actividadS} según \\texttt{sexo}." )
html( tt, options = htmloptions( HTMLcaption = "Variable actividadS según sexo.", pad = TRUE ) )

Variable actividadS según sexo.
	Actividad S
Sexo	Nada	Poco	Mucho	Muchísimo	Total
Mujer	466	487	509	465	1927
Hombre	147	171	160	166	644
Total	613	658	669	631	2571

tt <- tabular( ( Origen = origen ) + ( Total = 1 ) ~ ( `Actividad S` = actividadS ) +
                 ( Total = 1 ), data = df )

# tablaLatex( tt, caption = "Variable \\texttt{actividadS} según \\texttt{origen}." )
html( tt, options = htmloptions( HTMLcaption = "Variable actividadS según origen.", pad = TRUE ) )

Variable actividadS según origen.
	Actividad S
Origen	Nada	Poco	Mucho	Muchísimo	Total
Albacete	288	282	308	300	1178
Murcia	263	286	292	271	1112
Helsinki	62	90	69	60	281
Total	613	658	669	631	2571

tt <- tabular( ( Sexo = sexo ) * ( Origen = origen ) + ( Total = 1 ) ~
                 ( `Actividad S` = actividadS ) + ( Total = 1 ), data = df )

# tablaLatex( tt, caption = "Variable \\texttt{actividadS} según \\texttt{origen} y \\texttt{sexo}." )
html( tt, options = htmloptions( HTMLcaption = "Variable actividadS según origen y sexo.", pad = TRUE ) )

Variable actividadS según origen y sexo.
		Actividad S
Sexo	Origen	Nada	Poco	Mucho	Muchísimo	Total
Mujer	Albacete	212	206	238	221	877
	Murcia	205	210	220	197	832
	Helsinki	49	71	51	47	218
Hombre	Albacete	76	76	70	79	301
	Murcia	58	76	72	74	280
	Helsinki	13	19	18	13	63
	Total	613	658	669	631	2571

Variable `ingresos`

ic1 <- function(x){
  mean( x ) - qt( 0.975, df = length( x ) - 1 ) * sd( x ) / sqrt( length( x ) ) 
}

ic2 <- function(x){
  mean( x ) + qt( 0.975, df = length( x ) - 1 ) * sd( x ) / sqrt( length( x ) ) 
}

tt <- tabular( ( Sexo = sexo ) + ( Origen = origen ) ~  ( Ingresos = ingresos ) *
                 ( ic1 + mean + sd + ic2 + median ) + ( Total = 1 ), data = df )

# tablaLatex( tt, caption = "Variable \\texttt{ingresos} según \\texttt{origen} y \\texttt{sexo}." )
html( tt, options = htmloptions( HTMLcaption = "Variable ingresos según origen y sexo.", pad = TRUE ) )

Variable ingresos según origen y sexo.
		Ingresos
		ic1	mean	sd	ic2	median	Total
Sexo	Mujer	29262	29670	9129	30078	25906	1927
	Hombre	28982	29679	9000	30375	31628	644
Origen	Albacete	28917	29435	9059	29953	24651	1178
	Murcia	29311	29849	9143	30387	32055	1112
	Helsinki	28901	29965	9066	31030	32088	281

tt <- tabular( ( Sexo = sexo ) * ( Origen = origen ) + ( Total = 1 ) ~
                 ( Ingresos = ingresos ) * ( ic1 + mean + sd + ic2 + median ) +
                 ( Total = 1 ), data = df )

# tablaLatex( tt, caption = "Variable \\texttt{ingresos} según \\texttt{origen} y \\texttt{sexo}." )
html( tt, options = htmloptions( HTMLcaption = "Variable ingresos según origen y sexo.", pad = TRUE ) )

Variable ingresos según origen y sexo.
		Ingresos
Sexo	Origen	ic1	mean	sd	ic2	median	Total
Mujer	Albacete	28667	29267	9046	29866	24046	877
	Murcia	29181	29807	9201	30433	31833	832
	Helsinki	29552	30769	9121	31987	34367	218
Hombre	Albacete	28894	29925	9094	30957	32715	301
	Murcia	28919	29975	8983	31032	33033	280
	Helsinki	25078	27182	8357	29287	23057	63
	Total	29320	29672	9095	30024	27771	2571

Variable `nivelIngles`

tt <- tabular( ( Sexo = sexo ) + ( Total = 1 ) ~ ( `Nivel de inglés` = nivelIngles ) +
                 ( Total = 1 ), data = df )

# tablaLatex( tt, caption = "Variable \\texttt{nivelIngles} según \\texttt{sexo}." )
html( tt, options = htmloptions( HTMLcaption = "Variable nivelIngles según sexo.", pad = TRUE ) )

Variable nivelIngles según sexo.
	Nivel de inglés
Sexo	Nulo	CasiNulo	A1	A2	B1	B2	C1	C2	IsabelII	Shakespeare	Total
Mujer	227	210	343	345	354	278	109	56	3	2	1927
Hombre	70	79	108	110	119	99	36	23	0	0	644
Total	297	289	451	455	473	377	145	79	3	2	2571

tt <- tabular( ( Origen = origen ) + ( Total = 1 ) ~ ( `Nivel de inglés` = nivelIngles ) +
                 ( Total = 1 ), data = df )

# tablaLatex( tt, caption = "Variable \\texttt{nivelIngles} según \\texttt{origen}." )
html( tt, options = htmloptions( HTMLcaption = "Variable nivelIngles según origen.", pad = TRUE ) )

Variable nivelIngles según origen.
	Nivel de inglés
Origen	Nulo	CasiNulo	A1	A2	B1	B2	C1	C2	IsabelII	Shakespeare	Total
Albacete	130	130	204	212	208	180	71	43	0	0	1178
Murcia	132	130	194	187	215	157	63	29	3	2	1112
Helsinki	35	29	53	56	50	40	11	7	0	0	281
Total	297	289	451	455	473	377	145	79	3	2	2571

tt <- tabular( (Sexo = sexo ) * ( Origen = origen ) + ( Total = 1 ) ~
                 ( `Nivel de inglés` = nivelIngles ) + ( Total = 1 ), data = df )

# tablaLatex( tt, caption = "Variable \\texttt{nivelIngles} según \\texttt{origen}." )
html( tt, options = htmloptions( HTMLcaption = "Variable nivelIngles según origen.", pad = TRUE ) )

Variable nivelIngles según origen.
		Nivel de inglés
Sexo	Origen	Nulo	CasiNulo	A1	A2	B1	B2	C1	C2	IsabelII	Shakespeare	Total
Mujer	Albacete	92	101	159	159	160	126	50	30	0	0	877
	Murcia	106	89	150	139	152	121	50	20	3	2	832
	Helsinki	29	20	34	47	42	31	9	6	0	0	218
Hombre	Albacete	38	29	45	53	48	54	21	13	0	0	301
	Murcia	26	41	44	48	63	36	13	9	0	0	280
	Helsinki	6	9	19	9	8	9	2	1	0	0	63
	Total	297	289	451	455	473	377	145	79	3	2	2571

Descriptivos con paquete `likert`

Se realizan gráficos descriptivos de los datos agrupando por origen o sexo con el paquete likert (Bryer and Speerschneider (2015)).

# library( likert )
dfLikert <- df[ , grep( "^Q", colnames( df ) ) ]
colnames( dfLikert ) <- dicc[ grep( "^Q", dicc$item ), "spanish" ]

bloque1 <- 1:8
bloque2 <- 9:17
bloque3 <- 18:23

itemsO1 <- likert( items = dfLikert[ , bloque1 ], grouping = df$origen )
itemsO2 <- likert( items = dfLikert[ , bloque2 ], grouping = df$origen )
itemsO3 <- likert( items = dfLikert[ , bloque3 ], grouping = df$origen )

itemsS1 <- likert( items = dfLikert[ , bloque1 ], grouping = df$sexo )
itemsS2 <- likert( items = dfLikert[ , bloque2 ], grouping = df$sexo )
itemsS3 <- likert( items = dfLikert[ , bloque3 ], grouping = df$sexo )

Según `origen`

plot( itemsO1 )

Gráfico de barras según origen de los ítems 1 a 8.

plot( itemsO1, type = "density" )

Gráfico de densidad según origen de los ítems 1 a 8.

Según `sexo`

plot( itemsS1 )

Gráfico de barras según sexo de los ítems 1 a 8.

plot( itemsS1, type = "density" )

Gráfico de densidad según sexo de los ítems 1 a 8.

Referencias y bibliografía

Bryer, Jason, and Kimberly Speerschneider. 2015. Likert: Functions to Analyze and Visualize Likert Type Items. http://CRAN.R-project.org/package=likert.

Field, Andy, Jeremy Miles, and Zoe Field. 2012. Discovering Statistics Using R. 1st edition. Sage Publications Ltd.

Murdoch, Duncan. 2016. Tables: Formula-Driven Table Generation. http://CRAN.R-project.org/package=tables.

T2. Taller encuestas. Descriptivos 2³

VIII Jornadas R Albacete 2016²

Álvaro Hernández Vicente, Elvira Ferre Jaén, Antonio José Perán Orcajada, Ana Belén Marín Valverde, Antonio Maurandi López¹

17 de noviembre de 2016

Lectura de datos

Descriptivos con paquete `tables`

Variable `actividadS`

Variable `ingresos`

Variable `nivelIngles`

Descriptivos con paquete `likert`

Según `origen`

Según `sexo`

Referencias y bibliografía

T2. Taller encuestas. Descriptivos 23

VIII Jornadas R Albacete 20162

Álvaro Hernández Vicente, Elvira Ferre Jaén, Antonio José Perán Orcajada, Ana Belén Marín Valverde, Antonio Maurandi López1

17 de noviembre de 2016

Lectura de datos

Descriptivos con paquete tables

Variable actividadS

Variable ingresos

Variable nivelIngles

Descriptivos con paquete likert

Según origen

Según sexo

Referencias y bibliografía

T2. Taller encuestas. Descriptivos 2³

VIII Jornadas R Albacete 2016²

Álvaro Hernández Vicente, Elvira Ferre Jaén, Antonio José Perán Orcajada, Ana Belén Marín Valverde, Antonio Maurandi López¹

Descriptivos con paquete `tables`

Variable `actividadS`

Variable `ingresos`

Variable `nivelIngles`

Descriptivos con paquete `likert`

Según `origen`

Según `sexo`