Rmarkdown RMD

---
title: "Trabajo final Corte 1"

author: "Juan David Mortigo"
date: "2024-02-26"
output: html_document
---
## Primero cargamos los paquetes
```{r}
library(dplyr)
library(descriptr)
library(ggplot2)
library(datos)
library(fdth)
```
## luego sacamos una muestra y sembramos una semilla
```{r}
# Keep only the complete rows of the credit data set.
ola <- stats::na.omit(datos_credito)

# Fix the random seed so the same rows are drawn on every run, then take
# 80 rows without replacement and keep the first 14 columns.
set.seed(2210)
muestra_credito <- ola[sample(nrow(ola), size = 80), seq_len(14)]

```
## sacamos tablas de estado civil y vivienda relacionadas y luego como data frame
```{r}
# Two-way table: marital status (rows) against housing type (columns).
estcivil.vivienda <- table(
  muestra_credito[["EstadoCivil"]],
  muestra_credito[["Vivienda"]]
)

# One-way frequency tables for each variable.
estadocivil <- table(muestra_credito[["EstadoCivil"]])
vivienda <- table(muestra_credito[["Vivienda"]])

# Data-frame versions of the one-way tables (columns Var1 and Freq), which
# are what the ggplot2 charts further down work from.
estadocivil1 <- as.data.frame(estadocivil)
vivienda1 <- as.data.frame(vivienda)

# Show every object, in the same order they are built.
estcivil.vivienda
estadocivil
vivienda
estadocivil1
vivienda1
```
## diagrama de barras de estado civil
```{r}
# Bar chart of the marital-status frequencies.
# Give the frequency table descriptive column names for plotting.
estadocivil2 <- rename(estadocivil1, estadoC = Var1, Frecuencia = Freq)

# Upper y limit: never below the original 75, but grows with the data so a
# tall bar (and the label drawn above it) is not dropped by ylim().
limite_y_estado <- max(75, ceiling(max(estadocivil2$Frecuencia) * 1.15))

barras_estado <- ggplot(
  estadocivil2,
  aes(x = estadoC, y = Frecuencia, fill = estadoC)
) +
  geom_bar(stat = "identity") +
  # Label each bar with its count; the category is already shown on the
  # x axis and in the legend.
  geom_text(aes(label = Frecuencia), vjust = -1, colour = "black") +
  ylim(c(0, limite_y_estado))
barras_estado
```
## Asignamos colores y hacemos grafico de torta

```{r}
# Pie chart of the marital-status frequencies.
# One colour per category of the frequency table.
colores <- hcl.colors(length(estadocivil))
colores

# Display labels for the slices.
# NOTE(review): these are assumed to follow the same order as
# names(estadocivil) -- confirm against the printed table.
etiquetas_estado <- c("Divorciado", "casado", "Separado", "soltero", "viudo")

# pie() silently leaves slices unlabelled when there are fewer labels than
# slices, so fail loudly if the counts ever disagree.
stopifnot(length(etiquetas_estado) == length(estadocivil))

# pie() is called for its side effect only (it returns NULL invisibly), so
# its result is not stored.
pie(
  estadocivil,
  main = "Estado Civil",
  radius = 1,
  col = colores,
  labels = etiquetas_estado
)
```
## finalmente hacemos el grafico de donas

```{r}
# Donut chart of the marital-status frequencies.
# hsize is the x position of the stacked bar; because xlim() starts well
# below it, the polar transform leaves an empty centre.
hsize <- 2
df <- mutate(estadocivil1, x = hsize)

ggplot(df, aes(x = hsize, y = Freq, fill = Var1)) +
  geom_col(color = "black") +
  # Count labels centred inside each segment.
  geom_label(
    aes(label = Freq),
    position = position_stack(vjust = 0.5),
    show.legend = FALSE
  ) +
  coord_polar(theta = "y") +
  xlim(c(0.2, hsize + 0.5)) +
  scale_fill_brewer(palette = "GnBu") +
  guides(fill = guide_legend(title = "Estado Civil")) +
  theme(panel.background = element_rect(fill = "pink"))
```
# Hacemos el mismo proceso anterior con vivienda

```{r}
# Bar chart of the housing-type frequencies.
# Give the frequency table descriptive column names for plotting.
vivienda2 <- rename(vivienda1, Vivienda = Var1, Frecuencia = Freq)

# Upper y limit: never below the original 50, but grows with the data so a
# tall bar (and the label drawn above it) is not dropped by ylim().
limite_y_vivienda <- max(50, ceiling(max(vivienda2$Frecuencia) * 1.15))

barras_vivienda <- ggplot(
  vivienda2,
  aes(x = Vivienda, y = Frecuencia, fill = Vivienda)
) +
  geom_bar(stat = "identity") +
  # Label each bar with its count; the category is already shown on the
  # x axis and in the legend.
  geom_text(aes(label = Frecuencia), vjust = -1, colour = "black") +
  ylim(c(0, limite_y_vivienda))
barras_vivienda
# Pie chart of the housing-type frequencies.
# One colour per category of the frequency table.
colores <- hcl.colors(length(vivienda))

# Display labels for the slices.
# NOTE(review): these are assumed to follow the same order as
# names(vivienda) -- confirm against the printed table.
etiquetas_vivienda <- c(
  "Ignorar", "Otra", "Propietario", "Padres", "Privado", "Alquila"
)

# pie() silently leaves slices unlabelled when there are fewer labels than
# slices, so fail loudly if the counts ever disagree.
stopifnot(length(etiquetas_vivienda) == length(vivienda))

# pie() is called for its side effect only (it returns NULL invisibly), so
# its result is not stored.
pie(
  vivienda,
  main = "Vivienda",
  radius = 1,
  col = colores,
  labels = etiquetas_vivienda
)
# Donut chart of the housing-type frequencies.
# hsize is the x position of the stacked bar; because xlim() starts well
# below it, the polar transform leaves an empty centre.
hsize <- 2
df2 <- mutate(vivienda1, x = hsize)

ggplot(df2, aes(x = hsize, y = Freq, fill = Var1)) +
  geom_col(color = "black") +
  # Count labels centred inside each segment.
  geom_label(
    aes(label = Freq),
    position = position_stack(vjust = 0.5),
    show.legend = FALSE
  ) +
  coord_polar(theta = "y") +
  xlim(c(0.2, hsize + 0.5)) +
  scale_fill_brewer(palette = "GnBu") +
  guides(fill = guide_legend(title = "Vivienda")) +
  theme(panel.background = element_rect(fill = "pink"))
```
## Creamos una tabla relacionando los ingresos con el trabajo

```{r}
# Pair the income column (x) with the job column (y) of the sample in a
# two-column data frame and display it.
x <- muestra_credito[["Ingresos"]]
y <- muestra_credito[["Trabajo"]]
df3 <- data.frame(x, y)
df3
```
## posteriormente lo graficamos en un grafico de caja

```{r}
# Box plot of df3: column x on the x axis (labelled "Ingresos") and column y
# on the y axis (labelled "Trabajo").
p <- ggplot(df3, aes(x = x, y = y)) +
  # End caps for the whiskers. The width is measured along the grouping
  # axis, where neighbouring categories are one unit apart, so it must stay
  # well below 1 (the previous value of 5 stretched the caps across groups).
  stat_boxplot(geom = "errorbar", width = 0.25) +
  geom_boxplot(
    fill = "dodgerblue1",
    colour = "black",
    # alpha must lie in [0, 1]; 1 means fully opaque (previously 5).
    alpha = 1,
    outlier.colour = "tomato2"
  ) +
  labs(x = "Ingresos", y = "Trabajo") +
  theme(
    axis.title.x = element_text(size = 15, color = "blue", face = "bold"),
    axis.title.y = element_text(size = 15, color = "red", face = "italic")
  )
p
```
## Creamos una tabla de frecuencias para precio y graficamos su histograma y su polígono de frecuencias
```{r}
# Frequency distribution table for the Precio column of the sample.
tabla1 <- fdt(muestra_credito$Precio)

# Histogram drawn from the table (plot type "rfh").
plot(tabla1, col = "cadetblue", type = "rfh", main = "Histograma del precio")

# Frequency polygon drawn from the same table (plot type "fp"). The title is
# kept on a single line; it was previously split across lines, which put
# line breaks inside the plotted title.
grafico_poligono <- plot(
  tabla1,
  col = "cadetblue",
  type = "fp",
  main = "grafico de poligono del precio"
)
```
# Hacemos un análisis cuantitativo completo para 3 variables numéricas resumidas en una sola tabla.
### empezando por gastos
```{r}
# Descriptive statistics for the Gastos column of the sample, collected in a
# one-column data frame. Every table entry comes from the values computed
# here, so the table cannot drift from the data.
gastos <- muestra_credito$Gastos

# Central tendency.
promedio <- sum(gastos) / length(gastos)
gast.ord <- sort(x = gastos, decreasing = FALSE)
mediana <- median(gastos)
# NOTE(review): assumes ds_mode() returns a single value -- confirm.
moda <- ds_mode(gastos)

# Dispersion.
rango <- range(gastos, na.rm = FALSE)
varianza_gastos <- round(var(gastos), 5)
desvest_gastos <- round(sd(gastos), 5)
coefvar_gastos <- round(ds_cvar(gastos), 3)

# Quartiles (type 6), computed once and then split into one object each.
cuartiles_gastos <- quantile(
  x = gastos,
  probs = c(0.25, 0.5, 0.75, 1),
  type = 6
)
cuartil1_gastos <- cuartiles_gastos[1]
cuartil2_gastos <- cuartiles_gastos[2]
cuartil3_gastos <- cuartiles_gastos[3]
cuartil4_gastos <- cuartiles_gastos[4]

# Summary table: the range row holds max - min and its label shows both ends.
tabla.gastos <- matrix(
  c(
    promedio, mediana, moda, diff(rango),
    varianza_gastos, desvest_gastos, coefvar_gastos,
    unname(cuartiles_gastos)
  ),
  nrow = 11
)
rownames(tabla.gastos) <- c(
  "Promedio", "Mediana", "Moda",
  paste0("rango(", rango[1], "-", rango[2], ")"),
  "varianza", "desviacion estandar", "coeficiente de variacion",
  "cuartil 1", "cuartil 2", "cuartil 3", "cuartil 4"
)
colnames(tabla.gastos) <- c("Gastos")
tabla.gastos <- data.frame(tabla.gastos)

tabla.gastos
```
### seguimos con ingresos

```{r}
# Descriptive statistics for the Ingresos column of the sample, collected in
# a one-column data frame. Every table entry comes from the values computed
# here, so the table cannot drift from the data.
ingresos <- muestra_credito$Ingresos

# Central tendency.
promedioi <- sum(ingresos) / length(ingresos)
medianai <- median(ingresos)
# NOTE(review): assumes ds_mode() returns a single value -- confirm.
modai <- ds_mode(ingresos)

# Dispersion.
rangoi <- range(ingresos, na.rm = FALSE)
varianza_ingresos <- round(var(ingresos), 5)
desvest_ingresos <- round(sd(ingresos), 5)
coefvar_ingresos <- round(ds_cvar(ingresos), 3)

# Quartiles (type 6), computed once and then split into one object each.
cuartiles_ingresos <- quantile(
  x = ingresos,
  probs = c(0.25, 0.5, 0.75, 1),
  type = 6
)
cuartil1_ingresos <- cuartiles_ingresos[1]
cuartil2_ingresos <- cuartiles_ingresos[2]
cuartil3_ingresos <- cuartiles_ingresos[3]
cuartil4_ingresos <- cuartiles_ingresos[4]

# Summary table: the range row holds max - min and its label shows both ends.
tabla.ingresos <- matrix(
  c(
    promedioi, medianai, modai, diff(rangoi),
    varianza_ingresos, desvest_ingresos, coefvar_ingresos,
    unname(cuartiles_ingresos)
  ),
  nrow = 11
)
# The row-name vector was previously left unclosed (and its range label was
# split across lines), which made the whole chunk fail to parse.
rownames(tabla.ingresos) <- c(
  "Promedio", "Mediana", "Moda",
  paste0("rango(", rangoi[1], "-", rangoi[2], ")"),
  "varianza", "desviacion estandar", "coeficiente de variacion",
  "cuartil 1", "cuartil 2", "cuartil 3", "cuartil 4"
)
colnames(tabla.ingresos) <- c("ingresos")
tabla.ingresos <- data.frame(tabla.ingresos)

tabla.ingresos
```
### y finalmente con cantidad

```{r}
# Descriptive statistics for the Cantidad column of the sample, collected in
# a one-column data frame. Every table entry comes from the values computed
# here, so the table cannot drift from the data.
cantidad <- muestra_credito$Cantidad

# Central tendency. The median gets its own name (medianac) so it no longer
# overwrites medianai, the median computed for income.
promedioc <- sum(cantidad) / length(cantidad)
medianac <- median(cantidad)
# NOTE(review): assumes ds_mode() returns a single value -- confirm.
modac <- ds_mode(cantidad)

# Dispersion.
rangoc <- range(cantidad, na.rm = FALSE)
varianza_cantidad <- round(var(cantidad), 5)
desvest_cantidad <- round(sd(cantidad), 5)
coefvar_cantidad <- round(ds_cvar(cantidad), 3)

# Quartiles (type 6), computed once and then split into one object each.
cuartiles_cantidad <- quantile(
  x = cantidad,
  probs = c(0.25, 0.5, 0.75, 1),
  type = 6
)
cuartil1_cantidad <- cuartiles_cantidad[1]
cuartil2_cantidad <- cuartiles_cantidad[2]
cuartil3_cantidad <- cuartiles_cantidad[3]
cuartil4_cantidad <- cuartiles_cantidad[4]

# Summary table: the range row holds max - min and its label shows both ends.
tabla.cantidad <- matrix(
  c(
    promedioc, medianac, modac, diff(rangoc),
    varianza_cantidad, desvest_cantidad, coefvar_cantidad,
    unname(cuartiles_cantidad)
  ),
  nrow = 11
)
# The row-name vector was previously left unclosed (and its range label was
# split across lines), which made the whole chunk fail to parse.
rownames(tabla.cantidad) <- c(
  "Promedio", "Mediana", "Moda",
  paste0("rango(", rangoc[1], "-", rangoc[2], ")"),
  "varianza", "desviacion estandar", "coeficiente de variacion",
  "cuartil 1", "cuartil 2", "cuartil 3", "cuartil 4"
)
colnames(tabla.cantidad) <- c("cantidad")
tabla.cantidad <- data.frame(tabla.cantidad)

tabla.cantidad
```

Rmarkdown RMD

Cargado por

Copyright:

Formatos disponibles

Rmarkdown RMD

Cargado por

Información del documento

Título original

Derechos de autor

Formatos disponibles

Compartir este documento

Compartir o incrustar documentos

Opciones para compartir

¿Le pareció útil este documento?

¿Este contenido es inapropiado?

Copyright:

Formatos disponibles

Rmarkdown RMD

Cargado por

Copyright:

Formatos disponibles

---

title: "Trabajo final Corte 1"

muestra_credito <- ola[sample(nrow(ola),size=80),1:14]

estadocivil <- table(muestra_credito$EstadoCivil)

vivienda <- table(muestra_credito$Vivienda)

estadocivil1 <- as.data.frame(estadocivil)

vivienda1 <- as.data.frame(vivienda)

barras_estado <- ggplot(estadocivil2, aes(x = estadoC, y = Frecuencia,

## Asignamos colores y hacemos grafico de torta

## finalmente hacemos el grafico de donas

df <- estadocivil1 %>%

ggplot(df, aes(x = hsize, y = Freq, fill= Var1)) +

# Hacemos el mismo proceso anterior con vivienda

barras_vivienda <- ggplot(vivienda2, aes(x = Vivienda, y = Frecuencia,

df2 <- vivienda1 %>%

ggplot(df2, aes(x = hsize, y = Freq, fill= Var1)) +

## Creamos una tabla relacionando los ingresos con el trabajo

## posteriormente lo graficamos en un grafico de caja

## creamos una tabla de frecuencias para precio y creamos su grafica de histograma

grafico_poligono <- plot(tabla1, col="cadetblue",type = "fp", main = "grafico de

# Hacemos un analisis cuantitativo completo para 3 variables numéricas resumidas en

promedio <- sum(gastos)/length(gastos)

gast.ord <- sort(x=gastos,decreasing = FALSE)

mediana <- median(gastos)

moda <- ds_mode(gastos)

rango <- range(gastos,na.rm = FALSE)

varianza_gastos <- round(var(gastos),5)

desvest_gastos <- round(sd(gastos),5)

coefvar_gastos <- round(ds_cvar(gastos),3)

cuartil1_gastos <- quantile(x = gastos,probs = c(0.25,0.5,0.75,1),type = 6)

cuartil1_gastos <- quantile(x = gastos,probs = c(0.25),type = 6)

cuartil3_gastos <- quantile(x = gastos,probs = c(0.75),type = 6)

cuartil4_gastos <- quantile(x = gastos,probs = c(1),type = 6)

rownames(tabla.gastos) <- c("Promedio","Mediana","Moda","rango(35-130)","varianza",

colnames(tabla.gastos) <- c("Gastos")

tabla.gastos <- data.frame(tabla.gastos)

### seguimos con ingresos

promedioi <- sum(ingresos)/length(ingresos)

medianai <- median(ingresos)

modai <- ds_mode(ingresos)

rangoi <- range(ingresos,na.rm = FALSE)

varianza_ingresos <- round(var(ingresos),5)

desvest_ingresos <- round(sd(ingresos),5)

coefvar_ingresos <- round(ds_cvar(ingresos),3)

cuartil1_ingresos <- quantile(x = ingresos,probs = c(0.25,0.5,0.75,1),type = 6)

cuartil1_ingresos <- quantile(x = ingresos,probs = c(0.25),type = 6)

cuartil2_ingresos <- quantile(x = ingresos,probs = c(0.5),type = 6)

cuartil3_ingresos <- quantile(x = ingresos,probs = c(0.75),type = 6)

cuartil4_ingresos <- quantile(x = ingresos,probs = c(1),type = 6)

rownames(tabla.ingresos) <- c("Promedio","Mediana","Moda","rango(38-

colnames(tabla.ingresos) <- c("ingresos")

tabla.ingresos <- data.frame(tabla.ingresos)

### y finalmente con cantidad

promedioc <- sum(cantidad)/length(cantidad)

medianai <- median(cantidad)

modac <- ds_mode(cantidad)

rangoc <- range(cantidad,na.rm = FALSE)

varianza_cantidad <- round(var(cantidad),5)

desvest_cantidad <- round(sd(cantidad),5)