-
Notifications
You must be signed in to change notification settings - Fork 0
/
aula16.R
62 lines (50 loc) · 1.79 KB
/
aula16.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
# Exploratory analysis
# Load the packages (tidyverse provides %>%, group_by() and summarise() used below)
library(tidyverse)
# Read the data set
# NOTE(review): the file name looks misspelled ("studentes...") - confirm it
# matches the CSV that is actually on disk.
df <- read.csv('studentesperformance.csv')
# Understand the data: per-column summary statistics, then column types
df %>%
  summary()
str(df)
# Convert the categorical variables to factors.
# read.csv() uses check.names = TRUE by default, so header characters that are
# not valid in an R name (spaces, "/") are replaced with dots; the columns are
# therefore addressed by their dotted names here.
categorical_cols <- c(
  'gender',
  'race.ethnicity',
  'parental.level.of.education',
  'lunch',
  'test.preparation.course'
)
df[categorical_cols] <- lapply(df[categorical_cols], as.factor)
# Rename the variables to make the analysis easier.
# Print the current names first so the positional mapping can be checked.
colnames(df)
# One new name per column, in the existing column order (8 columns).
colnames(df) <- c(
  'gender', 'race', 'parental_level_education', 'lunch',
  'preparation', 'math_score', 'reading_score', 'writing_score'
)
# Mean math, writing and reading scores for each level of a grouping column.
#
# data:      data frame containing math_score, writing_score and reading_score.
# group_var: unquoted name of the column to group by.
# Returns the summarise() result: one row per group with the columns
# media_math, media_writing and media_reading.
summarise_scores_by <- function(data, group_var) {
  data %>%
    # {{ }} forwards the unquoted column name into group_by()
    group_by({{ group_var }}) %>%
    summarise(
      media_math = mean(math_score),
      media_writing = mean(writing_score),
      media_reading = mean(reading_score)
    )
}

# Summarise the data by gender
summarise_scores_by(df, gender)
# Summarise the data by race
summarise_scores_by(df, race)
# Summarise the data by parental_level_education
summarise_scores_by(df, parental_level_education)
# Summarise the data by lunch
summarise_scores_by(df, lunch)
# Summarise the data by preparation
summarise_scores_by(df, preparation)