-
Notifications
You must be signed in to change notification settings - Fork 2
/
education.R
80 lines (33 loc) · 1.82 KB
/
education.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
# Education-difference analysis: relates diff_in_education to a numeric
# relationship-quality score.
#
# The workspace is deliberately NOT cleared with rm(list = ls()): doing so
# silently deletes every object of whoever source()s this file. Run the
# script in a fresh R session when a clean environment is needed.

# Load the cleaned data set from CSV (path is relative to the working
# directory).
df <- read.csv("cleaned_df.csv")

# Distribution of the signed education difference.
hist(df$diff_in_education)
summary(df$diff_in_education)

# Numeric score taken from the second character of RELATIONSHIP_QUALITY.
# NOTE(review): presumably the labels look like "[5] Excellent" -- confirm.
# Any value whose second character is not a digit becomes NA (with a
# coercion warning).
df$relationship_val <- as.numeric(substr(df$RELATIONSHIP_QUALITY, 2, 2))

# Simple linear regression of the score on the signed difference.
summary(lm(relationship_val ~ diff_in_education, data = df))
# Magnitude of the education difference, ignoring its sign.
df[["abs_diff_in_education"]] <- abs(df$diff_in_education)

# Distribution of the absolute difference.
hist(df$abs_diff_in_education)
summary(df$abs_diff_in_education)

# Regress the relationship score on the absolute difference (all rows).
summary(lm(relationship_val ~ abs_diff_in_education, data = df))
# Repeat the histogram / summary / regression on progressively narrower
# subsets of rows, selected by the size of abs_diff_in_education.
#
# Each filter is wrapped in which(): indexing a data frame with a logical
# vector that contains NA inserts an all-NA row for every NA, whereas
# which() keeps only the rows where the condition is TRUE.

# Rows with any non-zero difference.
df_different_education <- df[which(df$abs_diff_in_education != 0), ]
hist(df_different_education$abs_diff_in_education)
summary(df_different_education$abs_diff_in_education)
summary(lm(relationship_val ~ abs_diff_in_education,
           data = df_different_education))

# Rows with a difference strictly greater than 4.
# NOTE(review): this cut-off is strict (>), while the 8 cut-off below and
# the "large" flag created later in the file use >= -- confirm which is
# intended.
df_large_different_education <- df[which(df$abs_diff_in_education > 4), ]
hist(df_large_different_education$abs_diff_in_education)
summary(df_large_different_education$abs_diff_in_education)
summary(lm(relationship_val ~ abs_diff_in_education,
           data = df_large_different_education))

# Rows with a difference of at least 8.
df_vlarge_different_education <- df[which(df$abs_diff_in_education >= 8), ]
hist(df_vlarge_different_education$abs_diff_in_education)
summary(df_vlarge_different_education$abs_diff_in_education)
summary(lm(relationship_val ~ abs_diff_in_education,
           data = df_vlarge_different_education))
# Diagnostics for the regression of relationship_val on
# abs_diff_in_education fitted to all rows of df.
fit <- lm(relationship_val ~ abs_diff_in_education, data = df)

# Normal Q-Q plot of the residuals with a reference line.
qqnorm(residuals(fit))
qqline(residuals(fit))

# Draw the plot(fit) diagnostic panels on a 2x2 grid. par() returns the
# previous values of the settings it changes, so keep them and restore them
# afterwards; otherwise the 2x2 layout leaks into every later plot on this
# device.
old_par <- par(mfrow = c(2, 2), mar = c(5, 4, 2, 1))
plot(fit)
par(old_par)
# Analysis of variance of relationship_val with RESPONDENT_YRSED and
# PARTNER_YRSED each treated as a categorical factor.

# Main effects only.
summary(
  aov(
    relationship_val ~ factor(RESPONDENT_YRSED) + factor(PARTNER_YRSED),
    data = df
  )
)

# Main effects plus their interaction.
summary(
  aov(
    relationship_val ~ factor(RESPONDENT_YRSED) * factor(PARTNER_YRSED),
    data = df
  )
)

# Next step: add a two-level label column marking rows whose absolute
# education difference is at least 4, then run a one-way ANOVA on it.
df[["large_4_diff_in_education"]] <- ifelse(
  df$abs_diff_in_education >= 4,
  "large",
  "not large"
)
summary(
  aov(relationship_val ~ factor(large_4_diff_in_education), data = df)
)