Académique Documents
Professionnel Documents
Culture Documents
Guilherme Fernandes
March 29, 2019
Exercício 1
library(faraway)
data(prostate)
head(prostate,n=10)
tail(prostate,n=10)
summary(prostate)
1
## Max. : 3.8210 Max. :6.108 Max. :79.00 Max. : 2.3263
## svi lcp gleason pgg45
## Min. :0.0000 Min. :-1.3863 Min. :6.000 Min. : 0.00
## 1st Qu.:0.0000 1st Qu.:-1.3863 1st Qu.:6.000 1st Qu.: 0.00
## Median :0.0000 Median :-0.7985 Median :7.000 Median : 15.00
## Mean :0.2165 Mean :-0.1794 Mean :6.753 Mean : 24.38
## 3rd Qu.:0.0000 3rd Qu.: 1.1786 3rd Qu.:7.000 3rd Qu.: 40.00
## Max. :1.0000 Max. : 2.9042 Max. :9.000 Max. :100.00
## lpsa
## Min. :-0.4308
## 1st Qu.: 1.7317
## Median : 2.5915
## Mean : 2.4784
## 3rd Qu.: 3.0564
## Max. : 5.5829
##Conjunto de histogramas
hist(prostate$lcavol)
Histogram of prostate$lcavol
20
15
Frequency
10
5
0
−1 0 1 2 3 4
prostate$lcavol
hist(prostate$lweight)
2
Histogram of prostate$lweight
40
30
Frequency
20
10
0
2 3 4 5 6
prostate$lweight
hist(prostate$age)
3
Histogram of prostate$age
30
25
20
Frequency
15
10
5
0
40 50 60 70 80
prostate$age
hist(prostate$lbph)
4
Histogram of prostate$lbph
40
30
Frequency
20
10
0
−1 0 1 2
prostate$lbph
hist(prostate$svi)
5
Histogram of prostate$svi
60
Frequency
40
20
0
prostate$svi
hist(prostate$lcp)
6
Histogram of prostate$lcp
40
30
Frequency
20
10
0
−1 0 1 2 3
prostate$lcp
hist(prostate$gleason)
7
Histogram of prostate$gleason
50
40
Frequency
30
20
10
0
prostate$gleason
hist(prostate$pgg45)
8
Histogram of prostate$pgg45
40
30
Frequency
20
10
0
0 20 40 60 80 100
prostate$pgg45
hist(prostate$lpsa)
9
Histogram of prostate$lpsa
40
30
Frequency
20
10
0
−1 0 1 2 3 4 5 6
prostate$lpsa
10
4
3
prostate$lcavol
2
1
0
−1
0 20 40 60 80 100
Index
plot(prostate$lweight)
11
6
prostate$lweight
5
4
3
0 20 40 60 80 100
Index
plot(prostate$age)
12
80
70
prostate$age
60
50
40
0 20 40 60 80 100
Index
plot(prostate$lbph)
13
2
prostate$lbph
1
0
−1
0 20 40 60 80 100
Index
plot(prostate$svi)
14
1.0
0.8
prostate$svi
0.6
0.4
0.2
0.0
0 20 40 60 80 100
Index
plot(prostate$lcp)
15
3
2
prostate$lcp
1
0
−1
0 20 40 60 80 100
Index
plot(prostate$gleason)
16
9.0
8.5
prostate$gleason
8.0
7.5
7.0
6.5
6.0
0 20 40 60 80 100
Index
plot(prostate$pgg45)
17
100
80
prostate$pgg45
60
40
20
0
0 20 40 60 80 100
Index
plot(prostate$lpsa)
18
5
4
prostate$lpsa
3
2
1
0
0 20 40 60 80 100
Index
##Conjunto de densidades
plot(density(prostate$lcavol))
19
density.default(x = prostate$lcavol)
0.30
0.20
Density
0.10
0.00
−2 0 2 4
N = 97 Bandwidth = 0.4249
plot(density(prostate$lweight))
20
density.default(x = prostate$lweight)
0.8
0.6
Density
0.4
0.2
0.0
2 3 4 5 6
N = 97 Bandwidth = 0.1352
plot(density(prostate$age))
21
density.default(x = prostate$age)
0.06
0.04
Density
0.02
0.00
40 50 60 70 80
N = 97 Bandwidth = 2.152
plot(density(prostate$lbph))
22
density.default(x = prostate$lbph)
0.30
0.20
Density
0.10
0.00
−3 −2 −1 0 1 2 3 4
N = 97 Bandwidth = 0.523
plot(density(prostate$svi))
23
density.default(x = prostate$svi)
2.0
1.5
Density
1.0
0.5
0.0
N = 97 Bandwidth = 0.1492
plot(density(prostate$lcp))
24
density.default(x = prostate$lcp)
0.4
0.3
Density
0.2
0.1
0.0
−2 0 2 4
N = 97 Bandwidth = 0.504
plot(density(prostate$gleason))
25
density.default(x = prostate$gleason)
0.8
0.6
Density
0.4
0.2
0.0
6 7 8 9
N = 97 Bandwidth = 0.2603
plot(density(prostate$pgg45))
26
density.default(x = prostate$pgg45)
0.020
0.015
Density
0.010
0.005
0.000
0 50 100
N = 97 Bandwidth = 10.17
plot(density(prostate$lpsa))
27
density.default(x = prostate$lpsa)
0.3
Density
0.2
0.1
0.0
0 2 4 6
N = 97 Bandwidth = 0.3564
28
3
2
1
0
−1
barplot(sort(prostate$lweight))
29
6
5
4
3
2
1
0
barplot(sort(prostate$age))
30
60
40
20
0
barplot(sort(prostate$lbph))
31
2.0
1.0
0.0
−1.0
barplot(sort(prostate$svi))
32
1.0
0.8
0.6
0.4
0.2
0.0
barplot(sort(prostate$lcp))
33
2
1
0
−1
barplot(sort(prostate$gleason))
34
8
6
4
2
0
barplot(sort(prostate$pgg45))
35
100
80
60
40
20
0
barplot(sort(prostate$lpsa))
36
5
4
3
2
1
0
# Simple linear regression of lcavol on lweight. The fit must exist before
# abline() below can draw it; the echoed coefficients identify the formula.
linear1<-lm(prostate$lcavol~prostate$lweight)
coef(linear1)
## (Intercept) prostate$lweight
## -0.3328410 0.4607156
plot(prostate$lcavol~prostate$lweight)
abline(linear1,col=2)
37
4
3
prostate$lcavol
2
1
0
−1
3 4 5 6
prostate$lweight
linear2<-lm(prostate$lcavol~prostate$age)
coef(linear2)
## (Intercept) prostate$age
## -0.92485702 0.03561938
plot(prostate$lcavol~prostate$age)
abline(linear2,col=3)
38
4
3
prostate$lcavol
2
1
0
−1
40 50 60 70 80
prostate$age
linear3<-lm(prostate$lcavol~prostate$lbph)
coef(linear3)
## (Intercept) prostate$lbph
## 1.34777980 0.02221871
plot(prostate$lcavol~prostate$lbph)
abline(linear3,col=4)
39
4
3
prostate$lcavol
2
1
0
−1
−1 0 1 2
prostate$lbph
linear4<-lm(prostate$lcavol~prostate$lcp)
coef(linear4)
## (Intercept) prostate$lcp
## 1.4521105 0.5692395
plot(prostate$lcavol~prostate$lcp)
abline(linear4,col=5)
40
4
3
prostate$lcavol
2
1
0
−1
−1 0 1 2 3
prostate$lcp
linear5<-lm(prostate$lcavol~prostate$pgg45)
coef(linear5)
## (Intercept) prostate$pgg45
## 0.90816923 0.01812199
plot(prostate$lcavol~prostate$pgg45)
abline(linear5,col=6)
41
4
3
prostate$lcavol
2
1
0
−1
0 20 40 60 80 100
prostate$pgg45
linear6<-lm(prostate$lcavol~prostate$lpsa)
coef(linear6)
## (Intercept) prostate$lpsa
## -0.5085802 0.7499191
plot(prostate$lcavol~prostate$lpsa)
abline(linear6,col=7)
42
4
3
prostate$lcavol
2
1
0
−1
0 1 2 3 4 5
prostate$lpsa
Exercício 2
library(faraway)
data(divusa)
head(divusa,n=10)
tail(divusa,n=10)
43
## 70 1989 20.4 5.3 57.4 54.2 69.2 8.6307
## 71 1990 20.9 5.6 57.5 54.5 70.9 8.1924
## 72 1991 20.9 6.8 57.4 54.2 69.6 7.8744
## 73 1992 21.2 7.5 57.8 53.3 68.9 7.0862
## 74 1993 20.5 6.9 57.9 52.3 67.6 6.6145
## 75 1994 20.5 6.1 58.8 51.5 66.7 6.1865
## 76 1995 19.8 5.6 58.9 50.8 65.6 5.7770
## 77 1996 19.5 5.4 59.3 49.7 65.3 5.5488
summary(divusa)
##Conjunto de histogramas
hist(divusa$year)
44
Histogram of divusa$year
10
8
Frequency
6
4
2
0
divusa$year
hist(divusa$divorce)
45
Histogram of divusa$divorce
15
Frequency
10
5
0
10 15 20
divusa$divorce
hist(divusa$unemployed)
46
Histogram of divusa$unemployed
40
30
Frequency
20
10
0
0 5 10 15 20 25
divusa$unemployed
hist(divusa$femlab)
47
Histogram of divusa$femlab
10 12 14
Frequency
8
6
4
2
0
20 30 40 50 60
divusa$femlab
hist(divusa$marriage)
48
Histogram of divusa$marriage
30
25
20
Frequency
15
10
5
0
40 60 80 100 120
divusa$marriage
hist(divusa$birth)
49
Histogram of divusa$birth
20
15
Frequency
10
5
0
divusa$birth
hist(divusa$military)
50
Histogram of divusa$military
40
30
Frequency
20
10
0
0 20 40 60 80
divusa$military
51
1980
divusa$year
1960
1940
1920
0 20 40 60 80
Index
plot(divusa$divorce)
52
20
divusa$divorce
15
10
0 20 40 60 80
Index
plot(divusa$unemployed)
53
25
20
divusa$unemployed
15
10
5
0 20 40 60 80
Index
plot(divusa$femlab)
54
60
50
divusa$femlab
40
30
0 20 40 60 80
Index
plot(divusa$marriage)
55
110
divusa$marriage
90
80
70
60
50
0 20 40 60 80
Index
plot(divusa$birth)
56
100 110 120
divusa$birth
90
80
70
0 20 40 60 80
Index
plot(divusa$military)
57
80
divusa$military
60
40
20
0
0 20 40 60 80
Index
##Conjunto de densidades
plot(density(divusa$year))
58
density.default(x = divusa$year)
0.012
0.008
Density
0.004
0.000
N = 77 Bandwidth = 8.446
plot(density(divusa$divorce))
59
density.default(x = divusa$divorce)
0.08
0.06
Density
0.04
0.02
0.00
0 5 10 15 20 25 30
N = 77 Bandwidth = 2.14
plot(density(divusa$unemployed))
60
density.default(x = divusa$unemployed)
0.15
0.10
Density
0.05
0.00
0 5 10 15 20 25
N = 77 Bandwidth = 0.9297
plot(density(divusa$femlab))
61
density.default(x = divusa$femlab)
0.030
0.020
Density
0.010
0.000
10 20 30 40 50 60 70
N = 77 Bandwidth = 4.442
plot(density(divusa$marriage))
62
density.default(x = divusa$marriage)
0.030
0.020
Density
0.010
0.000
40 60 80 100 120
N = 77 Bandwidth = 4.955
plot(density(divusa$birth))
63
density.default(x = divusa$birth)
0.020
0.015
Density
0.010
0.005
0.000
N = 77 Bandwidth = 7.369
plot(density(divusa$military))
64
density.default(x = divusa$military)
0.04
Density
0.02
0.00
0 20 40 60 80
N = 77 Bandwidth = 3.042
65
1500
1000
500
0
barplot(sort(divusa$divorce))
66
20
15
10
5
0
barplot(sort(divusa$unemployed))
67
20
15
10
5
0
barplot(sort(divusa$femlab))
68
50
40
30
20
10
0
barplot(sort(divusa$marriage))
69
100
80
60
40
20
0
barplot(sort(divusa$birth))
70
100 120
80
60
40
20
0
barplot(sort(divusa$military))
71
80
60
40
20
0
# Simple linear regression of divorce on unemployed. Defining it here keeps
# abline() below from drawing a model left over from an earlier exercise.
linear1<-lm(divusa$divorce~divusa$unemployed)
coef(linear1)
## (Intercept) divusa$unemployed
## 14.954236 -0.234974
plot(divusa$divorce~divusa$unemployed)
abline(linear1,col=2)
72
20
divusa$divorce
15
10
5 10 15 20 25
divusa$unemployed
linear2<-lm(divusa$divorce~divusa$femlab)
coef(linear2)
## (Intercept) divusa$femlab
## -3.6552722 0.4386697
plot(divusa$divorce~divusa$femlab)
abline(linear2,col=3)
73
20
divusa$divorce
15
10
30 40 50 60
divusa$femlab
linear3<-lm(divusa$divorce~divusa$birth)
coef(linear3)
## (Intercept) divusa$birth
## 31.905774 -0.209667
plot(divusa$divorce~divusa$birth)
abline(linear3,col=4)
74
20
divusa$divorce
15
10
divusa$birth
# Simple linear regression of divorce on military. Inspect and draw this fit
# (linear4); the original referenced linear5, a model of the prostate data.
linear4<-lm(divusa$divorce~divusa$military)
coef(linear4)
# NOTE(review): the coefficients previously pasted here belonged to the
# prostate pgg45 model (linear5); re-run the chunk to regenerate the output.
plot(divusa$divorce~divusa$military)
abline(linear4,col=5)
75
20
divusa$divorce
15
10
0 20 40 60 80
divusa$military
Exercício 3
library(faraway)
data(prostate)
# Fit nested linear models for lpsa, adding one predictor at a time, and
# collect R^2 and the residual standard error (sigma) of each fit.
# Predictors are listed in the order they enter the model.
preditores <- c("lcavol", "lweight", "svi", "lbph", "age", "lcp", "pgg45",
                "gleason")
n_modelos <- length(preditores)
r2_por_modelo <- numeric(n_modelos)
sigma_por_modelo <- numeric(n_modelos)
for (k in seq_len(n_modelos)) {
  # reformulate() builds the formula lpsa ~ <first k predictors>.
  lreg <- lm(reformulate(preditores[seq_len(k)], response = "lpsa"),
             data = prostate)
  somadelmreg <- summary(lreg)
  print(paste0("R2: ", somadelmreg$r.squared))
  print(paste0("Erro resíduo padrão: ", somadelmreg$sigma))
  r2_por_modelo[k] <- somadelmreg$r.squared
  sigma_por_modelo[k] <- somadelmreg$sigma
}
# As in the original script, the trend vectors start at the two-predictor
# model: the lcavol-only fit is printed but not stored.
# NOTE(review): drop the [-1] if the trend plots should include that baseline.
r2conjunto <- r2_por_modelo[-1]
erroresiduopadraoconjunto <- sigma_por_modelo[-1]
plot(r2conjunto,type="b",main="Tendência de R ao quadrado",ylab = "R ao quadrado")
78
Tendência de R ao quadrado
0.65
R ao quadrado
0.63
0.61
0.59
1 2 3 4 5 6 7
Index
79
Tendência do erro residual padrão
0.75
0.74
Erro residual padrão
0.73
0.72
0.71
1 2 3 4 5 6 7
Index
Exercício 4
# Returns (sqrt(1 + 8 * x) - 1) / 2, i.e. the larger root y of
# y^2 + y - 2 * x = 0. Works element-wise on numeric vectors.
# The script below applies it to uniform random draws.
f <- function(x) {
  raiz <- sqrt(1 + 8 * x)
  (raiz - 1) / 2
}
# Draw 1000 uniform(0, 1) values and transform them with f in one vectorised
# call. This consumes the random stream in the same order as drawing one value
# at a time, without re-copying the vector on every append.
vetor <- f(runif(1000))
hist(vetor)
80
Histogram of vetor
150
100
Frequency
50
0
vetor
plot(density(vetor))
81
density.default(x = vetor)
0.0 0.2 0.4 0.6 0.8 1.0 1.2
Density
82