Documente Academic
Documente Profesional
Documente Cultură
# Run 10000 weight-update iterations. X, Y, W_1, W_2, scalar, cost_hist,
# sigmoid(), sigmoidprime() and cost() must already exist in the calling
# environment; they are not defined in this section.
for (i in seq_len(10000)) {
  # Forward pass: X -> (W_1, sigmoid) -> A_2 -> (W_2, sigmoid) -> Y_hat.
  Z_2 <- X %*% W_1
  A_2 <- sigmoid(Z_2)
  Z_3 <- A_2 %*% W_2
  Y_hat <- sigmoid(Z_3)

  # Store this iteration's cost so it can be inspected after the loop.
  cost_hist[i] <- cost(Y, Y_hat)

  # Backward pass. sigmoidprime() is presumably the derivative of sigmoid()
  # (verify against its definition).
  delta_3 <- -(Y - Y_hat) * sigmoidprime(Z_3)
  djdw2 <- t(A_2) %*% delta_3
  # `%*%` binds tighter than `*`: the matrix product is formed first and is
  # then scaled element-wise by sigmoidprime(Z_2).
  delta_2 <- (delta_3 %*% t(W_2)) * sigmoidprime(Z_2)
  djdw1 <- t(X) %*% delta_2

  # Both gradients were computed from the pre-update weights above, so the
  # two updates are independent of each other.
  W_2 <- W_2 - scalar * djdw2
  W_1 <- W_1 - scalar * djdw1
}
W_1
##           [,1]      [,2]       [,3]
## [1,]  2.018745 -1.288067  2.1068752
## [2,] -0.510094 -1.001957 -0.7276968
W_2
##           [,1]
## [1,]  1.677602
## [2,] -3.618915
1
## [3,]  1.979281
Y_hat
##           [,1]
## [1,] 0.7500001
## [2,] 0.8202053
## [3,] 0.9296046
Y
##      [,1]
## [1,] 0.75
## [2,] 0.82
## [3,] 0.93
# Evaluate cost() on the targets and the final predictions; at top level the
# result is auto-printed.
cost(Y, Y_hat)
## [1] 9.926357e-08
cost_hist
# Draw the recorded cost values against their index as a line.
plot(cost_hist, type = "l")
2000
4000
6000
Index
8000
10000
8
12
16
log(cost_hist)
# Same line plot, but of the natural log of the recorded cost values.
plot(log(cost_hist), type = "l")
2000
4000
6000
8000
Index
10000
## [1]  2.34134355 -1.43848624  1.44822475  0.89619914  1.82193939 -0.14279366
## [7]  0.14810563  1.71923317 -0.01690314
##
## $value
## [1] 0.001226227
##
## $counts
## function gradient
##       47       45
##
## $convergence
## [1] 0
##
## $message
## NULL