@@ -111,18 +111,16 @@ plot(m)
111111
112112# # Grid search
113113if (TRUE ) {
114- numlayers <- sample(2 : 5 ,1 )
115114 hyper_params <- list (
116- activation = c(" Rectifier" ),
117- hidden = list (rep(sample(200 : 1000 ,1 ),2 ), rep(sample(100 : 200 ,1 ),3 ), rep(sample(30 : 100 ,1 ),4 )),
118- l1 = c(0 , runif(sample(1 : 3 ),0 ,1e-3 )),
119- l2 = c(0 , runif(sample(1 : 3 ),0 ,1e-3 )),
120- input_dropout_ratio = c(0 ,runif(2 , 0 , 0.1 )),
121- rate = runif(sample(3 : 5 ),0.002 ,0.02 ),
122- rate_annealing = 10 ^ runif(sample(3 : 6 ),1 ,3 )* 1e-8 ,
123- momentum_start = runif(sample(3 : 5 ),0 ,0.5 ),
124- momentum_stable = runif(sample(3 : 5 ),0.5 ,0.999 ),
125- momentum_ramp = runif(sample(3 ),0 ,100 )* 1e6
115+ hidden = list (c(64 ,64 ,64 ),c(128 ,128 ,128 ),c(512 ,512 )),
116+ l1 = c(0 , 1e-5 ),
117+ l2 = c(0 , 1e-5 ),
118+ input_dropout_ratio = c(0 ,0.05 ),
119+ rate = c(0.005 ,0.01 ,0.02 ),
120+ rate_annealing = c(1e-8 ,1e-7 ,1e-6 ),
121+ momentum_start = c(0.25 ,0.5 ,0.75 ),
122+ momentum_stable = c(0.75 ,0.9 ,0.99 ),
123+ momentum_ramp = c(1e6 , 1e7 , 1e8 )
126124 )
127125 hyper_params
128126
@@ -140,7 +138,8 @@ if (TRUE) {
140138 score_validation_samples = 10000 , # # downsample validation set for faster scoring
141139 score_duty_cycle = 0.025 , # # don't score more than 2.5% of the wall time
142140 adaptive_rate = F , # # manually tuned learning rate
143- max_w2 = 10 , # # helps stability for Rectifier
141+ activation = c(" Rectifier" ),
142+ max_w2 = 10 , # # can help improve stability for Rectifier
144143 hyper_params = hyper_params
145144 )
146145}
0 commit comments