# Per-layer parameters: one [section] per layer name, one key=value per line.
# NOTE(review): epsW/epsB, momW/momB and wc look like weight/bias learning
# rates, momenta and weight decay respectively -- confirm against the
# framework that reads this file.
# NOTE(review): comma-separated values (e.g. epsW=0.01,0.01) presumably give
# one value per input of that layer -- confirm against the layer definition file.

[conv1a]
epsW=0.01
epsB=0.02
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=dexp[500,0,4]
schedB=dexp[10,0,2]

[conv1b]
epsW=0.01
epsB=0.02
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=dexp[500,0,4]
schedB=dexp[10,0,2]

[conv2a]
epsW=0.01
epsB=0.02
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=dexp[500,0,4]
schedB=dexp[10,0,2]

[conv2b]
epsW=0.01
epsB=0.02
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=dexp[500,0,4]
schedB=dexp[10,0,2]

[conv3a]
epsW=0.01,0.01
epsB=0.02
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0
schedW=dexp[500,0,4]
schedB=dexp[10,0,2]

[conv3b]
epsW=0.01,0.01
epsB=0.02
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0
schedW=dexp[500,0,4]
schedB=dexp[10,0,2]

[conv4a]
epsW=0.01
epsB=0.02
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=dexp[500,0,4]
schedB=dexp[10,0,2]

[conv4b]
epsW=0.01
epsB=0.02
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=dexp[500,0,4]
schedB=dexp[10,0,2]

[conv5a]
epsW=0.01
epsB=0.02
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=dexp[500,0,4]
schedB=dexp[10,0,2]

[conv5b]
epsW=0.01
epsB=0.02
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=dexp[500,0,4]
schedB=dexp[10,0,2]

[fc2048a]
epsW=0.01,0.01
epsB=0.02
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0
schedW=dexp[500,0,4]
schedB=dexp[10,0,2]

[fc2048b]
epsW=0.01,0.01
epsB=0.02
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0
schedW=dexp[500,0,4]
schedB=dexp[10,0,2]

[fc2048ba]
epsW=0.01,0.01
epsB=0.02
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0
schedW=dexp[500,0,4]
schedB=dexp[10,0,2]

[fc2048bb]
epsW=0.01,0.01
epsB=0.02
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0
schedW=dexp[500,0,4]
schedB=dexp[10,0,2]

[fc1000]
epsW=0.01,0.01
epsB=0.02
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0
schedW=dexp[500,0,4]
schedB=dexp[10,0,2]

[logprob]
coeff=1
topk=5

[hs1a]
enable=true

[hs2a]
enable=true

[hs1b]
enable=true

[hs2b]
enable=true

[rnorm1a]
scale=0.0001
pow=0.75
minDiv=2

[rnorm1b]
scale=0.0001
pow=0.75
minDiv=2

[rnorm2a]
scale=0.0001
pow=0.75
minDiv=2

[rnorm2b]
scale=0.0001
pow=0.75
minDiv=2
[cnorm2a]
scale=0.001
pow=0.75

[cnorm2b]
scale=0.001
pow=0.75

# Run notes. Each note is a full-line comment so that no parser can fold it
# into the preceding value.

# this is like #159 (so uses same def file: 153) but with learning rate decaying to 0.00002
# on guppy9
# /nobackup/kriz/tmp/ConvNet__2013-01-07_04.03.15
# logs/layers-169.log
# epoch 60: set color noise to 0 from 0.1
# epoch 73: set conv1 epsw to 0 from 0.01
# logprob: 1.841218, 0.425298, 0.195489
# multiview logprob: 1.735123, 0.405960, 0.181120

# now let's run this for 80 epochs instead of 95:
# on guppy9
# /nobackup/kriz/tmp/ConvNet__2013-01-13_15.31.51
# logs/layers-169-80.log
# epoch 46: paused for experiments with dropout in conv layers
# epoch 53: set color noise to 0 from 0.1
# epoch 74: set epsw to 0 from 0.01 on conv1
# epoch 80: killed :(
# logprob: 1.866277, 0.429784, 0.200178