# Per-section parameter values: one [section] per named entry, one key=value per line.
# Comma-separated values are kept exactly as given.
# NOTE(review): conv1a/conv1b use the key "wcnorm" while conv2a/conv2b use
# "wcNormMin"/"wcNormMax" - confirm the consuming parser accepts both spellings.

# conv1a .. conv5b
[conv1a]
epsW=0.001
epsB=0.002
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
wcnorm=0.00

[conv1b]
epsW=0.001
epsB=0.002
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
wcnorm=0.00

[conv2a]
epsW=0.001,0.001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0.00,0.00
wcNormMin=0.001,0
wcNormMax=0.002,0

[conv2b]
epsW=0.001,0.001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0.00,0.00
wcNormMin=0.001,0
wcNormMax=0.002,0

[conv3a]
epsW=0.001,0.001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

[conv3b]
epsW=0.001,0.001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

[conv4a]
epsW=0.001
epsB=0.002
momW=0.9
momB=0.9
wc=0.0005
wball=0

[conv4b]
epsW=0.001
epsB=0.002
momW=0.9
momB=0.9
wc=0.0005
wball=0

[conv5a]
epsW=0.001
epsB=0.002
momW=0.9
momB=0.9
wc=0.0005
wball=0

[conv5b]
epsW=0.001
epsB=0.002
momW=0.9
momB=0.9
wc=0.0005
wball=0

# fc2048a .. fc1000
[fc2048a]
epsW=0.001,0.001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

[fc2048b]
epsW=0.001,0.001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

[fc2048ba]
epsW=0.001,0.001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

[fc2048bb]
epsW=0.001,0.001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

[fc2048ca]
epsW=0.001,0.001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

[fc2048cb]
epsW=0.001,0.001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

[fc1000]
epsW=0.001,0.001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

# logprob
[logprob]
coeff=1
topk=5

# hs1a .. hs3b
[hs1a]
enable=true

[hs2a]
enable=true

[hs3a]
enable=true

[hs1b]
enable=true

[hs2b]
enable=true

[hs3b]
enable=true

# rnorm1a .. rnorm2b
[rnorm1a]
scale=0.0001
pow=0.75

[rnorm1b]
scale=0.0001
pow=0.75

[rnorm2a]
scale=0.0001
pow=0.75

[rnorm2b]
scale=0.0001
pow=0.75

# this is like #101 but uses wcnorm in conv2 and also has 3 fc layers.
# It's also like #109 but uses wider fc layers with dropout in all, because #109 overfit.
# on guppy9
# logs/layers-111.log
# /nobackup/kriz/tmp/ConvNet__2012-07-12_23.59.48
# epoch 19: set epsW to 0.001 from 0.01
# epoch 42: this is quite a bit worse, and in an underfitting way, so I'm starting #104, which will be like this but the fc layers will be 3072 each instead of 2048