# Per-layer training parameters. Each [section] names a layer and holds
# key=value settings for it, one per line.
# NOTE(review): comma-separated values presumably give one value per input
# of that layer -- confirm against the matching layer definition file.
# Training history notes are kept at the bottom of this file.

[conv1a]
epsW=0.0001
epsB=0.002
momW=0.9
momB=0.9
wc=0.0005
wball=0.00

[conv1b]
epsW=0.0001
epsB=0.002
momW=0.9
momB=0.9
wc=0.0005
wball=0.00

[conv2a]
epsW=0.0001,0.0001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0.00,0.00

[conv2b]
epsW=0.0001,0.0001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0.00,0.00

[conv3a]
epsW=0.0001,0.0001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

[conv3b]
epsW=0.0001,0.0001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

[conv4a]
epsW=0.0001
epsB=0.002
momW=0.9
momB=0.9
wc=0.0005
wball=0

[conv4b]
epsW=0.0001
epsB=0.002
momW=0.9
momB=0.9
wc=0.0005
wball=0

[conv5a]
epsW=0.0001
epsB=0.002
momW=0.9
momB=0.9
wc=0.0005
wball=0

[conv5b]
epsW=0.0001
epsB=0.002
momW=0.9
momB=0.9
wc=0.0005
wball=0

[conv6a]
epsW=0.0001,0.0001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

[conv6b]
epsW=0.0001,0.0001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

[fc2048a]
epsW=0.0001,0.0001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

[fc2048b]
epsW=0.0001,0.0001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

[fc2048ba]
epsW=0.0001,0.0001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

[fc2048bb]
epsW=0.0001,0.0001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

[fc1000]
epsW=0.0001,0.0001
epsB=0.002
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

[logprob]
coeff=1
topk=5

[hs1a]
enable=true

[hs2a]
enable=true

[hs1b]
enable=true

[hs2b]
enable=true

[rnorm1a]
scale=0.0001
pow=0.75
minDiv=2

[rnorm1b]
scale=0.0001
pow=0.75
minDiv=2

[rnorm2a]
scale=0.0001
pow=0.75
minDiv=2

[rnorm2b]
scale=0.0001
pow=0.75
minDiv=2

[cnorm2a]
scale=0.001
pow=0.75

[cnorm2b]
scale=0.001
pow=0.75

# this is like 141, but trained on half of 2009 imgnet, to be comparable to google's results
# logs/layers-141-2009-half.log
# /nobackup/kriz/tmp/ConvNet__2012-09-09_00.26.31
# on guppy9
# epoch 6.2600: set epsw to 0.001 from 0.01
# epoch 13.3361: set epsw to 0.0001 from 0.001
# epoch 18.2396: set epsw to 0.00001 from 0.0001 on conv1,conv2
# set color noise to 0 from 0.1
# epoch 21.1949: set epsw to 0 from 0.00001 on conv1,conv2
# epoch 25.3718: set epsw to 0.00001 from 0.0001
# epoch 28.3271: killed
# ok test error rate is a bit worse than 131, restarting with epsw 0.001, color noise 0.1
# epoch 44.183: set epsw to 0.0001 from 0.001
# epoch 56: eek, it started getting worse on validation :/

# 141 notes:
# this is like #137 but with conv6, also communication in conv6
# /nobackup/kriz/tmp/ConvNet__2012-09-03_16.27.48
# logs/layers-141.log
# epoch 23: set epsw to 0.001 from 0.01
# epoch 48: set epsw to 0.0001 from 0.001
# epoch 60: this seems overfitty....killing
# but will use these weights to initialize a net on 2009... why the hell not?