# Per-layer training parameters: one [section] per layer, one key=value per line.
# Comma-separated values appear on the weight keys (epsW, momW, wc, wball) of
# some layers; the number of entries differs per layer group (1, 3 or 4).
# NOTE(review): key meanings (epsW/epsB = weight/bias learning rate,
# momW/momB = momentum, wc = weight decay, schedW/schedB = learning-rate
# schedule) are assumed from the cuda-convnet layer-parameter convention;
# confirm against the trainer that consumes this file.

# --- conv1*: single-valued weight parameters ---

[conv1a]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[conv1b]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[conv1c]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[conv1d]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

# --- conv2*: single-valued weight parameters ---

[conv2a]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[conv2b]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[conv2c]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[conv2d]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

# --- conv3*: three comma-separated entries per weight key ---

[conv3a]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[conv3b]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[conv3c]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[conv3d]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

# --- conv4*: single-valued weight parameters ---

[conv4a]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[conv4b]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[conv4c]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[conv4d]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

# --- conv5*: single-valued weight parameters ---

[conv5a]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[conv5b]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[conv5c]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[conv5d]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

# --- fc1024*: three comma-separated entries per weight key ---

[fc1024a]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[fc1024b]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[fc1024c]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[fc1024d]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

# --- fc1024b*: three comma-separated entries per weight key ---

[fc1024ba]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[fc1024bb]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[fc1024bc]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[fc1024bd]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

# --- fc1000*: four comma-separated entries per weight key ---

[fc1000a]
epsW=0.04,0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005,0.0005
wball=0,0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[fc1000b]
epsW=0.04,0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005,0.0005
wball=0,0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[fc1000c]
epsW=0.04,0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005,0.0005
wball=0,0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

[fc1000d]
epsW=0.04,0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005,0.0005
wball=0,0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]

# --- cost layer ---

[logprob]
coeff=1
topk=5

# --- hs1* / hs2* ---

[hs1a]
enable=true

[hs1b]
enable=true

[hs1c]
enable=true

[hs1d]
enable=true

[hs2a]
enable=true

[hs2b]
enable=true

[hs2c]
enable=true

[hs2d]
enable=true

# --- rnorm1* / rnorm2* ---

[rnorm1a]
scale=0.0001
pow=0.75
minDiv=2

[rnorm1b]
scale=0.0001
pow=0.75
minDiv=2

[rnorm1c]
scale=0.0001
pow=0.75
minDiv=2

[rnorm1d]
scale=0.0001
pow=0.75
minDiv=2

[rnorm2a]
scale=0.0001
pow=0.75
minDiv=2

[rnorm2b]
scale=0.0001
pow=0.75
minDiv=2

[rnorm2c]
scale=0.0001
pow=0.75
minDiv=2

[rnorm2d]
scale=0.0001
pow=0.75
minDiv=2

# --- cnorm2* ---

[cnorm2a]
scale=0.001
pow=0.75

[cnorm2b]
scale=0.001
pow=0.75

[cnorm2c]
scale=0.001
pow=0.75

[cnorm2d]
scale=0.001
pow=0.75

# Run notes:
# this is like 170-4gpu but with exp learning rate
# uses config file #153-4gpu
# on krunch
# logs/layers-170-4gpu-exp.log
# /nobackup/kriz/tmp/ConvNet__2013-02-24_23.19.05
# epoch 14: moved to guppy9
# /nobackup/kriz/tmp/ConvNet__2013-02-24_23.19.05
# killed, exp is bad