450 lines
7.6 KiB
INI
450 lines
7.6 KiB
INI
# conv1a: per-layer settings; every value is identical to conv1b, conv1c and conv1d.
# NOTE(review): epsW/epsB, momW/momB and wc presumably mean learning rate, momentum and
# weight decay (W = weights, B = biases) - confirm against the trainer that reads this file.
[conv1a]
|
|
epsW=0.02
|
|
epsB=0.04
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
wball=0.00
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv1b: same keys and values as conv1a.
# NOTE(review): the a-d suffixes presumably denote parallel copies of the layer (e.g. one per GPU) - confirm.
[conv1b]
|
|
epsW=0.02
|
|
epsB=0.04
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
wball=0.00
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv1c: same keys and values as conv1a.
# NOTE(review): the a-d suffixes presumably denote parallel copies of the layer (e.g. one per GPU) - confirm.
[conv1c]
|
|
epsW=0.02
|
|
epsB=0.04
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
wball=0.00
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv1d: same keys and values as conv1a.
# NOTE(review): the a-d suffixes presumably denote parallel copies of the layer (e.g. one per GPU) - confirm.
[conv1d]
|
|
epsW=0.02
|
|
epsB=0.04
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
wball=0.00
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv2a: per-layer settings; every value is identical to conv2b, conv2c and conv2d.
# NOTE(review): epsW/epsB, momW/momB and wc presumably mean learning rate, momentum and
# weight decay (W = weights, B = biases) - confirm against the trainer that reads this file.
[conv2a]
|
|
epsW=0.02
|
|
epsB=0.04
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
wball=0.00
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv2b: same keys and values as conv2a.
# NOTE(review): the a-d suffixes presumably denote parallel copies of the layer (e.g. one per GPU) - confirm.
[conv2b]
|
|
epsW=0.02
|
|
epsB=0.04
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
wball=0.00
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv2c: same keys and values as conv2a.
# NOTE(review): the a-d suffixes presumably denote parallel copies of the layer (e.g. one per GPU) - confirm.
[conv2c]
|
|
epsW=0.02
|
|
epsB=0.04
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
wball=0.00
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv2d: same keys and values as conv2a.
# NOTE(review): the a-d suffixes presumably denote parallel copies of the layer (e.g. one per GPU) - confirm.
[conv2d]
|
|
epsW=0.02
|
|
epsB=0.04
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
wball=0.00
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv3a: per-layer settings; every value is identical to conv3b, conv3c and conv3d.
# epsW, momW, wc and wball each list three comma-separated values; epsB and momB take one.
# NOTE(review): presumably one list entry per input of this layer - confirm against the layer definition file.
[conv3a]
|
|
epsW=0.02,0.02,0.02
|
|
epsB=0.04
|
|
momW=0.9,0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005,0.0005
|
|
wball=0,0,0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv3b: same keys and values as conv3a (three-entry lists for epsW, momW, wc, wball).
# NOTE(review): presumably one list entry per input of this layer - confirm against the layer definition file.
[conv3b]
|
|
epsW=0.02,0.02,0.02
|
|
epsB=0.04
|
|
momW=0.9,0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005,0.0005
|
|
wball=0,0,0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv3c: same keys and values as conv3a (three-entry lists for epsW, momW, wc, wball).
# NOTE(review): presumably one list entry per input of this layer - confirm against the layer definition file.
[conv3c]
|
|
epsW=0.02,0.02,0.02
|
|
epsB=0.04
|
|
momW=0.9,0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005,0.0005
|
|
wball=0,0,0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv3d: same keys and values as conv3a (three-entry lists for epsW, momW, wc, wball).
# NOTE(review): presumably one list entry per input of this layer - confirm against the layer definition file.
[conv3d]
|
|
epsW=0.02,0.02,0.02
|
|
epsB=0.04
|
|
momW=0.9,0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005,0.0005
|
|
wball=0,0,0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv4a: per-layer settings; every value is identical to conv4b, conv4c and conv4d.
# NOTE(review): epsW/epsB, momW/momB and wc presumably mean learning rate, momentum and
# weight decay (W = weights, B = biases) - confirm against the trainer that reads this file.
[conv4a]
|
|
epsW=0.02
|
|
epsB=0.04
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
wball=0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv4b: same keys and values as conv4a.
# NOTE(review): the a-d suffixes presumably denote parallel copies of the layer (e.g. one per GPU) - confirm.
[conv4b]
|
|
epsW=0.02
|
|
epsB=0.04
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
wball=0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv4c: same keys and values as conv4a.
# NOTE(review): the a-d suffixes presumably denote parallel copies of the layer (e.g. one per GPU) - confirm.
[conv4c]
|
|
epsW=0.02
|
|
epsB=0.04
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
wball=0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv4d: same keys and values as conv4a.
# NOTE(review): the a-d suffixes presumably denote parallel copies of the layer (e.g. one per GPU) - confirm.
[conv4d]
|
|
epsW=0.02
|
|
epsB=0.04
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
wball=0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv5a: per-layer settings; every value is identical to conv5b, conv5c and conv5d.
# NOTE(review): epsW/epsB, momW/momB and wc presumably mean learning rate, momentum and
# weight decay (W = weights, B = biases) - confirm against the trainer that reads this file.
[conv5a]
|
|
epsW=0.02
|
|
epsB=0.04
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
wball=0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv5b: same keys and values as conv5a.
# NOTE(review): the a-d suffixes presumably denote parallel copies of the layer (e.g. one per GPU) - confirm.
[conv5b]
|
|
epsW=0.02
|
|
epsB=0.04
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
wball=0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv5c: same keys and values as conv5a.
# NOTE(review): the a-d suffixes presumably denote parallel copies of the layer (e.g. one per GPU) - confirm.
[conv5c]
|
|
epsW=0.02
|
|
epsB=0.04
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
wball=0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv5d: same keys and values as conv5a.
# NOTE(review): the a-d suffixes presumably denote parallel copies of the layer (e.g. one per GPU) - confirm.
[conv5d]
|
|
epsW=0.02
|
|
epsB=0.04
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
wball=0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv6a: per-layer settings; every value is identical to conv6b, conv6c and conv6d.
# epsW, momW, wc and wball each list three comma-separated values; epsB and momB take one.
# NOTE(review): presumably one list entry per input of this layer - confirm against the layer definition file.
[conv6a]
|
|
epsW=0.02,0.02,0.02
|
|
epsB=0.04
|
|
momW=0.9,0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005,0.0005
|
|
wball=0,0,0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv6b: same keys and values as conv6a (three-entry lists for epsW, momW, wc, wball).
# NOTE(review): presumably one list entry per input of this layer - confirm against the layer definition file.
[conv6b]
|
|
epsW=0.02,0.02,0.02
|
|
epsB=0.04
|
|
momW=0.9,0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005,0.0005
|
|
wball=0,0,0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv6c: same keys and values as conv6a (three-entry lists for epsW, momW, wc, wball).
# NOTE(review): presumably one list entry per input of this layer - confirm against the layer definition file.
[conv6c]
|
|
epsW=0.02,0.02,0.02
|
|
epsB=0.04
|
|
momW=0.9,0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005,0.0005
|
|
wball=0,0,0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# conv6d: same keys and values as conv6a (three-entry lists for epsW, momW, wc, wball).
# NOTE(review): presumably one list entry per input of this layer - confirm against the layer definition file.
[conv6d]
|
|
epsW=0.02,0.02,0.02
|
|
epsB=0.04
|
|
momW=0.9,0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005,0.0005
|
|
wball=0,0,0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# fc1024a: per-layer settings; every value is identical to fc1024b, fc1024c and fc1024d.
# epsW, momW, wc and wball each list three comma-separated values; epsB and momB take one.
# NOTE(review): presumably one list entry per input of this layer - confirm against the layer definition file.
[fc1024a]
|
|
epsW=0.02,0.02,0.02
|
|
epsB=0.04
|
|
momW=0.9,0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005,0.0005
|
|
wball=0,0,0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# fc1024b: same keys and values as fc1024a (three-entry lists for epsW, momW, wc, wball).
# NOTE(review): presumably one list entry per input of this layer - confirm against the layer definition file.
[fc1024b]
|
|
epsW=0.02,0.02,0.02
|
|
epsB=0.04
|
|
momW=0.9,0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005,0.0005
|
|
wball=0,0,0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# fc1024c: same keys and values as fc1024a (three-entry lists for epsW, momW, wc, wball).
# NOTE(review): presumably one list entry per input of this layer - confirm against the layer definition file.
[fc1024c]
|
|
epsW=0.02,0.02,0.02
|
|
epsB=0.04
|
|
momW=0.9,0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005,0.0005
|
|
wball=0,0,0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# fc1024d: same keys and values as fc1024a (three-entry lists for epsW, momW, wc, wball).
# NOTE(review): presumably one list entry per input of this layer - confirm against the layer definition file.
[fc1024d]
|
|
epsW=0.02,0.02,0.02
|
|
epsB=0.04
|
|
momW=0.9,0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005,0.0005
|
|
wball=0,0,0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# fc1024ba: per-layer settings; every value is identical to fc1024bb, fc1024bc and fc1024bd.
# epsW, momW, wc and wball each list three comma-separated values; epsB and momB take one.
# NOTE(review): presumably a second group of 1024-unit layers, one list entry per input - confirm against the layer definition file.
[fc1024ba]
|
|
epsW=0.02,0.02,0.02
|
|
epsB=0.04
|
|
momW=0.9,0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005,0.0005
|
|
wball=0,0,0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# fc1024bb: same keys and values as fc1024ba (three-entry lists for epsW, momW, wc, wball).
# NOTE(review): presumably one list entry per input of this layer - confirm against the layer definition file.
[fc1024bb]
|
|
epsW=0.02,0.02,0.02
|
|
epsB=0.04
|
|
momW=0.9,0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005,0.0005
|
|
wball=0,0,0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# fc1024bc: same keys and values as fc1024ba (three-entry lists for epsW, momW, wc, wball).
# NOTE(review): presumably one list entry per input of this layer - confirm against the layer definition file.
[fc1024bc]
|
|
epsW=0.02,0.02,0.02
|
|
epsB=0.04
|
|
momW=0.9,0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005,0.0005
|
|
wball=0,0,0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# fc1024bd: same keys and values as fc1024ba (three-entry lists for epsW, momW, wc, wball).
# NOTE(review): presumably one list entry per input of this layer - confirm against the layer definition file.
[fc1024bd]
|
|
epsW=0.02,0.02,0.02
|
|
epsB=0.04
|
|
momW=0.9,0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005,0.0005
|
|
wball=0,0,0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# fc1000a: per-layer settings; every value is identical to fc1000b, fc1000c and fc1000d.
# epsW, momW, wc and wball each list four comma-separated values; epsB and momB take one.
# NOTE(review): presumably one list entry per input of this layer - confirm against the layer definition file.
[fc1000a]
|
|
epsW=0.02,0.02,0.02,0.02
|
|
epsB=0.04
|
|
momW=0.9,0.9,0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005,0.0005,0.0005
|
|
wball=0,0,0,0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# fc1000b: same keys and values as fc1000a (four-entry lists for epsW, momW, wc, wball).
# NOTE(review): presumably one list entry per input of this layer - confirm against the layer definition file.
[fc1000b]
|
|
epsW=0.02,0.02,0.02,0.02
|
|
epsB=0.04
|
|
momW=0.9,0.9,0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005,0.0005,0.0005
|
|
wball=0,0,0,0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# fc1000c: same keys and values as fc1000a (four-entry lists for epsW, momW, wc, wball).
# NOTE(review): presumably one list entry per input of this layer - confirm against the layer definition file.
[fc1000c]
|
|
epsW=0.02,0.02,0.02,0.02
|
|
epsB=0.04
|
|
momW=0.9,0.9,0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005,0.0005,0.0005
|
|
wball=0,0,0,0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# fc1000d: same keys and values as fc1000a (four-entry lists for epsW, momW, wc, wball).
# NOTE(review): presumably one list entry per input of this layer - confirm against the layer definition file.
[fc1000d]
|
|
epsW=0.02,0.02,0.02,0.02
|
|
epsB=0.04
|
|
momW=0.9,0.9,0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005,0.0005,0.0005
|
|
wball=0,0,0,0
|
|
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
|
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
|
|
|
# logprob: the only section with coeff and topk keys, and the only one without an a-d suffix.
# NOTE(review): presumably the cost/objective layer, with topk=5 selecting top-5 error reporting - confirm.
[logprob]
|
|
coeff=1
|
|
topk=5
|
|
|
|
# hs1a: single boolean flag; all hs1*/hs2* sections set enable=true.
# NOTE(review): layer type is not visible in this file - confirm what "enable" switches on.
[hs1a]
|
|
enable=true
|
|
|
|
# hs1b: single boolean flag, same as hs1a.
# NOTE(review): layer type is not visible in this file - confirm what "enable" switches on.
[hs1b]
|
|
enable=true
|
|
|
|
# hs1c: single boolean flag, same as hs1a.
# NOTE(review): layer type is not visible in this file - confirm what "enable" switches on.
[hs1c]
|
|
enable=true
|
|
|
|
# hs1d: single boolean flag, same as hs1a.
# NOTE(review): layer type is not visible in this file - confirm what "enable" switches on.
[hs1d]
|
|
enable=true
|
|
|
|
# hs2a: single boolean flag; all hs1*/hs2* sections set enable=true.
# NOTE(review): layer type is not visible in this file - confirm what "enable" switches on.
[hs2a]
|
|
enable=true
|
|
|
|
# hs2b: single boolean flag, same as hs2a.
# NOTE(review): layer type is not visible in this file - confirm what "enable" switches on.
[hs2b]
|
|
enable=true
|
|
|
|
# hs2c: single boolean flag, same as hs2a.
# NOTE(review): layer type is not visible in this file - confirm what "enable" switches on.
[hs2c]
|
|
enable=true
|
|
|
|
# hs2d: single boolean flag, same as hs2a.
# NOTE(review): layer type is not visible in this file - confirm what "enable" switches on.
[hs2d]
|
|
enable=true
|
|
|
|
# rnorm1a: scale, pow and minDiv; all rnorm1*/rnorm2* sections use these same three values.
# NOTE(review): name suggests a response-normalization layer - confirm how scale/pow/minDiv enter its formula.
[rnorm1a]
|
|
scale=0.0001
|
|
pow=0.75
|
|
minDiv=2
|
|
|
|
# rnorm1b: same scale, pow and minDiv values as rnorm1a.
# NOTE(review): name suggests a response-normalization layer - confirm how scale/pow/minDiv enter its formula.
[rnorm1b]
|
|
scale=0.0001
|
|
pow=0.75
|
|
minDiv=2
|
|
|
|
# rnorm1c: same scale, pow and minDiv values as rnorm1a.
# NOTE(review): name suggests a response-normalization layer - confirm how scale/pow/minDiv enter its formula.
[rnorm1c]
|
|
scale=0.0001
|
|
pow=0.75
|
|
minDiv=2
|
|
|
|
# rnorm1d: same scale, pow and minDiv values as rnorm1a.
# NOTE(review): name suggests a response-normalization layer - confirm how scale/pow/minDiv enter its formula.
[rnorm1d]
|
|
scale=0.0001
|
|
pow=0.75
|
|
minDiv=2
|
|
|
|
# rnorm2a: scale, pow and minDiv; all rnorm1*/rnorm2* sections use these same three values.
# NOTE(review): name suggests a response-normalization layer - confirm how scale/pow/minDiv enter its formula.
[rnorm2a]
|
|
scale=0.0001
|
|
pow=0.75
|
|
minDiv=2
|
|
|
|
# rnorm2b: same scale, pow and minDiv values as rnorm2a.
# NOTE(review): name suggests a response-normalization layer - confirm how scale/pow/minDiv enter its formula.
[rnorm2b]
|
|
scale=0.0001
|
|
pow=0.75
|
|
minDiv=2
|
|
|
|
# rnorm2c: same scale, pow and minDiv values as rnorm2a.
# NOTE(review): name suggests a response-normalization layer - confirm how scale/pow/minDiv enter its formula.
[rnorm2c]
|
|
scale=0.0001
|
|
pow=0.75
|
|
minDiv=2
|
|
|
|
# rnorm2d: same scale, pow and minDiv values as rnorm2a.
# NOTE(review): name suggests a response-normalization layer - confirm how scale/pow/minDiv enter its formula.
[rnorm2d]
|
|
scale=0.0001
|
|
pow=0.75
|
|
minDiv=2
|
|
|
|
# cnorm2a: scale and pow only (no minDiv); scale is 0.001 here versus 0.0001 in the rnorm* sections.
# NOTE(review): name suggests a contrast-normalization layer - confirm against the layer definition file.
[cnorm2a]
|
|
scale=0.001
|
|
pow=0.75
|
|
|
|
# cnorm2b: same scale and pow values as cnorm2a (no minDiv key).
# NOTE(review): name suggests a contrast-normalization layer - confirm against the layer definition file.
[cnorm2b]
|
|
scale=0.001
|
|
pow=0.75
|
|
|
|
# cnorm2c: same scale and pow values as cnorm2a (no minDiv key).
# NOTE(review): name suggests a contrast-normalization layer - confirm against the layer definition file.
[cnorm2c]
|
|
scale=0.001
|
|
pow=0.75
|
|
|
|
# cnorm2d: same scale and pow values as cnorm2a (no minDiv key).
# NOTE(review): name suggests a contrast-normalization layer - confirm against the layer definition file.
[cnorm2d]
|
|
scale=0.001
|
|
pow=0.75
|
|
|
|
# this is like 170-4gpu but with a 6th conv layer and also 48 low-level filters
|
|
# on krunch
|
|
# logs/layers-183-dexp.log
|
|
# /nobackup/kriz/tmp/ConvNet__2013-03-03_23.14.01
|
|
# killed in favor of 184
|
|
# this is obviously the wrong net to run -- it has way too many params.
|