Initial commit
This commit is contained in:
commit
9fdd561586
246 changed files with 58283 additions and 0 deletions
450
layers/layer-params-184-4gpu.cfg
Normal file
450
layers/layer-params-184-4gpu.cfg
Normal file
|
@ -0,0 +1,450 @@
|
|||
[conv1a]
|
||||
epsW=0.02
|
||||
epsB=0.04
|
||||
momW=0.9
|
||||
momB=0.9
|
||||
wc=0.0005
|
||||
wball=0.00
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv1b]
|
||||
epsW=0.02
|
||||
epsB=0.04
|
||||
momW=0.9
|
||||
momB=0.9
|
||||
wc=0.0005
|
||||
wball=0.00
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv1c]
|
||||
epsW=0.02
|
||||
epsB=0.04
|
||||
momW=0.9
|
||||
momB=0.9
|
||||
wc=0.0005
|
||||
wball=0.00
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv1d]
|
||||
epsW=0.02
|
||||
epsB=0.04
|
||||
momW=0.9
|
||||
momB=0.9
|
||||
wc=0.0005
|
||||
wball=0.00
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv2a]
|
||||
epsW=0.02
|
||||
epsB=0.04
|
||||
momW=0.9
|
||||
momB=0.9
|
||||
wc=0.0005
|
||||
wball=0.00
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv2b]
|
||||
epsW=0.02
|
||||
epsB=0.04
|
||||
momW=0.9
|
||||
momB=0.9
|
||||
wc=0.0005
|
||||
wball=0.00
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv2c]
|
||||
epsW=0.02
|
||||
epsB=0.04
|
||||
momW=0.9
|
||||
momB=0.9
|
||||
wc=0.0005
|
||||
wball=0.00
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv2d]
|
||||
epsW=0.02
|
||||
epsB=0.04
|
||||
momW=0.9
|
||||
momB=0.9
|
||||
wc=0.0005
|
||||
wball=0.00
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv3a]
|
||||
epsW=0.02,0.02,0.02
|
||||
epsB=0.04
|
||||
momW=0.9,0.9,0.9
|
||||
momB=0.9
|
||||
wc=0.0005,0.0005,0.0005
|
||||
wball=0,0,0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv3b]
|
||||
epsW=0.02,0.02,0.02
|
||||
epsB=0.04
|
||||
momW=0.9,0.9,0.9
|
||||
momB=0.9
|
||||
wc=0.0005,0.0005,0.0005
|
||||
wball=0,0,0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv3c]
|
||||
epsW=0.02,0.02,0.02
|
||||
epsB=0.04
|
||||
momW=0.9,0.9,0.9
|
||||
momB=0.9
|
||||
wc=0.0005,0.0005,0.0005
|
||||
wball=0,0,0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv3d]
|
||||
epsW=0.02,0.02,0.02
|
||||
epsB=0.04
|
||||
momW=0.9,0.9,0.9
|
||||
momB=0.9
|
||||
wc=0.0005,0.0005,0.0005
|
||||
wball=0,0,0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv4a]
|
||||
epsW=0.02
|
||||
epsB=0.04
|
||||
momW=0.9
|
||||
momB=0.9
|
||||
wc=0.0005
|
||||
wball=0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv4b]
|
||||
epsW=0.02
|
||||
epsB=0.04
|
||||
momW=0.9
|
||||
momB=0.9
|
||||
wc=0.0005
|
||||
wball=0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv4c]
|
||||
epsW=0.02
|
||||
epsB=0.04
|
||||
momW=0.9
|
||||
momB=0.9
|
||||
wc=0.0005
|
||||
wball=0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv4d]
|
||||
epsW=0.02
|
||||
epsB=0.04
|
||||
momW=0.9
|
||||
momB=0.9
|
||||
wc=0.0005
|
||||
wball=0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv5a]
|
||||
epsW=0.02
|
||||
epsB=0.04
|
||||
momW=0.9
|
||||
momB=0.9
|
||||
wc=0.0005
|
||||
wball=0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv5b]
|
||||
epsW=0.02
|
||||
epsB=0.04
|
||||
momW=0.9
|
||||
momB=0.9
|
||||
wc=0.0005
|
||||
wball=0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv5c]
|
||||
epsW=0.02
|
||||
epsB=0.04
|
||||
momW=0.9
|
||||
momB=0.9
|
||||
wc=0.0005
|
||||
wball=0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv5d]
|
||||
epsW=0.02
|
||||
epsB=0.04
|
||||
momW=0.9
|
||||
momB=0.9
|
||||
wc=0.0005
|
||||
wball=0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv6a]
|
||||
epsW=0.02,0.02,0.02
|
||||
epsB=0.04
|
||||
momW=0.9,0.9,0.9
|
||||
momB=0.9
|
||||
wc=0.0005,0.0005,0.0005
|
||||
wball=0,0,0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv6b]
|
||||
epsW=0.02,0.02,0.02
|
||||
epsB=0.04
|
||||
momW=0.9,0.9,0.9
|
||||
momB=0.9
|
||||
wc=0.0005,0.0005,0.0005
|
||||
wball=0,0,0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv6c]
|
||||
epsW=0.02,0.02,0.02
|
||||
epsB=0.04
|
||||
momW=0.9,0.9,0.9
|
||||
momB=0.9
|
||||
wc=0.0005,0.0005,0.0005
|
||||
wball=0,0,0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[conv6d]
|
||||
epsW=0.02,0.02,0.02
|
||||
epsB=0.04
|
||||
momW=0.9,0.9,0.9
|
||||
momB=0.9
|
||||
wc=0.0005,0.0005,0.0005
|
||||
wball=0,0,0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[fc1024a]
|
||||
epsW=0.02,0.02,0.02,0.02
|
||||
epsB=0.04
|
||||
momW=0.9,0.9,0.9,0.9
|
||||
momB=0.9
|
||||
wc=0.0005,0.0005,0.0005,0.0005
|
||||
wball=0,0,0,0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[fc1024b]
|
||||
epsW=0.02,0.02,0.02,0.02
|
||||
epsB=0.04
|
||||
momW=0.9,0.9,0.9,0.9
|
||||
momB=0.9
|
||||
wc=0.0005,0.0005,0.0005,0.0005
|
||||
wball=0,0,0,0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[fc1024c]
|
||||
epsW=0.02,0.02,0.02,0.02
|
||||
epsB=0.04
|
||||
momW=0.9,0.9,0.9,0.9
|
||||
momB=0.9
|
||||
wc=0.0005,0.0005,0.0005,0.0005
|
||||
wball=0,0,0,0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[fc1024d]
|
||||
epsW=0.02,0.02,0.02,0.02
|
||||
epsB=0.04
|
||||
momW=0.9,0.9,0.9,0.9
|
||||
momB=0.9
|
||||
wc=0.0005,0.0005,0.0005,0.0005
|
||||
wball=0,0,0,0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[fc1024ba]
|
||||
epsW=0.02,0.02,0.02,0.02
|
||||
epsB=0.04
|
||||
momW=0.9,0.9,0.9,0.9
|
||||
momB=0.9
|
||||
wc=0.0005,0.0005,0.0005,0.0005
|
||||
wball=0,0,0,0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[fc1024bb]
|
||||
epsW=0.02,0.02,0.02,0.02
|
||||
epsB=0.04
|
||||
momW=0.9,0.9,0.9,0.9
|
||||
momB=0.9
|
||||
wc=0.0005,0.0005,0.0005,0.0005
|
||||
wball=0,0,0,0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[fc1024bc]
|
||||
epsW=0.02,0.02,0.02,0.02
|
||||
epsB=0.04
|
||||
momW=0.9,0.9,0.9,0.9
|
||||
momB=0.9
|
||||
wc=0.0005,0.0005,0.0005,0.0005
|
||||
wball=0,0,0,0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[fc1024bd]
|
||||
epsW=0.02,0.02,0.02,0.02
|
||||
epsB=0.04
|
||||
momW=0.9,0.9,0.9,0.9
|
||||
momB=0.9
|
||||
wc=0.0005,0.0005,0.0005,0.0005
|
||||
wball=0,0,0,0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[fc1000a]
|
||||
epsW=0.02,0.02,0.02,0.02
|
||||
epsB=0.04
|
||||
momW=0.9,0.9,0.9,0.9
|
||||
momB=0.9
|
||||
wc=0.0005,0.0005,0.0005,0.0005
|
||||
wball=0,0,0,0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[fc1000b]
|
||||
epsW=0.02,0.02,0.02,0.02
|
||||
epsB=0.04
|
||||
momW=0.9,0.9,0.9,0.9
|
||||
momB=0.9
|
||||
wc=0.0005,0.0005,0.0005,0.0005
|
||||
wball=0,0,0,0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[fc1000c]
|
||||
epsW=0.02,0.02,0.02,0.02
|
||||
epsB=0.04
|
||||
momW=0.9,0.9,0.9,0.9
|
||||
momB=0.9
|
||||
wc=0.0005,0.0005,0.0005,0.0005
|
||||
wball=0,0,0,0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[fc1000d]
|
||||
epsW=0.02,0.02,0.02,0.02
|
||||
epsB=0.04
|
||||
momW=0.9,0.9,0.9,0.9
|
||||
momB=0.9
|
||||
wc=0.0005,0.0005,0.0005,0.0005
|
||||
wball=0,0,0,0
|
||||
schedW=dexp[tgtFactor=250,noiseStdev=0,numSteps=4]
|
||||
schedB=dexp[tgtFactor=10,noiseStdev=0,numSteps=2]
|
||||
|
||||
[logprob]
|
||||
coeff=1
|
||||
topk=5
|
||||
|
||||
[hs1a]
|
||||
enable=true
|
||||
|
||||
[hs1b]
|
||||
enable=true
|
||||
|
||||
[hs1c]
|
||||
enable=true
|
||||
|
||||
[hs1d]
|
||||
enable=true
|
||||
|
||||
[hs2a]
|
||||
enable=true
|
||||
|
||||
[hs2b]
|
||||
enable=true
|
||||
|
||||
[hs2c]
|
||||
enable=true
|
||||
|
||||
[hs2d]
|
||||
enable=true
|
||||
|
||||
[rnorm1a]
|
||||
scale=0.0001
|
||||
pow=0.75
|
||||
minDiv=2
|
||||
|
||||
[rnorm1b]
|
||||
scale=0.0001
|
||||
pow=0.75
|
||||
minDiv=2
|
||||
|
||||
[rnorm1c]
|
||||
scale=0.0001
|
||||
pow=0.75
|
||||
minDiv=2
|
||||
|
||||
[rnorm1d]
|
||||
scale=0.0001
|
||||
pow=0.75
|
||||
minDiv=2
|
||||
|
||||
[rnorm2a]
|
||||
scale=0.0001
|
||||
pow=0.75
|
||||
minDiv=2
|
||||
|
||||
[rnorm2b]
|
||||
scale=0.0001
|
||||
pow=0.75
|
||||
minDiv=2
|
||||
|
||||
[rnorm2c]
|
||||
scale=0.0001
|
||||
pow=0.75
|
||||
minDiv=2
|
||||
|
||||
[rnorm2d]
|
||||
scale=0.0001
|
||||
pow=0.75
|
||||
minDiv=2
|
||||
|
||||
[cnorm2a]
|
||||
scale=0.001
|
||||
pow=0.75
|
||||
|
||||
[cnorm2b]
|
||||
scale=0.001
|
||||
pow=0.75
|
||||
|
||||
[cnorm2c]
|
||||
scale=0.001
|
||||
pow=0.75
|
||||
|
||||
[cnorm2d]
|
||||
scale=0.001
|
||||
pow=0.75
|
||||
|
||||
# This is like 183, but with half as many top-level conv filters, so that the number of params is not unreasonably large.
|
||||
# Also, the fc layers are not fully connected (not to 3).
|
||||
# on krunch
|
||||
# 50 epochs
|
||||
# logs/layers-184.log
|
||||
# /nobackup/kriz/tmp/ConvNet__2013-03-04_04.05.18
|
Loading…
Add table
Add a link
Reference in a new issue