# AlexNet/layers/layer-params-183-4gpu-exp.cfg
# Laurent El Shafey 9fdd561586 Initial commit
# 2024-12-10 08:56:11 -08:00
#
# 450 lines
# 6.7 KiB
# INI

# conv1a-conv1d: four sections carrying identical update settings, one scalar
# value per key.
# NOTE(review): the key meanings are not defined in this file. In
# cuda-convnet-style configs epsW/epsB are presumably the weight/bias learning
# rates, momW/momB the momenta, wc the weight decay and wball a weight-norm
# bound -- confirm against the trainer that reads this file.
# NOTE(review): the a/b/c/d suffixes presumably map to the four GPUs named in
# the "4gpu" config name -- confirm against the matching layer definition file.
# Both schedules select "exp" with noiseStdev=0; the weight schedule uses
# tgtFactor=1000 and the bias schedule tgtFactor=10.
[conv1a]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[conv1b]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[conv1c]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[conv1d]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
# conv2a-conv2d: four sections with identical settings, one scalar value per
# key. epsB (0.08) is twice epsW (0.04); momW and momB are both 0.9.
# NOTE(review): presumably eps* are learning rates, mom* momenta, wc weight
# decay and wball a weight-norm bound -- not defined in this file, confirm
# against the consuming trainer.
# schedW uses exp with tgtFactor=1000, schedB uses exp with tgtFactor=10;
# noiseStdev is 0 for both.
[conv2a]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[conv2b]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[conv2c]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[conv2d]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
# conv3a-conv3d: four sections with identical settings. The weight-side keys
# (epsW, momW, wc, wball) each list three comma-separated values, all equal
# within a key; the bias-side keys (epsB, momB) stay scalar.
# NOTE(review): the three entries presumably correspond to three inputs feeding
# each conv3 layer -- confirm against the matching layer definition file.
# schedW/schedB are single values: exp with tgtFactor=1000 for weights and
# tgtFactor=10 for biases, noiseStdev=0 in both.
[conv3a]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[conv3b]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[conv3c]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[conv3d]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
# conv4a-conv4d: four sections with identical settings, one scalar value per
# key (wball is written as 0 here).
# NOTE(review): presumably eps* are learning rates, mom* momenta, wc weight
# decay and wball a weight-norm bound -- not defined in this file, confirm
# against the consuming trainer.
# Weight schedule: exp, tgtFactor=1000. Bias schedule: exp, tgtFactor=10.
# noiseStdev is 0 for both.
[conv4a]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[conv4b]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[conv4c]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[conv4d]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
# conv5a-conv5d: four sections with identical settings, one scalar value per
# key: epsW=0.04, epsB=0.08, momW=momB=0.9, wc=0.0005, wball=0.
# NOTE(review): key semantics (learning rate / momentum / weight decay /
# weight-norm bound) are presumed from naming only -- confirm against the
# consuming trainer.
# Both schedules are exp with noiseStdev=0; tgtFactor is 1000 for weights and
# 10 for biases.
[conv5a]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[conv5b]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[conv5c]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[conv5d]
epsW=0.04
epsB=0.08
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
# conv6a-conv6d: four sections with identical settings. This is the sixth conv
# layer group mentioned in the note at the end of this file.
# The weight-side keys (epsW, momW, wc, wball) each list three comma-separated
# values, all equal within a key; epsB and momB stay scalar.
# NOTE(review): the three entries presumably correspond to three inputs feeding
# each conv6 layer -- confirm against the matching layer definition file.
# Schedules: exp with tgtFactor=1000 (weights) and tgtFactor=10 (biases),
# noiseStdev=0.
[conv6a]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[conv6b]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[conv6c]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[conv6d]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
# fc1024a-fc1024d: four sections with identical settings. epsW, momW, wc and
# wball each list three comma-separated values (all equal within a key);
# epsB and momB are scalar.
# NOTE(review): presumably fully-connected layers with one list entry per
# input -- neither the layer type nor the input count is visible in this file;
# confirm against the matching layer definition file.
# Schedules: exp with tgtFactor=1000 (weights) and tgtFactor=10 (biases),
# noiseStdev=0.
[fc1024a]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[fc1024b]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[fc1024c]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[fc1024d]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
# fc1024ba-fc1024bd: four sections with identical settings. epsW, momW, wc and
# wball each list three comma-separated values (all equal within a key);
# epsB and momB are scalar.
# NOTE(review): the "b" infix presumably marks a second 1024-unit
# fully-connected stage -- not established by this file; confirm against the
# matching layer definition file.
# Schedules: exp with tgtFactor=1000 (weights) and tgtFactor=10 (biases),
# noiseStdev=0.
[fc1024ba]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[fc1024bb]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[fc1024bc]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[fc1024bd]
epsW=0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005
wball=0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
# fc1000a-fc1000d: four sections with identical settings. Unlike the other
# list-valued sections in this file, epsW, momW, wc and wball here each list
# FOUR comma-separated values (all equal within a key); epsB and momB are
# scalar.
# NOTE(review): four entries presumably means each fc1000 layer takes four
# inputs -- confirm against the matching layer definition file before changing
# the list lengths.
# Schedules: exp with tgtFactor=1000 (weights) and tgtFactor=10 (biases),
# noiseStdev=0.
[fc1000a]
epsW=0.04,0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005,0.0005
wball=0,0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[fc1000b]
epsW=0.04,0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005,0.0005
wball=0,0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[fc1000c]
epsW=0.04,0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005,0.0005
wball=0,0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
[fc1000d]
epsW=0.04,0.04,0.04,0.04
epsB=0.08
momW=0.9,0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005,0.0005
wball=0,0,0,0
schedW=exp[tgtFactor=1000,noiseStdev=0]
schedB=exp[tgtFactor=10,noiseStdev=0]
# logprob: the only section in this file with coeff/topk keys and no update
# settings.
# NOTE(review): presumably the log-probability cost layer, with coeff as its
# weighting and topk=5 selecting top-5 error reporting -- confirm against the
# consuming trainer.
[logprob]
coeff=1
topk=5
# hs1a-hs1d and hs2a-hs2d: eight sections whose only key is enable, set to
# true in every one of them.
# NOTE(review): this file does not say what an "hs" layer is or what disabling
# it does -- check the matching layer definition file before toggling.
[hs1a]
enable=true
[hs1b]
enable=true
[hs1c]
enable=true
[hs1d]
enable=true
[hs2a]
enable=true
[hs2b]
enable=true
[hs2c]
enable=true
[hs2d]
enable=true
# rnorm1a-rnorm1d and rnorm2a-rnorm2d: eight sections with identical values
# (scale=0.0001, pow=0.75, minDiv=2).
# NOTE(review): presumably response-normalization layers where scale and pow
# parameterize the normalization term and minDiv is a floor on the divisor --
# the formula is not shown in this file; confirm against the consuming trainer.
[rnorm1a]
scale=0.0001
pow=0.75
minDiv=2
[rnorm1b]
scale=0.0001
pow=0.75
minDiv=2
[rnorm1c]
scale=0.0001
pow=0.75
minDiv=2
[rnorm1d]
scale=0.0001
pow=0.75
minDiv=2
[rnorm2a]
scale=0.0001
pow=0.75
minDiv=2
[rnorm2b]
scale=0.0001
pow=0.75
minDiv=2
[rnorm2c]
scale=0.0001
pow=0.75
minDiv=2
[rnorm2d]
scale=0.0001
pow=0.75
minDiv=2
# cnorm2a-cnorm2d: four sections with identical values (scale=0.001,
# pow=0.75). No minDiv key is set here, and scale is ten times the 0.0001 used
# by the rnorm sections in this file.
# NOTE(review): presumably contrast-normalization layers; whether minDiv is
# unsupported or just left at a default is not visible here -- confirm against
# the consuming trainer.
[cnorm2a]
scale=0.001
pow=0.75
[cnorm2b]
scale=0.001
pow=0.75
[cnorm2c]
scale=0.001
pow=0.75
[cnorm2d]
scale=0.001
pow=0.75
# This is like 170-4gpu-exp, but with a 6th conv layer and 48 low-level filters.
# Run on krunch:
#   /nobackup/kriz/tmp/ConvNet__2013-02-26_20.53.34
#   logs/layers-183.log
# Run was killed: exp is bad.