# AlexNet/layers/layer-params-170-256-double.cfg
# Laurent El Shafey 9fdd561586 Initial commit
# 2024-12-10 08:56:11 -08:00

# 203 lines
# 2.5 KiB
# INI

# Training hyperparameters for layer conv1a.
# epsW and epsB are both 0 here, unlike the 0.02 / 0.04 used by the other
# conv sections in this file. The run notes at the end of this file record
# conv1 epsw being set to 0 (from 0.02) at epoch 73.
# NOTE(review): the notes do not mention epsB also being zeroed -- confirm intended.
# NOTE(review): eps* presumably are learning rates, mom* momentum, wc weight
# decay -- verify against the trainer that reads this file.
[conv1a]
epsW=0.0
epsB=0.0
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=dexp[250,0,4]
schedB=dexp[10,0,2]
# Training hyperparameters for layer conv1b; values are identical to [conv1a].
# epsW and epsB are both 0 (the run notes at the end of this file say conv1
# epsw was set to 0 from 0.02 at epoch 73).
# NOTE(review): epsB=0.0 is not covered by that note -- confirm intended.
[conv1b]
epsW=0.0
epsB=0.0
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=dexp[250,0,4]
schedB=dexp[10,0,2]
# Training hyperparameters for layer conv2a (one value per key).
# NOTE(review): eps* look like learning rates -- the run notes at the end of
# this file say eps was doubled for the larger minibatch -- confirm against
# the trainer. The W / B suffixes presumably mean weights / biases.
[conv2a]
epsW=0.02
epsB=0.04
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=dexp[250,0,4]
schedB=dexp[10,0,2]
# Training hyperparameters for layer conv2b; values are identical to [conv2a].
# NOTE(review): the meaning of the dexp[...] schedule arguments is not
# visible in this file -- see the trainer's schedule parser.
[conv2b]
epsW=0.02
epsB=0.04
momW=0.9
momB=0.9
wc=0.0005
wball=0.00
schedW=dexp[250,0,4]
schedB=dexp[10,0,2]
# Training hyperparameters for layer conv3a.
# epsW, momW, wc and wball each list two comma-separated values, while
# epsB and momB have a single value.
# NOTE(review): presumably one weight-parameter value per input of this
# layer -- verify against the layer definition file.
[conv3a]
epsW=0.02,0.02
epsB=0.04
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0
schedW=dexp[250,0,4]
schedB=dexp[10,0,2]
# Training hyperparameters for layer conv3b; values are identical to [conv3a].
# The weight keys (epsW, momW, wc, wball) carry two comma-separated values.
# NOTE(review): presumably one per layer input -- confirm with the layer
# definition file.
[conv3b]
epsW=0.02,0.02
epsB=0.04
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0
schedW=dexp[250,0,4]
schedB=dexp[10,0,2]
# Training hyperparameters for layer conv4a (one value per key).
# NOTE(review): eps* presumably learning rates, mom* momentum, wc weight
# decay -- verify against the trainer that reads this file.
[conv4a]
epsW=0.02
epsB=0.04
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=dexp[250,0,4]
schedB=dexp[10,0,2]
# Training hyperparameters for layer conv4b; values are identical to [conv4a].
[conv4b]
epsW=0.02
epsB=0.04
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=dexp[250,0,4]
schedB=dexp[10,0,2]
# Training hyperparameters for layer conv5a (one value per key).
# Weight and bias schedules differ: schedW=dexp[250,0,4], schedB=dexp[10,0,2].
# NOTE(review): the semantics of the dexp arguments are not shown here -- confirm.
[conv5a]
epsW=0.02
epsB=0.04
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=dexp[250,0,4]
schedB=dexp[10,0,2]
# Training hyperparameters for layer conv5b; values are identical to [conv5a].
[conv5b]
epsW=0.02
epsB=0.04
momW=0.9
momB=0.9
wc=0.0005
wball=0
schedW=dexp[250,0,4]
schedB=dexp[10,0,2]
# Training hyperparameters for layer fc2048a.
# The weight keys (epsW, momW, wc, wball) list two comma-separated values;
# the bias keys (epsB, momB) list one.
# NOTE(review): presumably one weight-parameter value per input of this
# layer -- verify against the layer definition file.
[fc2048a]
epsW=0.02,0.02
epsB=0.04
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0
schedW=dexp[250,0,4]
schedB=dexp[10,0,2]
# Training hyperparameters for layer fc2048b; values are identical to [fc2048a].
# Weight keys carry two comma-separated values, bias keys one.
[fc2048b]
epsW=0.02,0.02
epsB=0.04
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0
schedW=dexp[250,0,4]
schedB=dexp[10,0,2]
# Training hyperparameters for layer fc2048ba.
# Same values as the other fc* sections in this file: two comma-separated
# entries on the weight keys, one on the bias keys.
# NOTE(review): how fc2048ba relates to fc2048a / fc2048b is defined outside
# this file -- check the layer definition file.
[fc2048ba]
epsW=0.02,0.02
epsB=0.04
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0
schedW=dexp[250,0,4]
schedB=dexp[10,0,2]
# Training hyperparameters for layer fc2048bb; values are identical to [fc2048ba].
[fc2048bb]
epsW=0.02,0.02
epsB=0.04
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0
schedW=dexp[250,0,4]
schedB=dexp[10,0,2]
# Training hyperparameters for layer fc1000.
# Uses the same values as the fc2048* sections, including two
# comma-separated entries on each weight key.
# NOTE(review): presumably the final 1000-way layer with two inputs --
# confirm against the layer definition file.
[fc1000]
epsW=0.02,0.02
epsB=0.04
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0
schedW=dexp[250,0,4]
schedB=dexp[10,0,2]
# Settings for the logprob section.
# NOTE(review): presumably the cost layer, with coeff as its weighting and
# topk=5 selecting a top-5 error metric -- confirm against the trainer.
# The run notes at the end of this file report three logprob numbers.
[logprob]
coeff=1
topk=5
# Turns on layer hs1a.
# NOTE(review): the layer type behind the "hs" prefix is not visible in this
# file -- TODO confirm what enable toggles.
[hs1a]
enable=true
# Turns on layer hs2a (same single enable flag as the other hs* sections).
[hs2a]
enable=true
# Turns on layer hs1b (same single enable flag as the other hs* sections).
[hs1b]
enable=true
# Turns on layer hs2b (same single enable flag as the other hs* sections).
[hs2b]
enable=true
# Normalization parameters for rnorm1a; all four rnorm* sections in this
# file use these same values.
# NOTE(review): presumably a response-normalization layer where scale, pow
# and minDiv parameterize the divisor -- confirm the exact formula in the trainer.
[rnorm1a]
scale=0.0001
pow=0.75
minDiv=2
# Normalization parameters for rnorm1b; values are identical to [rnorm1a].
[rnorm1b]
scale=0.0001
pow=0.75
minDiv=2
# Normalization parameters for rnorm2a; same values as the rnorm1* sections.
[rnorm2a]
scale=0.0001
pow=0.75
minDiv=2
# Normalization parameters for rnorm2b; values are identical to [rnorm2a].
[rnorm2b]
scale=0.0001
pow=0.75
minDiv=2
# Normalization parameters for cnorm2a.
# scale is 0.001 here (ten times the 0.0001 used by the rnorm* sections)
# and, unlike rnorm*, no minDiv key is set.
# NOTE(review): presumably a contrast-normalization layer -- confirm.
[cnorm2a]
scale=0.001
pow=0.75
# Normalization parameters for cnorm2b; values are identical to [cnorm2a]
# (scale=0.001, pow=0.75, no minDiv key).
[cnorm2b]
scale=0.001
pow=0.75
# This is #170, but run with a minibatch size of 256 on krunch, with eps doubled to compensate for the larger batch size:
# Use def file 153.
# Not doing fading.
# /nobackup/kriz/tmp/ConvNet__2013-02-05_13.04.30
# logs/layers-170-256-double-eps.log
# Epoch 61: set color noise to 0 (from 0.1).
# Epoch 73: set conv1 epsW to 0 (from 0.02).
# After 84 epochs: logprob: 1.840643, 0.422726, 0.196598
# This matches #170 exactly, so I'm killing it to run 4-GPU experiments.