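# Per-layer parameters: one INI section per layer name, key=value pairs inside.
# NOTE(review): the consuming program is not visible from this file; confirm
# which parser reads it before relying on '#' comments or comma-separated lists.
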
# conv1a-conv1d: four sections (suffixes a-d) carrying identical settings.
# NOTE(review): key meanings follow the cuda-convnet layer-params convention;
# confirm that is the consumer of this file.
#   epsW / epsB  learning rate for weights / biases
#   momW / momB  momentum for weights / biases
#   wc           L2 weight-decay coefficient
#   wball        meaning not visible here; 0 presumably disables it -- verify
[conv1a]
epsW=0.0001
epsB=0.02
momW=0.9
momB=0.9
wc=0.0005
wball=0.00

[conv1b]
epsW=0.0001
epsB=0.02
momW=0.9
momB=0.9
wc=0.0005
wball=0.00

[conv1c]
epsW=0.0001
epsB=0.02
momW=0.9
momB=0.9
wc=0.0005
wball=0.00

[conv1d]
epsW=0.0001
epsB=0.02
momW=0.9
momB=0.9
wc=0.0005
wball=0.00

# conv2a-conv2d: four sections (suffixes a-d) carrying identical settings.
# epsW, momW, wc and wball each hold two comma-separated values; epsB and momB
# hold one. Presumably one weight-side value per input of the layer -- confirm.
# NOTE(review): key meanings follow the cuda-convnet layer-params convention
# (epsW/epsB learning rates, momW/momB momenta, wc L2 weight decay); the
# meaning of wball is not visible here.
[conv2a]
epsW=0.0001,0.0001
epsB=0.02
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0.00,0.00

[conv2b]
epsW=0.0001,0.0001
epsB=0.02
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0.00,0.00

[conv2c]
epsW=0.0001,0.0001
epsB=0.02
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0.00,0.00

[conv2d]
epsW=0.0001,0.0001
epsB=0.02
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0.00,0.00

# conv3a-conv3d: four sections (suffixes a-d) carrying identical settings.
# epsW, momW, wc and wball each hold two comma-separated values; epsB and momB
# hold one. Presumably one weight-side value per input of the layer -- confirm.
# NOTE(review): key meanings follow the cuda-convnet layer-params convention
# (epsW/epsB learning rates, momW/momB momenta, wc L2 weight decay); the
# meaning of wball is not visible here.
[conv3a]
epsW=0.0001,0.0001
epsB=0.02
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

[conv3b]
epsW=0.0001,0.0001
epsB=0.02
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

[conv3c]
epsW=0.0001,0.0001
epsB=0.02
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

[conv3d]
epsW=0.0001,0.0001
epsB=0.02
momW=0.9,0.9
momB=0.9
wc=0.0005,0.0005
wball=0,0

# conv4a-conv4d: four sections (suffixes a-d) carrying identical settings,
# one value per key.
# NOTE(review): key meanings follow the cuda-convnet layer-params convention
# (epsW/epsB learning rates, momW/momB momenta, wc L2 weight decay); the
# meaning of wball is not visible here.
[conv4a]
epsW=0.0001
epsB=0.02
momW=0.9
momB=0.9
wc=0.0005
wball=0

[conv4b]
epsW=0.0001
epsB=0.02
momW=0.9
momB=0.9
wc=0.0005
wball=0

[conv4c]
epsW=0.0001
epsB=0.02
momW=0.9
momB=0.9
wc=0.0005
wball=0

[conv4d]
epsW=0.0001
epsB=0.02
momW=0.9
momB=0.9
wc=0.0005
wball=0

# conv5a-conv5d: four sections (suffixes a-d) carrying identical settings,
# one value per key.
# NOTE(review): key meanings follow the cuda-convnet layer-params convention
# (epsW/epsB learning rates, momW/momB momenta, wc L2 weight decay); the
# meaning of wball is not visible here.
[conv5a]
epsW=0.0001
epsB=0.02
momW=0.9
momB=0.9
wc=0.0005
wball=0

[conv5b]
epsW=0.0001
epsB=0.02
momW=0.9
momB=0.9
wc=0.0005
wball=0

[conv5c]
epsW=0.0001
epsB=0.02
momW=0.9
momB=0.9
wc=0.0005
wball=0

[conv5d]
epsW=0.0001
epsB=0.02
momW=0.9
momB=0.9
wc=0.0005
wball=0

# fc1024-1a..fc1024-1d: four sections (suffixes a-d) carrying identical
# settings. epsW, momW, wc and wball each hold four comma-separated values;
# epsB and momB hold one. Presumably one weight-side value per input of the
# layer -- confirm.
# NOTE(review): key meanings follow the cuda-convnet layer-params convention
# (epsW/epsB learning rates, momW/momB momenta, wc L2 weight decay); the
# meaning of wball is not visible here.
[fc1024-1a]
epsW=0.0001,0.0001,0.0001,0.0001
epsB=0.02
momW=0.9,0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005,0.0005
wball=0,0,0,0

[fc1024-1b]
epsW=0.0001,0.0001,0.0001,0.0001
epsB=0.02
momW=0.9,0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005,0.0005
wball=0,0,0,0

[fc1024-1c]
epsW=0.0001,0.0001,0.0001,0.0001
epsB=0.02
momW=0.9,0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005,0.0005
wball=0,0,0,0

[fc1024-1d]
epsW=0.0001,0.0001,0.0001,0.0001
epsB=0.02
momW=0.9,0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005,0.0005
wball=0,0,0,0

# fc1024-2a..fc1024-2d: four sections (suffixes a-d) carrying identical
# settings. epsW, momW, wc and wball each hold four comma-separated values;
# epsB and momB hold one. Presumably one weight-side value per input of the
# layer -- confirm.
# NOTE(review): key meanings follow the cuda-convnet layer-params convention
# (epsW/epsB learning rates, momW/momB momenta, wc L2 weight decay); the
# meaning of wball is not visible here.
[fc1024-2a]
epsW=0.0001,0.0001,0.0001,0.0001
epsB=0.02
momW=0.9,0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005,0.0005
wball=0,0,0,0

[fc1024-2b]
epsW=0.0001,0.0001,0.0001,0.0001
epsB=0.02
momW=0.9,0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005,0.0005
wball=0,0,0,0

[fc1024-2c]
epsW=0.0001,0.0001,0.0001,0.0001
epsB=0.02
momW=0.9,0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005,0.0005
wball=0,0,0,0

[fc1024-2d]
epsW=0.0001,0.0001,0.0001,0.0001
epsB=0.02
momW=0.9,0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005,0.0005
wball=0,0,0,0

# fc1000: single section (no a-d suffix). epsW, momW, wc and wball each hold
# four comma-separated values; epsB and momB hold one. Presumably one
# weight-side value per input of the layer -- confirm.
# NOTE(review): key meanings follow the cuda-convnet layer-params convention
# (epsW/epsB learning rates, momW/momB momenta, wc L2 weight decay); the
# meaning of wball is not visible here.
[fc1000]
epsW=0.0001,0.0001,0.0001,0.0001
epsB=0.02
momW=0.9,0.9,0.9,0.9
momB=0.9
wc=0.0005,0.0005,0.0005,0.0005
wball=0,0,0,0

# logprob: settings for the section named logprob.
# NOTE(review): presumably a log-probability cost layer, with coeff scaling
# the cost and topk=5 requesting top-5 error reporting -- confirm against
# the consumer.
[logprob]
coeff=1
topk=5

# hs1a-hs1d: four sections (suffixes a-d), each setting only enable=true.
# NOTE(review): what an "hs" layer does is not visible from this file.
[hs1a]
enable=true

[hs1b]
enable=true

[hs1c]
enable=true

[hs1d]
enable=true

# hs2a-hs2d: four sections (suffixes a-d), each setting only enable=true.
# NOTE(review): what an "hs" layer does is not visible from this file.
[hs2a]
enable=true

[hs2b]
enable=true

[hs2c]
enable=true

[hs2d]
enable=true

# rnorm1a-rnorm1d: four sections (suffixes a-d) carrying identical settings.
# NOTE(review): presumably response-normalization layers, with scale and pow
# the scale factor and exponent of the normalization formula -- confirm.
[rnorm1a]
scale=0.0001
pow=0.75

[rnorm1b]
scale=0.0001
pow=0.75

[rnorm1c]
scale=0.0001
pow=0.75

[rnorm1d]
scale=0.0001
pow=0.75

# rnorm2a-rnorm2d: four sections (suffixes a-d) carrying identical settings.
# NOTE(review): presumably response-normalization layers, with scale and pow
# the scale factor and exponent of the normalization formula -- confirm.
[rnorm2a]
scale=0.0001
pow=0.75

[rnorm2b]
scale=0.0001
pow=0.75

[rnorm2c]
scale=0.0001
pow=0.75

[rnorm2d]
scale=0.0001
pow=0.75

# cnorm2a-cnorm2d: four sections (suffixes a-d) carrying identical settings.
# scale here is 0.001, ten times the 0.0001 used by the rnorm* sections.
# NOTE(review): presumably contrast-normalization layers, with scale and pow
# the scale factor and exponent of the normalization formula -- confirm.
[cnorm2a]
scale=0.001
pow=0.75

[cnorm2b]
scale=0.001
pow=0.75

[cnorm2c]
scale=0.001
pow=0.75

[cnorm2d]
scale=0.001
pow=0.75

# this is like #129, but with 2x as many filters in conv2
# on guppy8
# /nobackup/kriz/tmp/ConvNet__2012-08-07_13.31.34
# logs/layers-130.log
# uhh.. relu wiped this. nice.

# on guppy9
# logs/layers-130a.log
# /nobackup/kriz/tmp/ConvNet__2012-08-09_14.09.20
# epoch 22: set epsW to 0.001 from 0.01
# epoch 46: set epsW to 0.0001 from 0.001
# epoch 62: killed. surprisingly, this is hardly (if at all) better than 2-gpu net