203 lines
2.8 KiB
INI
203 lines
2.8 KiB
INI
# Training hyperparameters for the layer named "conv1a".
# NOTE(review): key meanings are not defined in this file; presumably
# epsW/epsB are weight/bias learning rates, momW/momB weight/bias momentum
# and wc weight decay -- confirm against the program that reads this file.
[conv1a]
|
|
# 0.0001 is the value the "set epsw to 0.0001 from 0.001" notes at the end of
# this file finish on (assuming "epsw" there refers to this key).
epsW=0.0001
|
|
epsB=0.002
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
# NOTE(review): purpose of wball is not evident from this file; it is zero here.
wball=0.00
|
|
|
|
# Training hyperparameters for the layer named "conv1b"; the values are the
# same as those listed under [conv1a].
# NOTE(review): key meanings are not defined in this file; presumably
# epsW/epsB are weight/bias learning rates, momW/momB weight/bias momentum
# and wc weight decay -- confirm against the program that reads this file.
[conv1b]
|
|
epsW=0.0001
|
|
epsB=0.002
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
# NOTE(review): purpose of wball is not evident from this file; it is zero here.
wball=0.00
|
|
|
|
# Training hyperparameters for the layer named "conv2a".
# epsW, momW, wc and wball each list two comma-separated values, while epsB
# and momB list a single value.
# NOTE(review): presumably one weight-related value per input of this layer,
# with epsW/epsB = learning rates, momW/momB = momentum, wc = weight decay --
# confirm against the program that reads this file.
[conv2a]
|
|
epsW=0.0001,0.0001
|
|
epsB=0.002
|
|
momW=0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005
|
|
# NOTE(review): purpose of wball is not evident from this file; both entries are zero.
wball=0.00,0.00
|
|
|
|
# Training hyperparameters for the layer named "conv2b"; the values are the
# same as those listed under [conv2a].
# epsW, momW, wc and wball each list two comma-separated values, while epsB
# and momB list a single value.
# NOTE(review): presumably one weight-related value per input of this layer --
# confirm against the program that reads this file.
[conv2b]
|
|
epsW=0.0001,0.0001
|
|
epsB=0.002
|
|
momW=0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005
|
|
# NOTE(review): purpose of wball is not evident from this file; both entries are zero.
wball=0.00,0.00
|
|
|
|
# Training hyperparameters for the layer named "conv3a".
# The weight-related keys (epsW, momW, wc, wball) carry two comma-separated
# values; the bias-related keys (epsB, momB) carry one.
# NOTE(review): presumably eps* are learning rates, mom* momentum and wc
# weight decay, with one weight value per layer input -- confirm against the
# program that reads this file.
[conv3a]
|
|
epsW=0.0001,0.0001
|
|
epsB=0.002
|
|
momW=0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005
|
|
# NOTE(review): purpose of wball is not evident from this file; both entries are zero.
wball=0,0
|
|
|
|
# Training hyperparameters for the layer named "conv3b"; the values are the
# same as those listed under [conv3a].
# The weight-related keys (epsW, momW, wc, wball) carry two comma-separated
# values; the bias-related keys (epsB, momB) carry one.
# NOTE(review): presumably one weight value per layer input -- confirm against
# the program that reads this file.
[conv3b]
|
|
epsW=0.0001,0.0001
|
|
epsB=0.002
|
|
momW=0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005
|
|
# NOTE(review): purpose of wball is not evident from this file; both entries are zero.
wball=0,0
|
|
|
|
# Training hyperparameters for the layer named "conv4a". Every key here holds
# a single value.
# NOTE(review): key meanings are not defined in this file; presumably
# epsW/epsB are weight/bias learning rates, momW/momB weight/bias momentum
# and wc weight decay -- confirm against the program that reads this file.
[conv4a]
|
|
epsW=0.0001
|
|
epsB=0.002
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
# NOTE(review): purpose of wball is not evident from this file; it is zero here.
wball=0
|
|
|
|
# Training hyperparameters for the layer named "conv4b"; the values are the
# same as those listed under [conv4a]. Every key here holds a single value.
# NOTE(review): key meanings are not defined in this file; presumably
# epsW/epsB are weight/bias learning rates, momW/momB weight/bias momentum
# and wc weight decay -- confirm against the program that reads this file.
[conv4b]
|
|
epsW=0.0001
|
|
epsB=0.002
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
# NOTE(review): purpose of wball is not evident from this file; it is zero here.
wball=0
|
|
|
|
# Training hyperparameters for the layer named "conv5a". Every key here holds
# a single value.
# NOTE(review): key meanings are not defined in this file; presumably
# epsW/epsB are weight/bias learning rates, momW/momB weight/bias momentum
# and wc weight decay -- confirm against the program that reads this file.
[conv5a]
|
|
epsW=0.0001
|
|
epsB=0.002
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
# NOTE(review): purpose of wball is not evident from this file; it is zero here.
wball=0
|
|
|
|
# Training hyperparameters for the layer named "conv5b"; the values are the
# same as those listed under [conv5a]. Every key here holds a single value.
# NOTE(review): key meanings are not defined in this file; presumably
# epsW/epsB are weight/bias learning rates, momW/momB weight/bias momentum
# and wc weight decay -- confirm against the program that reads this file.
[conv5b]
|
|
epsW=0.0001
|
|
epsB=0.002
|
|
momW=0.9
|
|
momB=0.9
|
|
wc=0.0005
|
|
# NOTE(review): purpose of wball is not evident from this file; it is zero here.
wball=0
|
|
|
|
# Training hyperparameters for the layer named "conv6a".
# The "141 notes" at the end of this file describe this net as "like #137 but
# with conv6, also communication in conv6".
# epsW, momW, wc and wball each list two comma-separated values, while epsB
# and momB list a single value.
# NOTE(review): presumably one weight-related value per input of this layer --
# confirm against the program that reads this file.
[conv6a]
|
|
epsW=0.0001,0.0001
|
|
epsB=0.002
|
|
momW=0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005
|
|
# NOTE(review): purpose of wball is not evident from this file; both entries are zero.
wball=0,0
|
|
|
|
# Training hyperparameters for the layer named "conv6b"; the values are the
# same as those listed under [conv6a].
# The "141 notes" at the end of this file describe this net as "like #137 but
# with conv6, also communication in conv6".
# epsW, momW, wc and wball each list two comma-separated values, while epsB
# and momB list a single value.
# NOTE(review): presumably one weight-related value per input of this layer --
# confirm against the program that reads this file.
[conv6b]
|
|
epsW=0.0001,0.0001
|
|
epsB=0.002
|
|
momW=0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005
|
|
# NOTE(review): purpose of wball is not evident from this file; both entries are zero.
wball=0,0
|
|
|
|
# Training hyperparameters for the layer named "fc2048a".
# NOTE(review): the name suggests a fully-connected layer with 2048 outputs,
# but the layer definition is not part of this file -- confirm.
# epsW, momW, wc and wball each list two comma-separated values, while epsB
# and momB list a single value (presumably one weight value per layer input).
[fc2048a]
|
|
epsW=0.0001,0.0001
|
|
epsB=0.002
|
|
momW=0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005
|
|
# NOTE(review): purpose of wball is not evident from this file; both entries are zero.
wball=0,0
|
|
|
|
# Training hyperparameters for the layer named "fc2048b"; the values are the
# same as those listed under [fc2048a].
# NOTE(review): the name suggests a fully-connected layer with 2048 outputs,
# but the layer definition is not part of this file -- confirm.
# epsW, momW, wc and wball each list two comma-separated values, while epsB
# and momB list a single value (presumably one weight value per layer input).
[fc2048b]
|
|
epsW=0.0001,0.0001
|
|
epsB=0.002
|
|
momW=0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005
|
|
# NOTE(review): purpose of wball is not evident from this file; both entries are zero.
wball=0,0
|
|
|
|
# Training hyperparameters for the layer named "fc2048ba".
# NOTE(review): the name suggests a second fully-connected 2048-output stage,
# but the layer definition is not part of this file -- confirm.
# epsW, momW, wc and wball each list two comma-separated values, while epsB
# and momB list a single value (presumably one weight value per layer input).
[fc2048ba]
|
|
epsW=0.0001,0.0001
|
|
epsB=0.002
|
|
momW=0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005
|
|
# NOTE(review): purpose of wball is not evident from this file; both entries are zero.
wball=0,0
|
|
|
|
# Training hyperparameters for the layer named "fc2048bb"; the values are the
# same as those listed under [fc2048ba].
# NOTE(review): the name suggests a second fully-connected 2048-output stage,
# but the layer definition is not part of this file -- confirm.
# epsW, momW, wc and wball each list two comma-separated values, while epsB
# and momB list a single value (presumably one weight value per layer input).
[fc2048bb]
|
|
epsW=0.0001,0.0001
|
|
epsB=0.002
|
|
momW=0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005
|
|
# NOTE(review): purpose of wball is not evident from this file; both entries are zero.
wball=0,0
|
|
|
|
# Training hyperparameters for the layer named "fc1000".
# NOTE(review): the name suggests a fully-connected layer with 1000 outputs,
# but the layer definition is not part of this file -- confirm.
# epsW, momW, wc and wball each list two comma-separated values, while epsB
# and momB list a single value (presumably one weight value per layer input).
[fc1000]
|
|
epsW=0.0001,0.0001
|
|
epsB=0.002
|
|
momW=0.9,0.9
|
|
momB=0.9
|
|
wc=0.0005,0.0005
|
|
# NOTE(review): purpose of wball is not evident from this file; both entries are zero.
wball=0,0
|
|
|
|
# Settings for the layer named "logprob".
# NOTE(review): presumably a cost/objective layer, where coeff scales its
# contribution and topk selects top-k error reporting -- neither is defined in
# this file; confirm against the program that reads it.
[logprob]
|
|
coeff=1
|
|
topk=5
|
|
|
|
# Settings for the layer named "hs1a"; its only key switches it on.
# NOTE(review): what an "hs" layer does is not defined in this file -- confirm
# against the layer definition before changing this flag.
[hs1a]
|
|
enable=true
|
|
|
|
# Settings for the layer named "hs2a"; its only key switches it on.
# NOTE(review): what an "hs" layer does is not defined in this file -- confirm
# against the layer definition before changing this flag.
[hs2a]
|
|
enable=true
|
|
|
|
# Settings for the layer named "hs1b"; its only key switches it on.
# NOTE(review): what an "hs" layer does is not defined in this file -- confirm
# against the layer definition before changing this flag.
[hs1b]
|
|
enable=true
|
|
|
|
# Settings for the layer named "hs2b"; its only key switches it on.
# NOTE(review): what an "hs" layer does is not defined in this file -- confirm
# against the layer definition before changing this flag.
[hs2b]
|
|
enable=true
|
|
|
|
# Parameters for the layer named "rnorm1a".
# NOTE(review): presumably a response-normalization layer, with scale as the
# multiplicative factor, pow as the exponent and minDiv as a lower bound on
# the divisor -- none of this is defined in this file; confirm.
[rnorm1a]
|
|
scale=0.0001
|
|
pow=0.75
|
|
minDiv=2
|
|
|
|
# Parameters for the layer named "rnorm1b"; the values are the same as those
# listed under [rnorm1a].
# NOTE(review): presumably a response-normalization layer, with scale as the
# multiplicative factor, pow as the exponent and minDiv as a lower bound on
# the divisor -- none of this is defined in this file; confirm.
[rnorm1b]
|
|
scale=0.0001
|
|
pow=0.75
|
|
minDiv=2
|
|
|
|
# Parameters for the layer named "rnorm2a".
# NOTE(review): presumably a response-normalization layer, with scale as the
# multiplicative factor, pow as the exponent and minDiv as a lower bound on
# the divisor -- none of this is defined in this file; confirm.
[rnorm2a]
|
|
scale=0.0001
|
|
pow=0.75
|
|
minDiv=2
|
|
|
|
# Parameters for the layer named "rnorm2b"; the values are the same as those
# listed under [rnorm2a].
# NOTE(review): presumably a response-normalization layer, with scale as the
# multiplicative factor, pow as the exponent and minDiv as a lower bound on
# the divisor -- none of this is defined in this file; confirm.
[rnorm2b]
|
|
scale=0.0001
|
|
pow=0.75
|
|
minDiv=2
|
|
|
|
# Parameters for the layer named "cnorm2a".
# Unlike the [rnorm*] sections in this file, no minDiv key is given here and
# scale is 0.001 rather than 0.0001.
# NOTE(review): presumably a contrast-normalization layer, with scale as the
# multiplicative factor and pow as the exponent -- not defined in this file;
# confirm.
[cnorm2a]
|
|
scale=0.001
|
|
pow=0.75
|
|
|
|
# Parameters for the layer named "cnorm2b"; the values are the same as those
# listed under [cnorm2a].
# Unlike the [rnorm*] sections in this file, no minDiv key is given here and
# scale is 0.001 rather than 0.0001.
# NOTE(review): presumably a contrast-normalization layer, with scale as the
# multiplicative factor and pow as the exponent -- not defined in this file;
# confirm.
[cnorm2b]
|
|
scale=0.001
|
|
pow=0.75
|
|
|
|
# this is like 141, but trained on half of 2009 ImageNet, to be comparable to Google's results
|
|
# logs/layers-141-2009-half.log
|
|
# /nobackup/kriz/tmp/ConvNet__2012-09-09_00.26.31
|
|
# on guppy9
|
|
# epoch 6.2600: set epsw to 0.001 from 0.01
|
|
# epoch 13.3361: set epsw to 0.0001 from 0.001
|
|
# epoch 18.2396: set epsw to 0.00001 from 0.0001 on conv1,conv2
|
|
# set color noise to 0 from 0.1
|
|
# epoch 21.1949: set epsw to 0 from 0.00001 on conv1,conv2
|
|
# epoch 25.3718: set epsw to 0.00001 from 0.0001
|
|
# epoch 28.3271: killed
|
|
# ok, test error rate is a bit worse than 131, restarting with epsw 0.001, color noise 0.1
|
|
# epoch 44.183: set epsw to 0.0001 from 0.001
|
|
# epoch 56: eek, it started getting worse on validation :/
|
|
|
|
# 141 notes:
|
|
# this is like #137 but with conv6, also communication in conv6
|
|
# /nobackup/kriz/tmp/ConvNet__2012-09-03_16.27.48
|
|
# logs/layers-141.log
|
|
# epoch 23: set epsw to 0.001 from 0.01
|
|
# epoch 48: set epsw to 0.0001 from 0.001
|
|
# epoch 60: this seems overfitty....killing
|
|
# but will use these weights to initialize a net on 2009... why the hell not?
|