2016-06-06 23:22:45 +03:00
|
|
|
# Global section: input size, batching, optimizer and schedule settings.
# NOTE(review): section/key names look like the Darknet cfg format - confirm
# which parser consumes this file.
[net]
|
|
|
|
# Presumably the width of each input vector (TODO confirm). The [connected]
# layer further down uses the same value (output=256).
inputs=256
|
2017-06-10 02:41:00 +03:00
|
|
|
|
|
|
|
# Test: this batch/time_steps pair is the one active in this file.
# To use the Train values instead, comment out the two keys below and
# uncomment the pair listed under "Train".
|
2016-06-06 23:22:45 +03:00
|
|
|
batch=1
|
2017-06-10 02:41:00 +03:00
|
|
|
time_steps=1
|
|
|
|
|
|
|
|
# Train: alternative values, disabled while the Test pair above is active.
|
|
|
|
# batch=512
|
|
|
|
# time_steps=64
|
|
|
|
|
|
|
|
# Optimizer settings (still part of [net]).
# NOTE(review): meanings below are inferred from the key names - confirm
# against the consuming framework.
# Presumably how many pieces each batch is split into; 1 = no splitting.
subdivisions=1
|
2016-06-06 23:22:45 +03:00
|
|
|
# Presumably the SGD momentum coefficient.
momentum=0.9
|
|
|
|
# Presumably the weight-decay (L2) coefficient.
decay=0.001
|
2017-06-10 02:41:00 +03:00
|
|
|
# Presumably the base learning rate that the schedule keys below modify.
learning_rate=0.1
|
2016-06-06 23:22:45 +03:00
|
|
|
|
2017-06-10 02:41:00 +03:00
|
|
|
# Learning-rate schedule (still part of [net]).
# NOTE(review): meanings below are inferred from the key names - confirm
# against the consuming framework.
# Presumably the number of warm-up iterations before the full rate applies.
burn_in=100
|
2016-06-06 23:22:45 +03:00
|
|
|
# Schedule type; "poly" presumably selects polynomial decay using power.
policy=poly
|
|
|
|
# Presumably the exponent used by the poly policy.
power=4
|
2017-06-10 02:41:00 +03:00
|
|
|
# Presumably the total number of training iterations.
max_batches=10000
|
2016-06-06 23:22:45 +03:00
|
|
|
|
|
|
|
# First layer in file order: a GRU section with two options.
[gru]
|
|
|
|
# Flag set to 1; presumably enables batch normalization in this layer
# (TODO confirm against the consuming framework).
batch_normalize=1
|
|
|
|
# Presumably the number of output units of this layer (TODO confirm).
output=1024
|
|
|
|
|
|
|
|
# Second layer in file order; listed directly after [gru].
[connected]
|
|
|
|
# Same value as inputs=256 in [net].
output=256
|
|
|
|
# "linear" presumably means no non-linearity is applied here (TODO confirm);
# the next section in the file is [softmax].
activation=linear
|
|
|
|
|
|
|
|
# Softmax section with no options of its own; it follows [connected] in file
# order.
[softmax]
|
|
|
|
|
|
|
|
# Last section in the file: the cost (loss) definition.
[cost]
|
|
|
|
# "sse" presumably stands for sum of squared errors (TODO confirm against the
# consuming framework).
type=sse
|
|
|
|
|