2018-08-15 20:59:59 +03:00
|
|
|
[net]
|
2018-09-05 03:25:05 +03:00
|
|
|
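# Training: the batch/subdivisions values below are commented out; to train, uncomment them and comment out the Testing values instead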
|
|
|
|
# batch=128
|
|
|
|
# subdivisions=16
|
|
|
|
|
|
|
|
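# Testing: the batch/subdivisions values below are the active ones; comment them out when enabling the Training values above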
|
|
|
|
batch=1
|
|
|
|
subdivisions=1
|
|
|
|
|
2018-08-15 20:59:59 +03:00
|
|
|
height=256
|
|
|
|
width=256
|
2018-09-05 03:25:05 +03:00
|
|
|
channels=3
|
2018-08-15 20:59:59 +03:00
|
|
|
min_crop=128
|
|
|
|
max_crop=448
|
|
|
|
|
|
|
|
burn_in=1000
|
|
|
|
learning_rate=0.1
|
|
|
|
policy=poly
|
|
|
|
power=4
|
|
|
|
max_batches=800000
|
2018-09-05 03:25:05 +03:00
|
|
|
momentum=0.9
|
|
|
|
decay=0.0005
|
2018-08-15 20:59:59 +03:00
|
|
|
|
|
|
|
angle=7
|
|
|
|
hue=.1
|
|
|
|
saturation=.75
|
|
|
|
exposure=.75
|
|
|
|
aspect=.75
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=64
|
|
|
|
size=7
|
|
|
|
stride=2
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[maxpool]
|
|
|
|
size=2
|
|
|
|
stride=2
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=64
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=64
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=512
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=64
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=64
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=512
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=64
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=64
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=512
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=128
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=128
|
|
|
|
size=3
|
|
|
|
stride=2
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=1024
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=128
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=128
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=1024
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=128
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=128
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=1024
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=128
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=128
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=1024
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=128
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=128
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=1024
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=128
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=128
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=1024
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=128
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=128
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=1024
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=128
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=128
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=1024
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=2
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=256
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=2048
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=512
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=512
|
|
|
|
size=3
|
|
|
|
stride=2
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=4096
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=512
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=512
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=4096
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=512
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
groups = 32
|
|
|
|
batch_normalize=1
|
|
|
|
filters=512
|
|
|
|
size=3
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
batch_normalize=1
|
|
|
|
filters=4096
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[shortcut]
|
|
|
|
from=-4
|
|
|
|
activation=leaky
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
[avgpool]
|
|
|
|
|
|
|
|
[convolutional]
|
|
|
|
filters=1000
|
|
|
|
size=1
|
|
|
|
stride=1
|
|
|
|
pad=1
|
|
|
|
activation=linear
|
|
|
|
|
|
|
|
[softmax]
|
|
|
|
groups=1
|
|
|
|
|