mirror of https://github.com/AlexeyAB/darknet.git
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
1018 lines
10 KiB
1018 lines
10 KiB
[net] |
|
# Testing: for inference, uncomment batch=1 and subdivisions=1 below and comment out the Training values |
|
#batch=1 |
|
#subdivisions=1 |
|
# Training |
|
batch=64 |
|
subdivisions=16 |
|
width=512 |
|
height=512 |
|
channels=3 |
|
momentum=0.9 |
|
decay=0.0005 |
|
angle=0 |
|
saturation = 1.5 |
|
exposure = 1.5 |
|
hue=.1 |
|
|
|
learning_rate=0.001 |
|
burn_in=1000 |
|
max_batches = 500500 |
|
policy=steps |
|
steps=400000,450000 |
|
scales=.1,.1 |
|
|
|
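# Feature-map size at layer index (0-based): 19:104x104 38:52x52 65:26x26 80:13x13 for a 416x416 input; with width=512 and height=512 as set above these become 19:128x128 38:64x64 65:32x32 80:16x16 |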
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=64 |
|
size=7 |
|
stride=2 |
|
pad=1 |
|
activation=leaky |
|
|
|
[maxpool] |
|
size=2 |
|
stride=2 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=128 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[route] |
|
layers = -2 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=64 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
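# 1-1: stage 1, residual block 1 (the "# S-B" markers below follow the same stage/block scheme; "# S-T" marks the layers that close stage S) |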
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=128 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=128 |
|
size=3 |
|
groups=32 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=128 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=linear |
|
|
|
[shortcut] |
|
from=-4 |
|
activation=leaky |
|
|
|
# 1-2 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=128 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=128 |
|
size=3 |
|
groups=32 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=128 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=linear |
|
|
|
[shortcut] |
|
from=-4 |
|
activation=leaky |
|
|
|
# 1-3 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=128 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=128 |
|
size=3 |
|
groups=32 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=128 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=linear |
|
|
|
[shortcut] |
|
from=-4 |
|
activation=leaky |
|
|
|
# 1-T |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=128 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[route] |
|
layers = -1,-16 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=3 |
|
groups=32 |
|
stride=2 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=linear |
|
|
|
[route] |
|
layers = -2 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=linear |
|
|
|
# 2-1 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=3 |
|
groups=32 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=linear |
|
|
|
[shortcut] |
|
from=-4 |
|
activation=leaky |
|
|
|
# 2-2 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=3 |
|
groups=32 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=linear |
|
|
|
[shortcut] |
|
from=-4 |
|
activation=leaky |
|
|
|
# 2-3 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=3 |
|
groups=32 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=linear |
|
|
|
[shortcut] |
|
from=-4 |
|
activation=leaky |
|
|
|
# 2-T |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[route] |
|
layers = -1,-16 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=3 |
|
groups=32 |
|
stride=2 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=linear |
|
|
|
[route] |
|
layers = -2 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=linear |
|
|
|
# 3-1 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=3 |
|
groups=32 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=linear |
|
|
|
[shortcut] |
|
from=-4 |
|
activation=leaky |
|
|
|
# 3-2 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=3 |
|
groups=32 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=linear |
|
|
|
[shortcut] |
|
from=-4 |
|
activation=leaky |
|
|
|
# 3-3 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=3 |
|
groups=32 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=linear |
|
|
|
[shortcut] |
|
from=-4 |
|
activation=leaky |
|
|
|
# 3-4 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=3 |
|
groups=32 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=linear |
|
|
|
[shortcut] |
|
from=-4 |
|
activation=leaky |
|
|
|
# 3-5 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=3 |
|
groups=32 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=linear |
|
|
|
[shortcut] |
|
from=-4 |
|
activation=leaky |
|
|
|
# 3-T |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[route] |
|
layers = -1,-24 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=1024 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=1024 |
|
size=3 |
|
groups=32 |
|
stride=2 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=1024 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[route] |
|
layers = -2 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=1024 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
# 4-1 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=1024 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=1024 |
|
size=3 |
|
groups=32 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=1024 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=linear |
|
|
|
[shortcut] |
|
from=-4 |
|
activation=leaky |
|
|
|
# 4-2 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=1024 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=1024 |
|
size=3 |
|
groups=32 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=1024 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=linear |
|
|
|
[shortcut] |
|
from=-4 |
|
activation=leaky |
|
|
|
# 4-T |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=1024 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[route] |
|
layers = -1,-12 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=2048 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
########################## detection layers (SPP, upsampling, [yolo] outputs) start here |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
size=3 |
|
stride=1 |
|
pad=1 |
|
filters=1024 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
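### SPP: 5x5, 9x9 and 13x13 stride-1 max-pools of the same layer, concatenated with that layer by the final [route] ### |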
|
[maxpool] |
|
stride=1 |
|
size=5 |
|
|
|
[route] |
|
layers=-2 |
|
|
|
[maxpool] |
|
stride=1 |
|
size=9 |
|
|
|
[route] |
|
layers=-4 |
|
|
|
[maxpool] |
|
stride=1 |
|
size=13 |
|
|
|
[route] |
|
layers=-1,-3,-5,-6 |
|
### End SPP ### |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
size=3 |
|
stride=1 |
|
pad=1 |
|
filters=1024 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[upsample] |
|
stride=2 |
|
|
|
[route] |
|
layers = 65 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[route] |
|
layers = -1, -3 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
size=3 |
|
stride=1 |
|
pad=1 |
|
filters=512 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
size=3 |
|
stride=1 |
|
pad=1 |
|
filters=512 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=128 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[upsample] |
|
stride=2 |
|
|
|
[route] |
|
layers = 38 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=128 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[route] |
|
layers = -1, -3 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=128 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
size=3 |
|
stride=1 |
|
pad=1 |
|
filters=256 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=128 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
size=3 |
|
stride=1 |
|
pad=1 |
|
filters=256 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=128 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
########################## output heads: each ends in a 255-filter convolution feeding a [yolo] layer |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
size=3 |
|
stride=1 |
|
pad=1 |
|
filters=256 |
|
activation=leaky |
|
|
|
[convolutional] |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
filters=255 |
|
activation=linear |
|
|
|
|
|
[yolo] |
|
mask = 0,1,2 |
|
anchors = 10,13, 16,30, 33,23, 30,61, 62,45, 59,119, 116,90, 156,198, 373,326 |
|
classes=80 |
|
num=9 |
|
jitter=.3 |
|
ignore_thresh = .7 |
|
truth_thresh = 1 |
|
random=1 |
|
|
|
[route] |
|
layers = -4 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
size=3 |
|
stride=2 |
|
pad=1 |
|
filters=256 |
|
activation=leaky |
|
|
|
[route] |
|
layers = -1, -16 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
size=3 |
|
stride=1 |
|
pad=1 |
|
filters=512 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
size=3 |
|
stride=1 |
|
pad=1 |
|
filters=512 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=256 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
size=3 |
|
stride=1 |
|
pad=1 |
|
filters=512 |
|
activation=leaky |
|
|
|
[convolutional] |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
filters=255 |
|
activation=linear |
|
|
|
|
|
[yolo] |
|
mask = 3,4,5 |
|
anchors = 10,13, 16,30, 33,23, 30,61, 62,45, 59,119, 116,90, 156,198, 373,326 |
|
classes=80 |
|
num=9 |
|
jitter=.3 |
|
ignore_thresh = .7 |
|
truth_thresh = 1 |
|
random=1 |
|
|
|
[route] |
|
layers = -4 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
size=3 |
|
stride=2 |
|
pad=1 |
|
filters=512 |
|
activation=leaky |
|
|
|
[route] |
|
layers = -1, -37 |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
size=3 |
|
stride=1 |
|
pad=1 |
|
filters=1024 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
size=3 |
|
stride=1 |
|
pad=1 |
|
filters=1024 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
filters=512 |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
activation=leaky |
|
|
|
[convolutional] |
|
batch_normalize=1 |
|
size=3 |
|
stride=1 |
|
pad=1 |
|
filters=1024 |
|
activation=leaky |
|
|
|
[convolutional] |
|
size=1 |
|
stride=1 |
|
pad=1 |
|
filters=255 |
|
activation=linear |
|
|
|
|
|
[yolo] |
|
mask = 6,7,8 |
|
anchors = 10,13, 16,30, 33,23, 30,61, 62,45, 59,119, 116,90, 156,198, 373,326 |
|
classes=80 |
|
num=9 |
|
jitter=.3 |
|
ignore_thresh = .7 |
|
truth_thresh = 1 |
|
random=1
|
|
|