mirror of https://github.com/AlexeyAB/darknet.git
809 lines
8.5 KiB
INI
809 lines
8.5 KiB
INI
[net]
|
|
# Testing
|
|
# batch=1
|
|
# subdivisions=1
|
|
# Training
|
|
batch=64
|
|
subdivisions=16
|
|
width=416
|
|
height=416
|
|
channels=3
|
|
momentum=0.9
|
|
decay=0.0005
|
|
angle=0
|
|
saturation = 1.5
|
|
exposure = 1.5
|
|
hue=.1
|
|
|
|
## single gpu
|
|
learning_rate=0.001
|
|
burn_in=1000
|
|
max_batches = 100400
|
|
|
|
## 2x
|
|
#learning_rate=0.0005
|
|
#burn_in=2000
|
|
#max_batches = 100400
|
|
#max_batches = 200800
|
|
|
|
## 4x
|
|
#learning_rate=0.00025
|
|
#burn_in=4000
|
|
#max_batches = 50200
|
|
##max_batches = 200800
|
|
|
|
policy=steps
|
|
steps=40000,45000
|
|
scales=.1,.1
|
|
|
|
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=32
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
# Downsample
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=64
|
|
size=3
|
|
stride=2
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=32
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=64
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
# Downsample
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=128
|
|
size=3
|
|
stride=2
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=64
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=128
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=64
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=128
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
# Downsample
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=256
|
|
size=3
|
|
stride=2
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=128
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=256
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=128
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=256
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=128
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=256
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=128
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=256
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=128
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=256
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=128
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=256
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=128
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=256
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=128
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=256
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
# Downsample
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=512
|
|
size=3
|
|
stride=2
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=256
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=512
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=256
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=512
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=256
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=512
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=256
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=512
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=256
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=512
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=256
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=512
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=256
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=512
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=256
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=512
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
# Downsample
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=1024
|
|
size=3
|
|
stride=2
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=512
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=1024
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=512
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=1024
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=512
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=1024
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=512
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=1024
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[shortcut]
|
|
from=-3
|
|
activation=linear
|
|
|
|
######################
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=512
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
filters=1024
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=512
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
filters=1024
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=512
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
filters=1024
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
filters=75
|
|
activation=linear
|
|
|
|
[yolo]
|
|
mask = 6,7,8
|
|
anchors = 10,13, 16,30, 33,23, 30,61, 62,45, 59,119, 116,90, 156,198, 373,326
|
|
classes=20
|
|
num=9
|
|
jitter=.3
|
|
ignore_thresh = .5
|
|
truth_thresh = 1
|
|
random=1
|
|
iou_normalizer=0.25
|
|
cls_normalizer=1.0
|
|
iou_loss=giou
|
|
|
|
[route]
|
|
layers = -4
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=256
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[upsample]
|
|
stride=2
|
|
|
|
[route]
|
|
layers = -1, 61
|
|
|
|
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=256
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
filters=512
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=256
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
filters=512
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=256
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
filters=512
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
filters=75
|
|
activation=linear
|
|
|
|
[yolo]
|
|
mask = 3,4,5
|
|
anchors = 10,13, 16,30, 33,23, 30,61, 62,45, 59,119, 116,90, 156,198, 373,326
|
|
classes=20
|
|
num=9
|
|
jitter=.3
|
|
ignore_thresh = .5
|
|
truth_thresh = 1
|
|
random=1
|
|
iou_normalizer=0.25
|
|
cls_normalizer=1.0
|
|
iou_loss=giou
|
|
|
|
[route]
|
|
layers = -4
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=128
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[upsample]
|
|
stride=2
|
|
|
|
[route]
|
|
layers = -1, 36
|
|
|
|
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=128
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
filters=256
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=128
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
filters=256
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
filters=128
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
batch_normalize=1
|
|
size=3
|
|
stride=1
|
|
pad=1
|
|
filters=256
|
|
activation=leaky
|
|
|
|
[convolutional]
|
|
size=1
|
|
stride=1
|
|
pad=1
|
|
filters=75
|
|
activation=linear
|
|
|
|
[yolo]
|
|
mask = 0,1,2
|
|
anchors = 10,13, 16,30, 33,23, 30,61, 62,45, 59,119, 116,90, 156,198, 373,326
|
|
classes=20
|
|
num=9
|
|
jitter=.3
|
|
ignore_thresh = .5
|
|
truth_thresh = 1
|
|
random=1
|
|
iou_normalizer=0.25
|
|
cls_normalizer=1.0
|
|
iou_loss=giou
|
|
|