# Model-wide parameters.
nc: 80  # presumably the number of object classes -- confirm against the loader
depth_multiple: 1.0  # presumably scales per-row repeat counts; 1.0 = unscaled -- TODO confirm
width_multiple: 1.0  # presumably scales channel widths; 1.0 = unscaled -- TODO confirm

# Two anchor groups of six integers each. They look like three (width, height)
# pairs per group, one group per source of the final Detect row (which lists
# two sources) -- confirm against the Detect implementation.
anchors:
  - [10, 14, 23, 27, 37, 58]
  - [81, 82, 135, 169, 344, 319]
# Backbone layer table.
#
# Every row is a four-item list. Judging by the values, the items look like
# [source row, repeat count, module name, module args] -- confirm against the
# code that consumes this file. A source of -1 presumably means "the output
# of the previous row".
#
# The trailing "# N" comments give each row's 0-based position in this list;
# the head list references some rows by absolute number (e.g. 8), assuming
# rows are numbered from 0 across backbone and head together.
#
# Arg notes (assuming args are passed positionally to the named module):
#   Conv [16, 3, 1]           project module; looks like (out_channels,
#                             kernel, stride) -- TODO confirm
#   nn.MaxPool2d [2, 2, 0]    kernel_size=2, stride=2, padding=0
#   nn.ZeroPad2d [[0,1,0,1]]  pads 1 on the right and 1 on the bottom
#   nn.MaxPool2d [2, 1, 0]    kernel_size=2, stride=1, padding=0
#
# The flow sequence is indented below its key: YAML requires a flow
# collection nested in a block mapping to be indented deeper than the key.
backbone:
  [
    [-1, 1, Conv, [16, 3, 1]],  # 0
    [-1, 1, nn.MaxPool2d, [2, 2, 0]],  # 1
    [-1, 1, Conv, [32, 3, 1]],  # 2
    [-1, 1, nn.MaxPool2d, [2, 2, 0]],  # 3
    [-1, 1, Conv, [64, 3, 1]],  # 4
    [-1, 1, nn.MaxPool2d, [2, 2, 0]],  # 5
    [-1, 1, Conv, [128, 3, 1]],  # 6
    [-1, 1, nn.MaxPool2d, [2, 2, 0]],  # 7
    [-1, 1, Conv, [256, 3, 1]],  # 8 (also a source of the head's Concat row)
    [-1, 1, nn.MaxPool2d, [2, 2, 0]],  # 9
    [-1, 1, Conv, [512, 3, 1]],  # 10
    [-1, 1, nn.ZeroPad2d, [[0, 1, 0, 1]]],  # 11
    [-1, 1, nn.MaxPool2d, [2, 1, 0]],  # 12
  ]
# Head layer table, same four-item row layout as the backbone list.
#
# Row numbers in the trailing comments continue from the backbone, which has
# 13 rows (0-12), so the first head row is 13. This assumes the loader
# numbers rows from 0 across backbone and head together -- the absolute
# references 8, 15 and 19 below only line up under that numbering.
#
# Notes on scalars:
#   None           is a plain YAML string here, not YAML null; presumably the
#                  loader evaluates it -- confirm before changing it to null.
#   nc, anchors    are plain strings; presumably the loader resolves them to
#                  the top-level keys of the same names -- TODO confirm.
#
# The flow sequence is indented below its key: YAML requires a flow
# collection nested in a block mapping to be indented deeper than the key.
head:
  [
    [-1, 1, Conv, [1024, 3, 1]],  # 13
    [-1, 1, Conv, [256, 1, 1]],  # 14
    [-1, 1, Conv, [512, 3, 1]],  # 15 (second Detect source)
    [-2, 1, Conv, [128, 1, 1]],  # 16; source -2 is row 14 if offsets are relative
    # If passed positionally to torch.nn.Upsample: size=None, scale_factor=2,
    # mode='nearest'.
    [-1, 1, nn.Upsample, [None, 2, 'nearest']],  # 17
    [[-1, 8], 1, Concat, [1]],  # 18; joins row 17 with backbone row 8
    [-1, 1, Conv, [256, 3, 1]],  # 19 (first Detect source)
    [[19, 15], 1, Detect, [nc, anchors]],  # 20
  ]