1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92
| class YOLOv3Backbone(nn.Module): """YOLOv3骨干网络(Darknet-53)""" def __init__(self): super().__init__() self.stem = self._make_conv(3, 32, 3, 1) self.layer1 = self._make_residual(32, 64, 1) self.layer2 = self._make_residual(64, 128, 2) self.layer3 = self._make_residual(128, 256, 8) self.layer4 = self._make_residual(256, 512, 8) self.layer5 = self._make_residual(512, 1024, 4) def _make_conv(self, in_ch, out_ch, kernel, stride): return nn.Sequential( nn.Conv2d(in_ch, out_ch, kernel, stride, kernel//2, bias=False), nn.BatchNorm2d(out_ch), nn.LeakyReLU(0.1) ) def _make_residual(self, in_ch, out_ch, num_blocks): layers = [self._make_conv(in_ch, out_ch, 3, 2)] for _ in range(num_blocks): layers.append(self._make_conv(out_ch, out_ch, 1, 1)) return nn.Sequential(*layers) def forward(self, x): c1 = self.layer3(self.layer2(self.layer1(self.stem(x)))) c2 = self.layer4(c1) c3 = self.layer5(c2) return c1, c2, c3
class YOLOv3Neck(nn.Module): """YOLOv3的FPN颈部网络""" def __init__(self): super().__init__() self.up1 = nn.Sequential( nn.Conv2d(1024, 512, 1), nn.Upsample(scale_factor=2, mode='nearest') ) self.conv1 = nn.Sequential( nn.Conv2d(768, 512, 1), nn.Conv2d(512, 1024, 3, padding=1), nn.Conv2d(1024, 512, 1) ) self.up2 = nn.Sequential( nn.Conv2d(512, 256, 1), nn.Upsample(scale_factor=2, mode='nearest') ) self.conv2 = nn.Sequential( nn.Conv2d(384, 256, 1), nn.Conv2d(256, 512, 3, padding=1), nn.Conv2d(512, 256, 1) )
class YOLOv3Head(nn.Module): """YOLOv3检测头""" def __init__(self, num_classes=80, anchors_per_scale=3): super().__init__() self.num_classes = num_classes self.num_anchors = anchors_per_scale self.detect1 = self._make_detect_layer(512, num_classes) self.detect2 = self._make_detect_layer(256, num_classes) self.detect3 = self._make_detect_layer(128, num_classes) def _make_detect_layer(self, in_channels, num_classes): return nn.Sequential( nn.Conv2d(in_channels, 1024, 3, padding=1), nn.Conv2d(1024, 255, 1) ) def forward(self, features): out1 = self.detect1(features[2]) out2 = self.detect2(features[1]) out3 = self.detect3(features[0]) return [out1, out2, out3]
|