# YOLOv4 network definition for Darknet.
# [net] holds the network-wide settings: mini-batch layout, input geometry,
# optimiser hyper-parameters, colour augmentation and learning-rate schedule.
[net]
# 64 images per iteration, processed in 8 subdivisions.
batch=64
subdivisions=8
# Training
#width=512
#height=512
width=608
height=608
channels=3
momentum=0.949
decay=0.0005
angle=0
saturation = 1.5
exposure = 1.5
hue=.1

# Step schedule: one entry in `scales` per entry in `steps`.
learning_rate=0.00261
burn_in=1000
max_batches = 500500
policy=steps
steps=400000,450000
scales=.1,.1

#cutmix=1
mosaic=1

# layer index:output size for a 416x416 input (each stride-2 convolution
# halves the size; layers 54 and 85 are re-used by absolute index further down)
#23:104x104 54:52x52 85:26x26 104:13x13 for 416

# Stem (layer 0): 3x3 convolution, stride 1, 32 filters, batch-normalised.
[convolutional]
batch_normalize=1
filters=32
size=3
stride=1
pad=1
activation=mish

# Stage 1: stride-2 downsample to 64 filters, followed by a split/merge
# block with one residual unit.
# Downsample

[convolutional]
batch_normalize=1
filters=64
size=3
stride=2
pad=1
activation=mish

# First branch: 1x1 convolution on the downsampled features.
[convolutional]
batch_normalize=1
filters=64
size=1
stride=1
pad=1
activation=mish

# Second branch: go back two layers, i.e. to the stride-2 convolution output.
[route]
layers = -2

[convolutional]
batch_normalize=1
filters=64
size=1
stride=1
pad=1
activation=mish

# Residual unit: 1x1 (32 filters) -> 3x3 (64 filters), added to the layer
# three positions back.
[convolutional]
batch_normalize=1
filters=32
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=64
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=64
size=1
stride=1
pad=1
activation=mish

# Merge: previous layer plus the first-branch 1x1 convolution (7 layers back).
[route]
layers = -1,-7

[convolutional]
batch_normalize=1
filters=64
size=1
stride=1
pad=1
activation=mish

# Stage 2: stride-2 downsample to 128 filters, followed by a split/merge
# block with two residual units of 64 filters.
# Downsample

[convolutional]
batch_normalize=1
filters=128
size=3
stride=2
pad=1
activation=mish

# First branch: 1x1 convolution on the downsampled features.
[convolutional]
batch_normalize=1
filters=64
size=1
stride=1
pad=1
activation=mish

# Second branch: go back two layers, i.e. to the stride-2 convolution output.
[route]
layers = -2

[convolutional]
batch_normalize=1
filters=64
size=1
stride=1
pad=1
activation=mish

# Residual unit 1 of 2 (1x1 -> 3x3 -> shortcut from three layers back).
[convolutional]
batch_normalize=1
filters=64
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=64
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

# Residual unit 2 of 2.
[convolutional]
batch_normalize=1
filters=64
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=64
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=64
size=1
stride=1
pad=1
activation=mish

# Merge: previous layer plus the first-branch 1x1 convolution (10 layers back).
[route]
layers = -1,-10

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

# Stage 3: stride-2 downsample to 256 filters, followed by a split/merge
# block with eight residual units of 128 filters. The final 1x1 convolution
# of this stage is layer 54, which is routed to by absolute index later on.
# Downsample

[convolutional]
batch_normalize=1
filters=256
size=3
stride=2
pad=1
activation=mish

# First branch: 1x1 convolution on the downsampled features.
[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

# Second branch: go back two layers, i.e. to the stride-2 convolution output.
[route]
layers = -2

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

# Residual unit 1 of 8 (1x1 -> 3x3 -> shortcut from three layers back).
[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=128
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

# Residual unit 2 of 8.
[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=128
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

# Residual unit 3 of 8.
[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=128
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

# Residual unit 4 of 8.
[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=128
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear


# Residual unit 5 of 8.
[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=128
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

# Residual unit 6 of 8.
[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=128
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

# Residual unit 7 of 8.
[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=128
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

# Residual unit 8 of 8.
[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=128
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

# Merge: previous layer plus the first-branch 1x1 convolution (28 layers back).
[route]
layers = -1,-28

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

# Stage 4: stride-2 downsample to 512 filters, followed by a split/merge
# block with eight residual units of 256 filters. The final 1x1 convolution
# of this stage is layer 85, which is routed to by absolute index later on.
# Downsample

[convolutional]
batch_normalize=1
filters=512
size=3
stride=2
pad=1
activation=mish

# First branch: 1x1 convolution on the downsampled features.
[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

# Second branch: go back two layers, i.e. to the stride-2 convolution output.
[route]
layers = -2

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

# Residual unit 1 of 8 (1x1 -> 3x3 -> shortcut from three layers back).
[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear


# Residual unit 2 of 8.
[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear


# Residual unit 3 of 8.
[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear


# Residual unit 4 of 8.
[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear


# Residual unit 5 of 8.
[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear


# Residual unit 6 of 8.
[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear


# Residual unit 7 of 8.
[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

# Residual unit 8 of 8.
[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

# Merge: previous layer plus the first-branch 1x1 convolution (28 layers back).
[route]
layers = -1,-28

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=mish

# Stage 5: stride-2 downsample to 1024 filters, followed by a split/merge
# block with four residual units of 512 filters. The final 1x1 convolution
# of this stage is layer 104.
# Downsample

[convolutional]
batch_normalize=1
filters=1024
size=3
stride=2
pad=1
activation=mish

# First branch: 1x1 convolution on the downsampled features.
[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=mish

# Second branch: go back two layers, i.e. to the stride-2 convolution output.
[route]
layers = -2

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=mish

# Residual unit 1 of 4 (1x1 -> 3x3 -> shortcut from three layers back).
[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=512
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

# Residual unit 2 of 4.
[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=512
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

# Residual unit 3 of 4.
[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=512
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

# Residual unit 4 of 4.
[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=512
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=mish

# Merge: previous layer plus the first-branch 1x1 convolution (16 layers back).
[route]
layers = -1,-16

[convolutional]
batch_normalize=1
filters=1024
size=1
stride=1
pad=1
activation=mish

##########################
# Neck, part 1: three convolutions, an SPP block, three more convolutions.
# From here on the convolutions use activation=leaky instead of mish.

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=1024
activation=leaky

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=leaky

### SPP ###
# Three stride-1 max-pools (5, 9, 13). Each [route] steps back to the
# convolution just above, so all three pools read the same input.
[maxpool]
stride=1
size=5

[route]
layers=-2

[maxpool]
stride=1
size=9

[route]
layers=-4

[maxpool]
stride=1
size=13

# Join the 13, 9 and 5 pools with the un-pooled convolution output.
[route]
layers=-1,-3,-5,-6
### End SPP ###

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=1024
activation=leaky

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=leaky

# Top-down merge 1: reduce to 256 filters, upsample x2, and join with a
# 1x1 convolution applied to backbone layer 85.
[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[upsample]
stride=2

# Absolute layer index (not relative): backbone layer 85.
[route]
layers = 85

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

# Join the layer-85 branch (-1) with the upsampled branch (-3).
[route]
layers = -1, -3

# Five alternating 1x1 (256) / 3x3 (512) convolutions.
[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=512
activation=leaky

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=512
activation=leaky

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

# Top-down merge 2: reduce to 128 filters, upsample x2, and join with a
# 1x1 convolution applied to backbone layer 54.
[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

[upsample]
stride=2

# Absolute layer index (not relative): backbone layer 54.
[route]
layers = 54

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

# Join the layer-54 branch (-1) with the upsampled branch (-3).
[route]
layers = -1, -3

# Five alternating 1x1 (128) / 3x3 (256) convolutions.
[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=256
activation=leaky

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=256
activation=leaky

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

##########################
# Detection head 1 of 3: uses anchor indices 0,1,2 (the three smallest
# anchor pairs in the list).

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=256
activation=leaky

# Prediction layer: no batch norm, linear activation.
# filters = (classes + 5) * number of mask entries = (80 + 5) * 3 = 255.
[convolutional]
size=1
stride=1
pad=1
filters=255
activation=linear


[yolo]
mask = 0,1,2
# Nine width,height anchor pairs; the same list is repeated in every [yolo]
# section and `mask` selects which pairs this head uses.
anchors = 12, 16, 19, 36, 40, 28, 36, 75, 76, 55, 72, 146, 142, 110, 192, 243, 459, 401
classes=80
num=9
jitter=.3
ignore_thresh = .7
truth_thresh = 1
scale_x_y = 1.2
iou_thresh=0.213
cls_normalizer=1.0
iou_normalizer=0.07
iou_loss=ciou
nms_kind=greedynms
beta_nms=0.6


# Detection head 2 of 3: uses anchor indices 3,4,5.
# Start again from the layer four positions back.
[route]
layers = -4

# Stride-2 convolution halves the spatial size.
[convolutional]
batch_normalize=1
size=3
stride=2
pad=1
filters=256
activation=leaky

# Join the downsampled features (-1) with the layer 16 positions back.
[route]
layers = -1, -16

# Five alternating 1x1 (256) / 3x3 (512) convolutions, then one more 3x3.
[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=512
activation=leaky

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=512
activation=leaky

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=512
activation=leaky

# Prediction layer: no batch norm, linear activation.
# filters = (classes + 5) * number of mask entries = (80 + 5) * 3 = 255.
[convolutional]
size=1
stride=1
pad=1
filters=255
activation=linear


[yolo]
mask = 3,4,5
# Nine width,height anchor pairs; `mask` selects which pairs this head uses.
anchors = 12, 16, 19, 36, 40, 28, 36, 75, 76, 55, 72, 146, 142, 110, 192, 243, 459, 401
classes=80
num=9
jitter=.3
ignore_thresh = .7
truth_thresh = 1
scale_x_y = 1.1
iou_thresh=0.213
cls_normalizer=1.0
iou_normalizer=0.07
iou_loss=ciou
nms_kind=greedynms
beta_nms=0.6


# Detection head 3 of 3: uses anchor indices 6,7,8 (the three largest
# anchor pairs in the list).
# Start again from the layer four positions back.
[route]
layers = -4

# Stride-2 convolution halves the spatial size.
[convolutional]
batch_normalize=1
size=3
stride=2
pad=1
filters=512
activation=leaky

# Join the downsampled features (-1) with the layer 37 positions back.
[route]
layers = -1, -37

# Five alternating 1x1 (512) / 3x3 (1024) convolutions, then one more 3x3.
[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=1024
activation=leaky

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=1024
activation=leaky

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=1024
activation=leaky

# Prediction layer: no batch norm, linear activation.
# filters = (classes + 5) * number of mask entries = (80 + 5) * 3 = 255.
[convolutional]
size=1
stride=1
pad=1
filters=255
activation=linear


[yolo]
mask = 6,7,8
# Nine width,height anchor pairs; `mask` selects which pairs this head uses.
anchors = 12, 16, 19, 36, 40, 28, 36, 75, 76, 55, 72, 146, 142, 110, 192, 243, 459, 401
classes=80
num=9
jitter=.3
ignore_thresh = .7
truth_thresh = 1
# random is set only in this last [yolo] section.
random=1
scale_x_y = 1.05
iou_thresh=0.213
cls_normalizer=1.0
iou_normalizer=0.07
iou_loss=ciou
nms_kind=greedynms
beta_nms=0.6

