# Network definition in Darknet-style cfg syntax: one [net] hyper-parameter
# section followed by 162 layer sections (indices 0-161, counted in file order)
# that end in three [yolo] detection heads.
# NOTE(review): the layout looks like the YOLOv4 reference configuration -
# confirm against the upstream file before relying on that.
#
# Format rules used here: one directive per line, section headers on their own
# line, and full-line '#' comments only (no trailing comments on value lines).
# Negative `layers` / `from` values are relative to the current layer index;
# non-negative values are absolute layer indices.

[net]
batch=64
subdivisions=8
# Training
#width=512
#height=512
width=608
height=608
channels=3
momentum=0.949
decay=0.0005
angle=0
saturation = 1.5
exposure = 1.5
hue=.1

# Learning-rate schedule: `steps` and `scales` are parallel lists (two entries each).
learning_rate=0.00261
burn_in=1000
max_batches = 500500
policy=steps
steps=400000,450000
scales=.1,.1

#cutmix=1
mosaic=1

# Layer index : feature-map size for a 416x416 input
#   23:104x104  54:52x52  85:26x26  104:13x13
# These layers sit after 2, 3, 4 and 5 stride-2 convolutions respectively, so
# with the active 608x608 input they are 152x152, 76x76, 38x38 and 19x19.

# ---- Layer 0: stem ----

[convolutional]
batch_normalize=1
filters=32
size=3
stride=1
pad=1
activation=mish

# Downsample
# ---- Stage 1: layers 1-10 (one residual block) ----

[convolutional]
batch_normalize=1
filters=64
size=3
stride=2
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=64
size=1
stride=1
pad=1
activation=mish

[route]
layers = -2

[convolutional]
batch_normalize=1
filters=64
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=32
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=64
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=64
size=1
stride=1
pad=1
activation=mish

# Layer 9: concatenates layers 8 and 2.
[route]
layers = -1,-7

[convolutional]
batch_normalize=1
filters=64
size=1
stride=1
pad=1
activation=mish

# Downsample
# ---- Stage 2: layers 11-23 (two residual blocks) ----

[convolutional]
batch_normalize=1
filters=128
size=3
stride=2
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=64
size=1
stride=1
pad=1
activation=mish

[route]
layers = -2

[convolutional]
batch_normalize=1
filters=64
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=64
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=64
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=64
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=64
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=64
size=1
stride=1
pad=1
activation=mish

# Layer 22: concatenates layers 21 and 12.
[route]
layers = -1,-10

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

# Downsample
# ---- Stage 3: layers 24-54 (eight residual blocks) ----

[convolutional]
batch_normalize=1
filters=256
size=3
stride=2
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

[route]
layers = -2

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=128
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=128
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=128
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=128
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=128
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=128
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=128
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=128
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=mish

# Layer 53: concatenates layers 52 and 25.
[route]
layers = -1,-28

# Layer 54: referenced by absolute index from a later [route] (layers = 54).
[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

# Downsample
# ---- Stage 4: layers 55-85 (eight residual blocks) ----

[convolutional]
batch_normalize=1
filters=512
size=3
stride=2
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

[route]
layers = -2

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=256
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=mish

# Layer 84: concatenates layers 83 and 56.
[route]
layers = -1,-28

# Layer 85: referenced by absolute index from a later [route] (layers = 85).
[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=mish

# Downsample
# ---- Stage 5: layers 86-104 (four residual blocks) ----

[convolutional]
batch_normalize=1
filters=1024
size=3
stride=2
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=mish

[route]
layers = -2

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=512
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=512
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=512
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=mish

[convolutional]
batch_normalize=1
filters=512
size=3
stride=1
pad=1
activation=mish

[shortcut]
from=-3
activation=linear

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=mish

# Layer 103: concatenates layers 102 and 87.
[route]
layers = -1,-16

[convolutional]
batch_normalize=1
filters=1024
size=1
stride=1
pad=1
activation=mish

##########################
# ---- Layers 105-161: leaky-activated layers feeding the three [yolo] heads ----

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=1024
activation=leaky

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=leaky

### SPP ###
# Layers 108-113: three stride-1 max-pools (sizes 5, 9, 13), each fed from
# layer 107 via the relative routes, then concatenated together with layer 107.
[maxpool]
stride=1
size=5

[route]
layers=-2

[maxpool]
stride=1
size=9

[route]
layers=-4

[maxpool]
stride=1
size=13

# Layer 113: concatenates layers 112, 110, 108 and 107.
[route]
layers=-1,-3,-5,-6
### End SPP ###

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=1024
activation=leaky

# Layer 116: re-used later by the route at layer 153.
[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[upsample]
stride=2

# Layer 119: absolute reference to layer 85 (last layer of stage 4).
[route]
layers = 85

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

# Layer 121: concatenates layers 120 and 118 (the upsampled branch).
[route]
layers = -1, -3

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=512
activation=leaky

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=512
activation=leaky

# Layer 126: re-used later by the route at layer 142.
[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

[upsample]
stride=2

# Layer 129: absolute reference to layer 54 (last layer of stage 3).
[route]
layers = 54

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

# Layer 131: concatenates layers 130 and 128 (the upsampled branch).
[route]
layers = -1, -3

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=256
activation=leaky

[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=256
activation=leaky

# Layer 136: re-used later by the route at layer 140.
[convolutional]
batch_normalize=1
filters=128
size=1
stride=1
pad=1
activation=leaky

##########################
# ---- Head 1: layers 137-139, anchors 0-2 ----

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=256
activation=leaky

# filters = (classes + 5) * number of mask entries = (80 + 5) * 3 = 255.
# Keep in sync with `classes` and `mask` in the [yolo] section that follows.
[convolutional]
size=1
stride=1
pad=1
filters=255
activation=linear

# `anchors` holds num=9 width,height pairs; `mask` selects which pairs this head uses.
[yolo]
mask = 0,1,2
anchors = 12, 16, 19, 36, 40, 28, 36, 75, 76, 55, 72, 146, 142, 110, 192, 243, 459, 401
classes=80
num=9
jitter=.3
ignore_thresh = .7
truth_thresh = 1
scale_x_y = 1.2
iou_thresh=0.213
cls_normalizer=1.0
iou_normalizer=0.07
iou_loss=ciou
nms_kind=greedynms
beta_nms=0.6

# ---- Head 2: layers 140-150, anchors 3-5 ----

# Layer 140: resumes from layer 136.
[route]
layers = -4

[convolutional]
batch_normalize=1
size=3
stride=2
pad=1
filters=256
activation=leaky

# Layer 142: concatenates layers 141 and 126.
[route]
layers = -1, -16

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=512
activation=leaky

[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=512
activation=leaky

# Layer 147: re-used later by the route at layer 151.
[convolutional]
batch_normalize=1
filters=256
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=512
activation=leaky

# filters = (classes + 5) * number of mask entries = (80 + 5) * 3 = 255.
[convolutional]
size=1
stride=1
pad=1
filters=255
activation=linear

[yolo]
mask = 3,4,5
anchors = 12, 16, 19, 36, 40, 28, 36, 75, 76, 55, 72, 146, 142, 110, 192, 243, 459, 401
classes=80
num=9
jitter=.3
ignore_thresh = .7
truth_thresh = 1
scale_x_y = 1.1
iou_thresh=0.213
cls_normalizer=1.0
iou_normalizer=0.07
iou_loss=ciou
nms_kind=greedynms
beta_nms=0.6

# ---- Head 3: layers 151-161, anchors 6-8 ----

# Layer 151: resumes from layer 147.
[route]
layers = -4

[convolutional]
batch_normalize=1
size=3
stride=2
pad=1
filters=512
activation=leaky

# Layer 153: concatenates layers 152 and 116.
[route]
layers = -1, -37

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=1024
activation=leaky

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=1024
activation=leaky

[convolutional]
batch_normalize=1
filters=512
size=1
stride=1
pad=1
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=1024
activation=leaky

# filters = (classes + 5) * number of mask entries = (80 + 5) * 3 = 255.
[convolutional]
size=1
stride=1
pad=1
filters=255
activation=linear

# Only this last [yolo] section sets `random`; the other two heads omit it.
[yolo]
mask = 6,7,8
anchors = 12, 16, 19, 36, 40, 28, 36, 75, 76, 55, 72, 146, 142, 110, 192, 243, 459, 401
classes=80
num=9
jitter=.3
ignore_thresh = .7
truth_thresh = 1
random=1
scale_x_y = 1.05
iou_thresh=0.213
cls_normalizer=1.0
iou_normalizer=0.07
iou_loss=ciou
nms_kind=greedynms
beta_nms=0.6