1node { 2 name: "data" 3 type: "JitterData" 4 top: "data" 5 top: "label" 6 propagate_down: false 7 mode: TRAIN 8 data_param { 9 train_source: "/home/local_scratch/jpegs_256resized" 10 train_list: "/home/local_scratch/train_images_labels.list" 11 test_source: "/home/local_scratch/jpegs_256resized" 12 test_list: "/home/local_scratch/val_images_labels.list" 13 batch_size: 54 #number of cores(54) - number of EP servers (2) 14 num_train_files: 80073 # per node when numsplits=16 15 num_test_files: 3125 # per node when numsplits=16 16 numsplits: 16 17 lookahead: 2 18 shuffle: true 19 engine: XSMM 20 data_type: BF16 21 22 image_xform_param { 23 orig_size: 256 24 mirror: true 25 crop_image: true 26 physical_padding: true 27 crop_size: 224 28 channels: 4 29 pad_h: 3 30 pad_w: 3 31 mean_values: 0.406 32 mean_values: 0.456 33 mean_values: 0.485 34 scale_values: 0.225 35 scale_values: 0.224 36 scale_values: 0.229 37 test_views: 1 38 } 39 } 40} 41node { 42 name: "conv1" 43 type: "Convolution" 44 bottom: "data" 45 top: "conv1" 46 propagate_down: false 47 param { 48 lr_mult: 1.0 49 decay_mult: 1.0 50 } 51 convolution_param { 52 data_type: BF16 53 engine: XSMM 54 num_output: 64 55 pad: 3 56 opad: 3 57 bias_term: false 58 physical_padding: true 59 kernel_size: 7 60 stride: 2 61 weight_filler { 62 type: "msra" 63 variance_norm: FAN_OUT 64 } 65 bias_filler { 66 type: "constant" 67 value: 0.0 68 } 69 } 70} 71node { 72 name: "bn1" 73 type: "FusedBatchNorm" 74 fused_bnorm_param { 75 data_type: BF16 76 use_global_stats: false 77 ipad: 3 78 pad: 0 79 stride: 1 80 engine: XSMM 81 } 82 bottom: "conv1" 83 top: "bn1" 84} 85node { 86 name: "conv1_pool" 87 type: "Pooling" 88 bottom: "bn1" 89 top: "conv1_pool" 90 pooling_param { 91 data_type: BF16 92 pool: MAX 93 engine: XSMM 94 kernel_size: 3 95 stride: 2 96 pad: 1 97 } 98} 99node { 100 name: "node_64_1_convbn4" 101 type: "FusedConvBN" 102 bottom: "conv1_pool" 103 top: "node_64_1_convbn4" 104 param { 105 lr_mult: 1.0 106 decay_mult: 1.0 107 } 108 param { 109 lr_mult: 1.0 110 decay_mult: 0.0 111 } 112 fused_conv_bn_param { 113 data_type: BF16 114 engine: XSMM 115 num_output: 256 116 ipad: 0 117 mpad: 0 118 opad: 0 119 kernel_size: 1 120 c_stride: 1 121 bn_stride: 1 122 relu_fwd: false 123 relu_bwd: false 124 weight_filler { 125 type: "msra" 126 variance_norm: FAN_OUT 127 } 128 } 129} 130node { 131 name: "node_64_1_convbn1" 132 type: "FusedConvBN" 133 bottom: "conv1_pool" 134 top: "node_64_1_convbn1" 135 param { 136 lr_mult: 1.0 137 decay_mult: 1.0 138 } 139 param { 140 lr_mult: 1.0 141 decay_mult: 0.0 142 } 143 fused_conv_bn_param { 144 data_type: BF16 145 engine: XSMM 146 num_output: 64 147 ipad: 0 148 mpad: 0 149 opad: 1 150 physical_padding: true 151 kernel_size: 1 152 c_stride: 1 153 bn_stride: 1 154 weight_filler { 155 type: "msra" 156 variance_norm: FAN_OUT 157 } 158 } 159} 160node { 161 name: "node_64_1_convbn2" 162 type: "FusedConvBN" 163 bottom: "node_64_1_convbn1" 164 top: "node_64_1_convbn2" 165 param { 166 lr_mult: 1.0 167 decay_mult: 1.0 168 } 169 param { 170 lr_mult: 1.0 171 decay_mult: 0.0 172 } 173 fused_conv_bn_param { 174 data_type: BF16 175 engine: XSMM 176 num_output: 64 177 ipad: 1 178 mpad: 1 179 opad: 0 180 physical_padding: true 181 kernel_size: 3 182 c_stride: 1 183 bn_stride: 1 184 weight_filler { 185 type: "msra" 186 variance_norm: FAN_OUT 187 } 188 } 189} 190node { 191 name: "node_64_1_convbn3" 192 type: "FusedConvBN" 193 bottom: "node_64_1_convbn2" 194 bottom: "node_64_1_convbn4" 195 top: "node_64_1_convbn3" 196 param { 197 lr_mult: 1.0 198 decay_mult: 1.0 199 } 200 param { 201 lr_mult: 1.0 202 decay_mult: 0.0 203 } 204 fused_conv_bn_param{ 205 data_type: BF16 206 engine: XSMM 207 num_output: 256 208 ipad: 0 209 mpad: 0 210 opad: 0 211 kernel_size: 1 212 c_stride: 1 213 bn_stride: 1 214 eltwise: true 215 weight_filler { 216 type: "msra" 217 variance_norm: FAN_OUT 218 } 219 } 220} 221node { 222 name: "node_64_2_convbn1" 223 type: "FusedConvBN" 224 bottom: "node_64_1_convbn3" 225 top: "node_64_2_convbn1" 226 param { 227 lr_mult: 1.0 228 decay_mult: 1.0 229 } 230 param { 231 lr_mult: 1.0 232 decay_mult: 0.0 233 } 234 fused_conv_bn_param { 235 data_type: BF16 236 engine: XSMM 237 num_output: 64 238 ipad: 0 239 mpad: 0 240 opad: 1 241 kernel_size: 1 242 physical_padding: true 243 c_stride: 1 244 bn_stride: 1 245 weight_filler { 246 type: "msra" 247 variance_norm: FAN_OUT 248 } 249 } 250} 251node { 252 name: "node_64_2_convbn2" 253 type: "FusedConvBN" 254 bottom: "node_64_2_convbn1" 255 top: "node_64_2_convbn2" 256 param { 257 lr_mult: 1.0 258 decay_mult: 1.0 259 } 260 param { 261 lr_mult: 1.0 262 decay_mult: 0.0 263 } 264 fused_conv_bn_param { 265 data_type: BF16 266 engine: XSMM 267 num_output: 64 268 ipad: 1 269 mpad: 1 270 opad: 0 271 physical_padding: true 272 kernel_size: 3 273 c_stride: 1 274 bn_stride: 1 275 weight_filler { 276 type: "msra" 277 variance_norm: FAN_OUT 278 } 279 } 280} 281node { 282 name: "node_64_2_convbn3" 283 type: "FusedConvBN" 284 bottom: "node_64_2_convbn2" 285 bottom: "node_64_1_convbn3" 286 top: "node_64_2_convbn3" 287 param { 288 lr_mult: 1.0 289 decay_mult: 1.0 290 } 291 param { 292 lr_mult: 1.0 293 decay_mult: 0.0 294 } 295 fused_conv_bn_param { 296 data_type: BF16 297 engine: XSMM 298 num_output: 256 299 ipad: 0 300 mpad: 0 301 opad: 0 302 kernel_size: 1 303 c_stride: 1 304 bn_stride: 1 305 eltwise: true 306 weight_filler { 307 type: "msra" 308 variance_norm: FAN_OUT 309 } 310 } 311} 312node { 313 name: "node_64_3_convbn1" 314 type: "FusedConvBN" 315 bottom: "node_64_2_convbn3" 316 top: "node_64_3_convbn1" 317 param { 318 lr_mult: 1.0 319 decay_mult: 1.0 320 } 321 param { 322 lr_mult: 1.0 323 decay_mult: 0.0 324 } 325 fused_conv_bn_param { 326 data_type: BF16 327 engine: XSMM 328 num_output: 64 329 ipad: 0 330 mpad: 0 331 opad: 1 332 physical_padding: true 333 kernel_size: 1 334 c_stride: 1 335 bn_stride: 1 336 weight_filler { 337 type: "msra" 338 variance_norm: FAN_OUT 339 } 340 } 341} 342node { 343 name: "node_64_3_convbn2" 344 type: "FusedConvBN" 345 bottom: "node_64_3_convbn1" 346 top: "node_64_3_convbn2" 347 param { 348 lr_mult: 1.0 349 decay_mult: 1.0 350 } 351 param { 352 lr_mult: 1.0 353 decay_mult: 0.0 354 } 355 fused_conv_bn_param { 356 data_type: BF16 357 engine: XSMM 358 num_output: 64 359 ipad: 1 360 mpad: 1 361 opad: 0 362 physical_padding: true 363 kernel_size: 3 364 c_stride: 1 365 bn_stride: 1 366 weight_filler { 367 type: "msra" 368 variance_norm: FAN_OUT 369 } 370 } 371} 372node { 373 name: "node_64_3_convbn3" 374 type: "FusedConvBN" 375 bottom: "node_64_3_convbn2" 376 bottom: "node_64_2_convbn3" 377 top: "node_64_3_convbn3" 378 param { 379 lr_mult: 1.0 380 decay_mult: 1.0 381 } 382 param { 383 lr_mult: 1.0 384 decay_mult: 0.0 385 } 386 fused_conv_bn_param { 387 data_type: BF16 388 engine: XSMM 389 num_output: 256 390 ipad: 0 391 mpad: 0 392 opad: 0 393 kernel_size: 1 394 c_stride: 1 395 bn_stride: 2 396 eltwise: true 397 weight_filler { 398 type: "msra" 399 variance_norm: FAN_OUT 400 } 401 } 402} 403node { 404 name: "node_128_1_convbn4" 405 type: "FusedConvBN" 406 bottom: "node_64_3_convbn3" 407 top: "node_128_1_convbn4" 408 param { 409 lr_mult: 1.0 410 decay_mult: 1.0 411 } 412 param { 413 lr_mult: 1.0 414 decay_mult: 0.0 415 } 416 fused_conv_bn_param { 417 data_type: BF16 418 engine: XSMM 419 num_output: 512 420 ipad: 0 421 mpad: 0 422 opad: 0 423 kernel_size: 1 424 c_stride: 1 425 bn_stride: 1 426 relu_fwd: false 427 relu_bwd: false 428 weight_filler { 429 type: "msra" 430 variance_norm: FAN_OUT 431 } 432 } 433} 434node { 435 name: "node_128_1_convbn1" 436 type: "FusedConvBN" 437 bottom: "node_64_3_convbn3" 438 top: "node_128_1_convbn1" 439 param { 440 lr_mult: 1.0 441 decay_mult: 1.0 442 } 443 param { 444 lr_mult: 1.0 445 decay_mult: 0.0 446 } 447 fused_conv_bn_param { 448 data_type: BF16 449 engine: XSMM 450 num_output: 128 451 ipad: 0 452 mpad: 0 453 opad: 1 454 physical_padding: true 455 kernel_size: 1 456 c_stride: 1 457 bn_stride: 1 458 weight_filler { 459 type: "msra" 460 variance_norm: FAN_OUT 461 } 462 } 463} 464node { 465 name: "node_128_1_convbn2" 466 type: "FusedConvBN" 467 bottom: "node_128_1_convbn1" 468 top: "node_128_1_convbn2" 469 param { 470 lr_mult: 1.0 471 decay_mult: 1.0 472 } 473 param { 474 lr_mult: 1.0 475 decay_mult: 0.0 476 } 477 fused_conv_bn_param { 478 data_type: BF16 479 engine: XSMM 480 num_output: 128 481 ipad: 1 482 mpad: 1 483 opad: 0 484 physical_padding: true 485 kernel_size: 3 486 c_stride: 1 487 bn_stride: 1 488 weight_filler { 489 type: "msra" 490 variance_norm: FAN_OUT 491 } 492 } 493} 494node { 495 name: "node_128_1_convbn3" 496 type: "FusedConvBN" 497 bottom: "node_128_1_convbn2" 498 bottom: "node_128_1_convbn4" 499 top: "node_128_1_convbn3" 500 param { 501 lr_mult: 1.0 502 decay_mult: 1.0 503 } 504 param { 505 lr_mult: 1.0 506 decay_mult: 0.0 507 } 508 fused_conv_bn_param { 509 data_type: BF16 510 engine: XSMM 511 num_output: 512 512 ipad: 0 513 mpad: 0 514 opad: 0 515 kernel_size: 1 516 c_stride: 1 517 bn_stride: 1 518 eltwise: true 519 weight_filler { 520 type: "msra" 521 variance_norm: FAN_OUT 522 } 523 } 524} 525node { 526 name: "node_128_2_convbn1" 527 type: "FusedConvBN" 528 bottom: "node_128_1_convbn3" 529 top: "node_128_2_convbn1" 530 param { 531 lr_mult: 1.0 532 decay_mult: 1.0 533 } 534 param { 535 lr_mult: 1.0 536 decay_mult: 0.0 537 } 538 fused_conv_bn_param { 539 data_type: BF16 540 engine: XSMM 541 num_output: 128 542 ipad: 0 543 mpad: 0 544 opad: 1 545 physical_padding: true 546 kernel_size: 1 547 c_stride: 1 548 bn_stride: 1 549 weight_filler { 550 type: "msra" 551 variance_norm: FAN_OUT 552 } 553 } 554} 555node { 556 name: "node_128_2_convbn2" 557 type: "FusedConvBN" 558 bottom: "node_128_2_convbn1" 559 top: "node_128_2_convbn2" 560 param { 561 lr_mult: 1.0 562 decay_mult: 1.0 563 } 564 param { 565 lr_mult: 1.0 566 decay_mult: 0.0 567 } 568 fused_conv_bn_param { 569 data_type: BF16 570 engine: XSMM 571 num_output: 128 572 ipad: 1 573 mpad: 1 574 opad: 0 575 physical_padding: true 576 kernel_size: 3 577 c_stride: 1 578 bn_stride: 1 579 weight_filler { 580 type: "msra" 581 variance_norm: FAN_OUT 582 } 583 } 584} 585node { 586 name: "node_128_2_convbn3" 587 type: "FusedConvBN" 588 bottom: "node_128_2_convbn2" 589 bottom: "node_128_1_convbn3" 590 top: "node_128_2_convbn3" 591 param { 592 lr_mult: 1.0 593 decay_mult: 1.0 594 } 595 param { 596 lr_mult: 1.0 597 decay_mult: 0.0 598 } 599 fused_conv_bn_param { 600 data_type: BF16 601 engine: XSMM 602 num_output: 512 603 ipad: 0 604 mpad: 0 605 opad: 0 606 kernel_size: 1 607 c_stride: 1 608 bn_stride: 1 609 eltwise: true 610 weight_filler { 611 type: "msra" 612 variance_norm: FAN_OUT 613 } 614 } 615} 616node { 617 name: "node_128_3_convbn1" 618 type: "FusedConvBN" 619 bottom: "node_128_2_convbn3" 620 top: "node_128_3_convbn1" 621 param { 622 lr_mult: 1.0 623 decay_mult: 1.0 624 } 625 param { 626 lr_mult: 1.0 627 decay_mult: 0.0 628 } 629 fused_conv_bn_param { 630 data_type: BF16 631 engine: XSMM 632 num_output: 128 633 ipad: 0 634 mpad: 0 635 opad: 1 636 physical_padding: true 637 kernel_size: 1 638 c_stride: 1 639 bn_stride: 1 640 weight_filler { 641 type: "msra" 642 variance_norm: FAN_OUT 643 } 644 } 645} 646node { 647 name: "node_128_3_convbn2" 648 type: "FusedConvBN" 649 bottom: "node_128_3_convbn1" 650 top: "node_128_3_convbn2" 651 param { 652 lr_mult: 1.0 653 decay_mult: 1.0 654 } 655 param { 656 lr_mult: 1.0 657 decay_mult: 0.0 658 } 659 fused_conv_bn_param { 660 data_type: BF16 661 engine: XSMM 662 num_output: 128 663 ipad: 1 664 mpad: 1 665 opad: 0 666 physical_padding: true 667 kernel_size: 3 668 c_stride: 1 669 bn_stride: 1 670 weight_filler { 671 type: "msra" 672 variance_norm: FAN_OUT 673 } 674 } 675} 676node { 677 name: "node_128_3_convbn3" 678 type: "FusedConvBN" 679 bottom: "node_128_3_convbn2" 680 bottom: "node_128_2_convbn3" 681 top: "node_128_3_convbn3" 682 param { 683 lr_mult: 1.0 684 decay_mult: 1.0 685 } 686 param { 687 lr_mult: 1.0 688 decay_mult: 0.0 689 } 690 fused_conv_bn_param { 691 data_type: BF16 692 engine: XSMM 693 num_output: 512 694 ipad: 0 695 mpad: 0 696 opad: 0 697 kernel_size: 1 698 c_stride: 1 699 bn_stride: 1 700 eltwise: true 701 weight_filler { 702 type: "msra" 703 variance_norm: FAN_OUT 704 } 705 } 706} 707node { 708 name: "node_128_4_convbn1" 709 type: "FusedConvBN" 710 bottom: "node_128_3_convbn3" 711 top: "node_128_4_convbn1" 712 param { 713 lr_mult: 1.0 714 decay_mult: 1.0 715 } 716 param { 717 lr_mult: 1.0 718 decay_mult: 0.0 719 } 720 fused_conv_bn_param { 721 data_type: BF16 722 engine: XSMM 723 num_output: 128 724 ipad: 0 725 mpad: 0 726 opad: 1 727 physical_padding: true 728 kernel_size: 1 729 c_stride: 1 730 bn_stride: 1 731 weight_filler { 732 type: "msra" 733 variance_norm: FAN_OUT 734 } 735 } 736} 737node { 738 name: "node_128_4_convbn2" 739 type: "FusedConvBN" 740 bottom: "node_128_4_convbn1" 741 top: "node_128_4_convbn2" 742 param { 743 lr_mult: 1.0 744 decay_mult: 1.0 745 } 746 param { 747 lr_mult: 1.0 748 decay_mult: 0.0 749 } 750 fused_conv_bn_param { 751 data_type: BF16 752 engine: XSMM 753 num_output: 128 754 ipad: 1 755 mpad: 1 756 opad: 0 757 physical_padding: true 758 kernel_size: 3 759 c_stride: 1 760 bn_stride: 1 761 weight_filler { 762 type: "msra" 763 variance_norm: FAN_OUT 764 } 765 } 766} 767node { 768 name: "node_128_4_convbn3" 769 type: "FusedConvBN" 770 bottom: "node_128_4_convbn2" 771 bottom: "node_128_3_convbn3" 772 top: "node_128_4_convbn3" 773 param { 774 lr_mult: 1.0 775 decay_mult: 1.0 776 } 777 param { 778 lr_mult: 1.0 779 decay_mult: 0.0 780 } 781 fused_conv_bn_param { 782 data_type: BF16 783 engine: XSMM 784 num_output: 512 785 ipad: 0 786 mpad: 0 787 opad: 0 788 kernel_size: 1 789 c_stride: 1 790 bn_stride: 2 791 eltwise: true 792 weight_filler { 793 type: "msra" 794 variance_norm: FAN_OUT 795 } 796 } 797} 798node { 799 name: "node_256_1_convbn4" 800 type: "FusedConvBN" 801 bottom: "node_128_4_convbn3" 802 top: "node_256_1_convbn4" 803 param { 804 lr_mult: 1.0 805 decay_mult: 1.0 806 } 807 param { 808 lr_mult: 1.0 809 decay_mult: 0.0 810 } 811 fused_conv_bn_param { 812 data_type: BF16 813 engine: XSMM 814 num_output: 1024 815 ipad: 0 816 mpad: 0 817 opad: 0 818 kernel_size: 1 819 c_stride: 1 820 bn_stride: 1 821 relu_fwd: false 822 relu_bwd: false 823 weight_filler { 824 type: "msra" 825 variance_norm: FAN_OUT 826 } 827 } 828} 829node { 830 name: "node_256_1_convbn1" 831 type: "FusedConvBN" 832 bottom: "node_128_4_convbn3" 833 top: "node_256_1_convbn1" 834 param { 835 lr_mult: 1.0 836 decay_mult: 1.0 837 } 838 param { 839 lr_mult: 1.0 840 decay_mult: 0.0 841 } 842 fused_conv_bn_param { 843 data_type: BF16 844 engine: XSMM 845 num_output: 256 846 ipad: 0 847 mpad: 0 848 opad: 1 849 physical_padding: true 850 kernel_size: 1 851 c_stride: 1 852 bn_stride: 1 853 weight_filler { 854 type: "msra" 855 variance_norm: FAN_OUT 856 } 857 } 858} 859node { 860 name: "node_256_1_convbn2" 861 type: "FusedConvBN" 862 bottom: "node_256_1_convbn1" 863 top: "node_256_1_convbn2" 864 param { 865 lr_mult: 1.0 866 decay_mult: 1.0 867 } 868 param { 869 lr_mult: 1.0 870 decay_mult: 0.0 871 } 872 fused_conv_bn_param { 873 data_type: BF16 874 engine: XSMM 875 num_output: 256 876 ipad: 1 877 mpad: 1 878 opad: 0 879 physical_padding: true 880 kernel_size: 3 881 c_stride: 1 882 bn_stride: 1 883 weight_filler { 884 type: "msra" 885 variance_norm: FAN_OUT 886 } 887 } 888} 889node { 890 name: "node_256_1_convbn3" 891 type: "FusedConvBN" 892 bottom: "node_256_1_convbn2" 893 bottom: "node_256_1_convbn4" 894 top: "node_256_1_convbn3" 895 param { 896 lr_mult: 1.0 897 decay_mult: 1.0 898 } 899 param { 900 lr_mult: 1.0 901 decay_mult: 0.0 902 } 903 fused_conv_bn_param { 904 data_type: BF16 905 engine: XSMM 906 num_output: 1024 907 ipad: 0 908 mpad: 0 909 opad: 0 910 kernel_size: 1 911 c_stride: 1 912 bn_stride: 1 913 eltwise: true 914 weight_filler { 915 type: "msra" 916 variance_norm: FAN_OUT 917 } 918 } 919} 920node { 921 name: "node_256_2_convbn1" 922 type: "FusedConvBN" 923 bottom: "node_256_1_convbn3" 924 top: "node_256_2_convbn1" 925 param { 926 lr_mult: 1.0 927 decay_mult: 1.0 928 } 929 param { 930 lr_mult: 1.0 931 decay_mult: 0.0 932 } 933 fused_conv_bn_param { 934 data_type: BF16 935 engine: XSMM 936 num_output: 256 937 ipad: 0 938 mpad: 0 939 opad: 1 940 physical_padding: true 941 kernel_size: 1 942 c_stride: 1 943 bn_stride: 1 944 weight_filler { 945 type: "msra" 946 variance_norm: FAN_OUT 947 } 948 } 949} 950node { 951 name: "node_256_2_convbn2" 952 type: "FusedConvBN" 953 bottom: "node_256_2_convbn1" 954 top: "node_256_2_convbn2" 955 param { 956 lr_mult: 1.0 957 decay_mult: 1.0 958 } 959 param { 960 lr_mult: 1.0 961 decay_mult: 0.0 962 } 963 fused_conv_bn_param { 964 data_type: BF16 965 engine: XSMM 966 num_output: 256 967 ipad: 1 968 mpad: 1 969 opad: 0 970 physical_padding: true 971 kernel_size: 3 972 c_stride: 1 973 bn_stride: 1 974 weight_filler { 975 type: "msra" 976 variance_norm: FAN_OUT 977 } 978 } 979} 980node { 981 name: "node_256_2_convbn3" 982 type: "FusedConvBN" 983 bottom: "node_256_2_convbn2" 984 bottom: "node_256_1_convbn3" 985 top: "node_256_2_convbn3" 986 param { 987 lr_mult: 1.0 988 decay_mult: 1.0 989 } 990 param { 991 lr_mult: 1.0 992 decay_mult: 0.0 993 } 994 fused_conv_bn_param { 995 data_type: BF16 996 engine: XSMM 997 num_output: 1024 998 ipad: 0 999 mpad: 0 1000 opad: 0 1001 kernel_size: 1 1002 c_stride: 1 1003 bn_stride: 1 1004 eltwise: true 1005 weight_filler { 1006 type: "msra" 1007 variance_norm: FAN_OUT 1008 } 1009 } 1010} 1011node { 1012 name: "node_256_3_convbn1" 1013 type: "FusedConvBN" 1014 bottom: "node_256_2_convbn3" 1015 top: "node_256_3_convbn1" 1016 param { 1017 lr_mult: 1.0 1018 decay_mult: 1.0 1019 } 1020 param { 1021 lr_mult: 1.0 1022 decay_mult: 0.0 1023 } 1024 fused_conv_bn_param { 1025 data_type: BF16 1026 engine: XSMM 1027 num_output: 256 1028 ipad: 0 1029 mpad: 0 1030 opad: 1 1031 physical_padding: true 1032 kernel_size: 1 1033 c_stride: 1 1034 bn_stride: 1 1035 weight_filler { 1036 type: "msra" 1037 variance_norm: FAN_OUT 1038 } 1039 } 1040} 1041node { 1042 name: "node_256_3_convbn2" 1043 type: "FusedConvBN" 1044 bottom: "node_256_3_convbn1" 1045 top: "node_256_3_convbn2" 1046 param { 1047 lr_mult: 1.0 1048 decay_mult: 1.0 1049 } 1050 param { 1051 lr_mult: 1.0 1052 decay_mult: 0.0 1053 } 1054 fused_conv_bn_param { 1055 data_type: BF16 1056 engine: XSMM 1057 num_output: 256 1058 ipad: 1 1059 mpad: 1 1060 opad: 0 1061 physical_padding: true 1062 kernel_size: 3 1063 c_stride: 1 1064 bn_stride: 1 1065 weight_filler { 1066 type: "msra" 1067 variance_norm: FAN_OUT 1068 } 1069 } 1070} 1071node { 1072 name: "node_256_3_convbn3" 1073 type: "FusedConvBN" 1074 bottom: "node_256_3_convbn2" 1075 bottom: "node_256_2_convbn3" 1076 top: "node_256_3_convbn3" 1077 param { 1078 lr_mult: 1.0 1079 decay_mult: 1.0 1080 } 1081 param { 1082 lr_mult: 1.0 1083 decay_mult: 0.0 1084 } 1085 fused_conv_bn_param { 1086 data_type: BF16 1087 engine: XSMM 1088 num_output: 1024 1089 ipad: 0 1090 mpad: 0 1091 opad: 0 1092 kernel_size: 1 1093 c_stride: 1 1094 bn_stride: 1 1095 eltwise: true 1096 weight_filler { 1097 type: "msra" 1098 variance_norm: FAN_OUT 1099 } 1100 } 1101} 1102node { 1103 name: "node_256_4_convbn1" 1104 type: "FusedConvBN" 1105 bottom: "node_256_3_convbn3" 1106 top: "node_256_4_convbn1" 1107 param { 1108 lr_mult: 1.0 1109 decay_mult: 1.0 1110 } 1111 param { 1112 lr_mult: 1.0 1113 decay_mult: 0.0 1114 } 1115 fused_conv_bn_param { 1116 data_type: BF16 1117 engine: XSMM 1118 num_output: 256 1119 ipad: 0 1120 mpad: 0 1121 opad: 1 1122 physical_padding: true 1123 kernel_size: 1 1124 c_stride: 1 1125 bn_stride: 1 1126 weight_filler { 1127 type: "msra" 1128 variance_norm: FAN_OUT 1129 } 1130 } 1131} 1132node { 1133 name: "node_256_4_convbn2" 1134 type: "FusedConvBN" 1135 bottom: "node_256_4_convbn1" 1136 top: "node_256_4_convbn2" 1137 param { 1138 lr_mult: 1.0 1139 decay_mult: 1.0 1140 } 1141 param { 1142 lr_mult: 1.0 1143 decay_mult: 0.0 1144 } 1145 fused_conv_bn_param { 1146 data_type: BF16 1147 engine: XSMM 1148 num_output: 256 1149 ipad: 1 1150 mpad: 1 1151 opad: 0 1152 physical_padding: true 1153 kernel_size: 3 1154 c_stride: 1 1155 bn_stride: 1 1156 weight_filler { 1157 type: "msra" 1158 variance_norm: FAN_OUT 1159 } 1160 } 1161} 1162node { 1163 name: "node_256_4_convbn3" 1164 type: "FusedConvBN" 1165 bottom: "node_256_4_convbn2" 1166 bottom: "node_256_3_convbn3" 1167 top: "node_256_4_convbn3" 1168 param { 1169 lr_mult: 1.0 1170 decay_mult: 1.0 1171 } 1172 param { 1173 lr_mult: 1.0 1174 decay_mult: 0.0 1175 } 1176 fused_conv_bn_param { 1177 data_type: BF16 1178 engine: XSMM 1179 num_output: 1024 1180 ipad: 0 1181 mpad: 0 1182 opad: 0 1183 kernel_size: 1 1184 c_stride: 1 1185 bn_stride: 1 1186 eltwise: true 1187 weight_filler { 1188 type: "msra" 1189 variance_norm: FAN_OUT 1190 } 1191 } 1192} 1193node { 1194 name: "node_256_5_convbn1" 1195 type: "FusedConvBN" 1196 bottom: "node_256_4_convbn3" 1197 top: "node_256_5_convbn1" 1198 param { 1199 lr_mult: 1.0 1200 decay_mult: 1.0 1201 } 1202 param { 1203 lr_mult: 1.0 1204 decay_mult: 0.0 1205 } 1206 fused_conv_bn_param { 1207 data_type: BF16 1208 engine: XSMM 1209 num_output: 256 1210 ipad: 0 1211 mpad: 0 1212 opad: 1 1213 physical_padding: true 1214 kernel_size: 1 1215 c_stride: 1 1216 bn_stride: 1 1217 weight_filler { 1218 type: "msra" 1219 variance_norm: FAN_OUT 1220 } 1221 } 1222} 1223node { 1224 name: "node_256_5_convbn2" 1225 type: "FusedConvBN" 1226 bottom: "node_256_5_convbn1" 1227 top: "node_256_5_convbn2" 1228 param { 1229 lr_mult: 1.0 1230 decay_mult: 1.0 1231 } 1232 param { 1233 lr_mult: 1.0 1234 decay_mult: 0.0 1235 } 1236 fused_conv_bn_param { 1237 data_type: BF16 1238 engine: XSMM 1239 num_output: 256 1240 ipad: 1 1241 mpad: 1 1242 opad: 0 1243 physical_padding: true 1244 kernel_size: 3 1245 c_stride: 1 1246 bn_stride: 1 1247 weight_filler { 1248 type: "msra" 1249 variance_norm: FAN_OUT 1250 } 1251 } 1252} 1253node { 1254 name: "node_256_5_convbn3" 1255 type: "FusedConvBN" 1256 bottom: "node_256_5_convbn2" 1257 bottom: "node_256_4_convbn3" 1258 top: "node_256_5_convbn3" 1259 param { 1260 lr_mult: 1.0 1261 decay_mult: 1.0 1262 } 1263 param { 1264 lr_mult: 1.0 1265 decay_mult: 0.0 1266 } 1267 fused_conv_bn_param { 1268 data_type: BF16 1269 engine: XSMM 1270 num_output: 1024 1271 ipad: 0 1272 mpad: 0 1273 opad: 0 1274 kernel_size: 1 1275 c_stride: 1 1276 bn_stride: 1 1277 eltwise: true 1278 weight_filler { 1279 type: "msra" 1280 variance_norm: FAN_OUT 1281 } 1282 } 1283} 1284node { 1285 name: "node_256_6_convbn1" 1286 type: "FusedConvBN" 1287 bottom: "node_256_5_convbn3" 1288 top: "node_256_6_convbn1" 1289 param { 1290 lr_mult: 1.0 1291 decay_mult: 1.0 1292 } 1293 param { 1294 lr_mult: 1.0 1295 decay_mult: 0.0 1296 } 1297 fused_conv_bn_param { 1298 data_type: BF16 1299 engine: XSMM 1300 num_output: 256 1301 ipad: 0 1302 mpad: 0 1303 opad: 1 1304 physical_padding: true 1305 kernel_size: 1 1306 c_stride: 1 1307 bn_stride: 1 1308 weight_filler { 1309 type: "msra" 1310 variance_norm: FAN_OUT 1311 } 1312 } 1313} 1314node { 1315 name: "node_256_6_convbn2" 1316 type: "FusedConvBN" 1317 bottom: "node_256_6_convbn1" 1318 top: "node_256_6_convbn2" 1319 param { 1320 lr_mult: 1.0 1321 decay_mult: 1.0 1322 } 1323 param { 1324 lr_mult: 1.0 1325 decay_mult: 0.0 1326 } 1327 fused_conv_bn_param { 1328 data_type: BF16 1329 engine: XSMM 1330 num_output: 256 1331 ipad: 1 1332 mpad: 1 1333 opad: 0 1334 physical_padding: true 1335 kernel_size: 3 1336 c_stride: 1 1337 bn_stride: 1 1338 weight_filler { 1339 type: "msra" 1340 variance_norm: FAN_OUT 1341 } 1342 } 1343} 1344node { 1345 name: "node_256_6_convbn3" 1346 type: "FusedConvBN" 1347 bottom: "node_256_6_convbn2" 1348 bottom: "node_256_5_convbn3" 1349 top: "node_256_6_convbn3" 1350 param { 1351 lr_mult: 1.0 1352 decay_mult: 1.0 1353 } 1354 param { 1355 lr_mult: 1.0 1356 decay_mult: 0.0 1357 } 1358 fused_conv_bn_param { 1359 data_type: BF16 1360 engine: XSMM 1361 num_output: 1024 1362 ipad: 0 1363 mpad: 0 1364 opad: 0 1365 kernel_size: 1 1366 c_stride: 1 1367 bn_stride: 2 1368 eltwise: true 1369 weight_filler { 1370 type: "msra" 1371 variance_norm: FAN_OUT 1372 } 1373 } 1374} 1375node { 1376 name: "node_512_1_convbn4" 1377 type: "FusedConvBN" 1378 bottom: "node_256_6_convbn3" 1379 top: "node_512_1_convbn4" 1380 param { 1381 lr_mult: 1.0 1382 decay_mult: 1.0 1383 } 1384 param { 1385 lr_mult: 1.0 1386 decay_mult: 0.0 1387 } 1388 fused_conv_bn_param { 1389 data_type: BF16 1390 engine: XSMM 1391 num_output: 2048 1392 ipad: 0 1393 mpad: 0 1394 opad: 0 1395 relu_fwd: false 1396 relu_bwd: false 1397 kernel_size: 1 1398 c_stride: 1 1399 bn_stride: 1 1400 weight_filler { 1401 type: "msra" 1402 variance_norm: FAN_OUT 1403 } 1404 } 1405} 1406node { 1407 name: "node_512_1_convbn1" 1408 type: "FusedConvBN" 1409 bottom: "node_256_6_convbn3" 1410 top: "node_512_1_convbn1" 1411 param { 1412 lr_mult: 1.0 1413 decay_mult: 1.0 1414 } 1415 param { 1416 lr_mult: 1.0 1417 decay_mult: 0.0 1418 } 1419 fused_conv_bn_param { 1420 data_type: BF16 1421 engine: XSMM 1422 num_output: 512 1423 ipad: 0 1424 mpad: 0 1425 opad: 1 1426 physical_padding: true 1427 kernel_size: 1 1428 c_stride: 1 1429 bn_stride: 1 1430 weight_filler { 1431 type: "msra" 1432 variance_norm: FAN_OUT 1433 } 1434 } 1435} 1436node { 1437 name: "node_512_1_convbn2" 1438 type: "FusedConvBN" 1439 bottom: "node_512_1_convbn1" 1440 top: "node_512_1_convbn2" 1441 param { 1442 lr_mult: 1.0 1443 decay_mult: 1.0 1444 } 1445 param { 1446 lr_mult: 1.0 1447 decay_mult: 0.0 1448 } 1449 fused_conv_bn_param { 1450 data_type: BF16 1451 engine: XSMM 1452 num_output: 512 1453 ipad: 1 1454 mpad: 1 1455 opad: 0 1456 physical_padding: true 1457 kernel_size: 3 1458 c_stride: 1 1459 bn_stride: 1 1460 weight_filler { 1461 type: "msra" 1462 variance_norm: FAN_OUT 1463 } 1464 } 1465} 1466node { 1467 name: "node_512_1_convbn3" 1468 type: "FusedConvBN" 1469 bottom: "node_512_1_convbn2" 1470 bottom: "node_512_1_convbn4" 1471 top: "node_512_1_convbn3" 1472 param { 1473 lr_mult: 1.0 1474 decay_mult: 1.0 1475 } 1476 param { 1477 lr_mult: 1.0 1478 decay_mult: 0.0 1479 } 1480 fused_conv_bn_param { 1481 data_type: BF16 1482 engine: XSMM 1483 num_output: 2048 1484 ipad: 0 1485 mpad: 0 1486 opad: 0 1487 kernel_size: 1 1488 c_stride: 1 1489 bn_stride: 1 1490 eltwise: true 1491 weight_filler { 1492 type: "msra" 1493 variance_norm: FAN_OUT 1494 } 1495 } 1496} 1497node { 1498 name: "node_512_2_convbn1" 1499 type: "FusedConvBN" 1500 bottom: "node_512_1_convbn3" 1501 top: "node_512_2_convbn1" 1502 param { 1503 lr_mult: 1.0 1504 decay_mult: 1.0 1505 } 1506 param { 1507 lr_mult: 1.0 1508 decay_mult: 0.0 1509 } 1510 fused_conv_bn_param { 1511 data_type: BF16 1512 engine: XSMM 1513 num_output: 512 1514 ipad: 0 1515 mpad: 0 1516 opad: 1 1517 physical_padding: true 1518 kernel_size: 1 1519 c_stride: 1 1520 bn_stride: 1 1521 weight_filler { 1522 type: "msra" 1523 variance_norm: FAN_OUT 1524 } 1525 } 1526} 1527node { 1528 name: "node_512_2_convbn2" 1529 type: "FusedConvBN" 1530 bottom: "node_512_2_convbn1" 1531 top: "node_512_2_convbn2" 1532 param { 1533 lr_mult: 1.0 1534 decay_mult: 1.0 1535 } 1536 param { 1537 lr_mult: 1.0 1538 decay_mult: 0.0 1539 } 1540 fused_conv_bn_param { 1541 data_type: BF16 1542 engine: XSMM 1543 num_output: 512 1544 ipad: 1 1545 mpad: 1 1546 opad: 0 1547 physical_padding: true 1548 kernel_size: 3 1549 c_stride: 1 1550 bn_stride: 1 1551 weight_filler { 1552 type: "msra" 1553 variance_norm: FAN_OUT 1554 } 1555 } 1556} 1557node { 1558 name: "node_512_2_convbn3" 1559 type: "FusedConvBN" 1560 bottom: "node_512_2_convbn2" 1561 bottom: "node_512_1_convbn3" 1562 top: "node_512_2_convbn3" 1563 param { 1564 lr_mult: 1.0 1565 decay_mult: 1.0 1566 } 1567 param { 1568 lr_mult: 1.0 1569 decay_mult: 0.0 1570 } 1571 fused_conv_bn_param { 1572 data_type: BF16 1573 engine: XSMM 1574 num_output: 2048 1575 ipad: 0 1576 mpad: 0 1577 opad: 0 1578 kernel_size: 1 1579 c_stride: 1 1580 bn_stride: 1 1581 eltwise: true 1582 weight_filler { 1583 type: "msra" 1584 variance_norm: FAN_OUT 1585 } 1586 } 1587} 1588node { 1589 name: "node_512_3_convbn1" 1590 type: "FusedConvBN" 1591 bottom: "node_512_2_convbn3" 1592 top: "node_512_3_convbn1" 1593 param { 1594 lr_mult: 1.0 1595 decay_mult: 1.0 1596 } 1597 param { 1598 lr_mult: 1.0 1599 decay_mult: 0.0 1600 } 1601 fused_conv_bn_param { 1602 data_type: BF16 1603 engine: XSMM 1604 num_output: 512 1605 ipad: 0 1606 mpad: 0 1607 opad: 1 1608 physical_padding: true 1609 kernel_size: 1 1610 c_stride: 1 1611 bn_stride: 1 1612 weight_filler { 1613 type: "msra" 1614 variance_norm: FAN_OUT 1615 } 1616 } 1617} 1618node { 1619 name: "node_512_3_convbn2" 1620 type: "FusedConvBN" 1621 bottom: "node_512_3_convbn1" 1622 top: "node_512_3_convbn2" 1623 param { 1624 lr_mult: 1.0 1625 decay_mult: 1.0 1626 } 1627 param { 1628 lr_mult: 1.0 1629 decay_mult: 0.0 1630 } 1631 fused_conv_bn_param { 1632 data_type: BF16 1633 engine: XSMM 1634 num_output: 512 1635 ipad: 1 1636 mpad: 1 1637 opad: 0 1638 physical_padding: true 1639 kernel_size: 3 1640 c_stride: 1 1641 bn_stride: 1 1642 weight_filler { 1643 type: "msra" 1644 variance_norm: FAN_OUT 1645 } 1646 } 1647} 1648node { 1649 name: "node_512_3_convbn3" 1650 type: "FusedConvBN" 1651 bottom: "node_512_3_convbn2" 1652 bottom: "node_512_2_convbn3" 1653 top: "node_512_3_convbn3" 1654 param { 1655 lr_mult: 1.0 1656 decay_mult: 1.0 1657 } 1658 param { 1659 lr_mult: 1.0 1660 decay_mult: 0.0 1661 } 1662 fused_conv_bn_param { 1663 data_type: BF16 1664 engine: XSMM 1665 num_output: 2048 1666 ipad: 0 1667 mpad: 0 1668 opad: 0 1669 kernel_size: 1 1670 c_stride: 1 1671 bn_stride: 1 1672 eltwise: true 1673 weight_filler { 1674 type: "msra" 1675 variance_norm: FAN_OUT 1676 } 1677 } 1678} 1679node { 1680 name: "pool5" 1681 type: "Pooling" 1682 bottom: "node_512_3_convbn3" 1683 top: "pool5" 1684 pooling_param { 1685 data_type: BF16 1686 engine: XSMM 1687 pool: AVE 1688 kernel_size: 7 1689 stride: 1 1690 } 1691} 1692node { 1693 name: "fc1000" 1694 type: "FullyConnected" 1695 bottom: "pool5" 1696 top: "fc1000" 1697 param { 1698 lr_mult: 1.0 1699 decay_mult: 1.0 1700 } 1701 fc_param { 1702 data_type: FLOAT 1703 num_output: 1000 1704 engine: XSMM 1705 bias_term: false 1706 weight_filler { 1707 type: "Gaussian" 1708 std: 0.01 1709 } 1710 } 1711} 1712node { 1713 name: "prob" 1714 type: "SoftmaxWithLoss" 1715 bottom: "fc1000" 1716 bottom: "label" 1717 top: "prob" 1718 loss_weight: 1 1719} 1720node { 1721 name: "accuracy1" 1722 type: "Accuracy" 1723 bottom: "fc1000" 1724 bottom: "label" 1725 top: "accuracy1" 1726 propagate_down: false 1727 accuracy_param{ 1728 top_k: 1 1729 } 1730} 1731node { 1732 name: "accuracy5" 1733 type: "Accuracy" 1734 bottom: "fc1000" 1735 bottom: "label" 1736 top: "accuracy5" 1737 propagate_down: false 1738 accuracy_param{ 1739 top_k: 5 1740 } 1741} 1742