# Input node "data" (type JitterData): produces the "data" and "label" blobs.
# "data" is consumed by conv1; "label" by the prob/accuracy1/accuracy5 nodes.
node {
  name: "data"
  type: "JitterData"
  top: "data"
  top: "label"
  propagate_down: false
  mode: TRAIN
  data_param {
    # Train and test lists both read images from the same directory.
    train_source: "/home/local_scratch/jpegs_256resized"
    train_list: "/home/local_scratch/train_images_labels.list"
    test_source: "/home/local_scratch/jpegs_256resized"
    test_list: "/home/local_scratch/val_images_labels.list"
    # NOTE(review): the original note read "number of cores(54) - number of EP servers (2)";
    # it is unclear whether 54 is the core count or the result of the subtraction — confirm.
    batch_size: 54
    num_train_files: 80073  # per node when numsplits=16
    num_test_files: 3125    # per node when numsplits=16
    numsplits: 16
    lookahead: 2
    shuffle: true
    engine: XSMM
    data_type: BF16

    # 256-pixel inputs are cropped to 224 (crop_image: true) with mirroring enabled.
    image_xform_param {
      orig_size: 256
      mirror: true
      crop_image: true
      physical_padding: true
      crop_size: 224
      # NOTE(review): 4 channels are declared but only 3 mean/scale values follow —
      # presumably the 4th channel is padding; confirm.
      channels: 4
      # pad_h/pad_w of 3 match conv1's pad: 3.
      pad_h: 3
      pad_w: 3
      mean_values: 0.406
      mean_values: 0.456
      mean_values: 0.485
      scale_values: 0.225
      scale_values: 0.224
      scale_values: 0.229
      test_views: 1
    }
  }
}
# Stem convolution: 7x7, stride 2, 64 outputs, no bias term, reading the "data" blob.
# pad: 3 matches the data node's pad_h/pad_w; opad: 3 matches bn1's ipad: 3.
node {
  name: "conv1"
  type: "Convolution"
  bottom: "data"
  top: "conv1"
  propagate_down: false
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  convolution_param {
    data_type: BF16
    engine: XSMM
    num_output: 64
    pad: 3
    opad: 3
    bias_term: false
    physical_padding: true
    kernel_size: 7
    stride: 2
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
    # NOTE(review): bias_filler is declared although bias_term is false —
    # presumably unused; confirm before removing.
    bias_filler {
      type: "constant"
      value: 0.0
    }
  }
}
# Batch norm over conv1's output (use_global_stats: false).
# ipad: 3 matches conv1's opad: 3; the output carries pad: 0.
node {
  name: "bn1"
  type: "FusedBatchNorm"
  fused_bnorm_param {
    data_type: BF16
    use_global_stats: false
    ipad: 3
    pad: 0
    stride: 1
    engine: XSMM
  }
  bottom: "conv1"
  top: "bn1"
}
# 3x3 max pooling (stride 2, pad 1) over bn1.
# Its top feeds both node_64_1_convbn4 and node_64_1_convbn1.
node {
  name: "conv1_pool"
  type: "Pooling"
  bottom: "bn1"
  top: "conv1_pool"
  pooling_param {
    data_type: BF16
    pool: MAX
    engine: XSMM
    kernel_size: 3
    stride: 2
    pad: 1
  }
}
# Block 64_1, side branch: 1x1 FusedConvBN (256 outputs) on conv1_pool with relu_fwd/relu_bwd off.
# Its top is the second bottom of node_64_1_convbn3.
node {
  name: "node_64_1_convbn4"
  type: "FusedConvBN"
  bottom: "conv1_pool"
  top: "node_64_1_convbn4"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 256
    ipad: 0
    mpad: 0
    opad: 0
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    relu_fwd: false
    relu_bwd: false
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 64_1, step 1: 1x1 FusedConvBN (64 outputs) on conv1_pool.
# opad: 1 matches the ipad: 1 declared by node_64_1_convbn2.
node {
  name: "node_64_1_convbn1"
  type: "FusedConvBN"
  bottom: "conv1_pool"
  top: "node_64_1_convbn1"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 64
    ipad: 0
    mpad: 0
    opad: 1
    physical_padding: true
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 64_1, step 2: 3x3 FusedConvBN (64 outputs) on node_64_1_convbn1.
# ipad/mpad are 1 and opad is 0.
node {
  name: "node_64_1_convbn2"
  type: "FusedConvBN"
  bottom: "node_64_1_convbn1"
  top: "node_64_1_convbn2"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 64
    ipad: 1
    mpad: 1
    opad: 0
    physical_padding: true
    kernel_size: 3
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 64_1, step 3: 1x1 FusedConvBN (256 outputs) on node_64_1_convbn2 with eltwise: true.
# The second bottom, node_64_1_convbn4, is presumably the residual operand — confirm.
node {
  name: "node_64_1_convbn3"
  type: "FusedConvBN"
  bottom: "node_64_1_convbn2"
  bottom: "node_64_1_convbn4"
  top: "node_64_1_convbn3"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 256
    ipad: 0
    mpad: 0
    opad: 0
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    eltwise: true
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 64_2, step 1: 1x1 FusedConvBN (64 outputs) on node_64_1_convbn3.
# opad: 1 matches the ipad: 1 declared by node_64_2_convbn2.
node {
  name: "node_64_2_convbn1"
  type: "FusedConvBN"
  bottom: "node_64_1_convbn3"
  top: "node_64_2_convbn1"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 64
    ipad: 0
    mpad: 0
    opad: 1
    kernel_size: 1
    physical_padding: true
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 64_2, step 2: 3x3 FusedConvBN (64 outputs) on node_64_2_convbn1.
# ipad/mpad are 1 and opad is 0.
node {
  name: "node_64_2_convbn2"
  type: "FusedConvBN"
  bottom: "node_64_2_convbn1"
  top: "node_64_2_convbn2"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 64
    ipad: 1
    mpad: 1
    opad: 0
    physical_padding: true
    kernel_size: 3
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 64_2, step 3: 1x1 FusedConvBN (256 outputs) on node_64_2_convbn2 with eltwise: true.
# The second bottom, node_64_1_convbn3, is presumably the residual operand — confirm.
node {
  name: "node_64_2_convbn3"
  type: "FusedConvBN"
  bottom: "node_64_2_convbn2"
  bottom: "node_64_1_convbn3"
  top: "node_64_2_convbn3"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 256
    ipad: 0
    mpad: 0
    opad: 0
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    eltwise: true
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 64_3, step 1: 1x1 FusedConvBN (64 outputs) on node_64_2_convbn3.
# opad: 1 matches the ipad: 1 declared by node_64_3_convbn2.
node {
  name: "node_64_3_convbn1"
  type: "FusedConvBN"
  bottom: "node_64_2_convbn3"
  top: "node_64_3_convbn1"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 64
    ipad: 0
    mpad: 0
    opad: 1
    physical_padding: true
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 64_3, step 2: 3x3 FusedConvBN (64 outputs) on node_64_3_convbn1.
# ipad/mpad are 1 and opad is 0.
node {
  name: "node_64_3_convbn2"
  type: "FusedConvBN"
  bottom: "node_64_3_convbn1"
  top: "node_64_3_convbn2"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 64
    ipad: 1
    mpad: 1
    opad: 0
    physical_padding: true
    kernel_size: 3
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 64_3, step 3: 1x1 FusedConvBN (256 outputs) on node_64_3_convbn2 with eltwise: true;
# second bottom is node_64_2_convbn3 (presumably the residual operand — confirm).
# bn_stride is 2 here (1 in blocks 64_1/64_2) — presumably the downsampling point
# ahead of the node_128_* group; confirm.
node {
  name: "node_64_3_convbn3"
  type: "FusedConvBN"
  bottom: "node_64_3_convbn2"
  bottom: "node_64_2_convbn3"
  top: "node_64_3_convbn3"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 256
    ipad: 0
    mpad: 0
    opad: 0
    kernel_size: 1
    c_stride: 1
    bn_stride: 2
    eltwise: true
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 128_1, side branch: 1x1 FusedConvBN (512 outputs) on node_64_3_convbn3 with relu_fwd/relu_bwd off.
# Its top is the second bottom of node_128_1_convbn3.
node {
  name: "node_128_1_convbn4"
  type: "FusedConvBN"
  bottom: "node_64_3_convbn3"
  top: "node_128_1_convbn4"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 512
    ipad: 0
    mpad: 0
    opad: 0
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    relu_fwd: false
    relu_bwd: false
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 128_1, step 1: 1x1 FusedConvBN (128 outputs) on node_64_3_convbn3.
# opad: 1 matches the ipad: 1 declared by node_128_1_convbn2.
node {
  name: "node_128_1_convbn1"
  type: "FusedConvBN"
  bottom: "node_64_3_convbn3"
  top: "node_128_1_convbn1"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 128
    ipad: 0
    mpad: 0
    opad: 1
    physical_padding: true
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 128_1, step 2: 3x3 FusedConvBN (128 outputs) on node_128_1_convbn1.
# ipad/mpad are 1 and opad is 0.
node {
  name: "node_128_1_convbn2"
  type: "FusedConvBN"
  bottom: "node_128_1_convbn1"
  top: "node_128_1_convbn2"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 128
    ipad: 1
    mpad: 1
    opad: 0
    physical_padding: true
    kernel_size: 3
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 128_1, step 3: 1x1 FusedConvBN (512 outputs) on node_128_1_convbn2 with eltwise: true.
# The second bottom, node_128_1_convbn4, is presumably the residual operand — confirm.
node {
  name: "node_128_1_convbn3"
  type: "FusedConvBN"
  bottom: "node_128_1_convbn2"
  bottom: "node_128_1_convbn4"
  top: "node_128_1_convbn3"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 512
    ipad: 0
    mpad: 0
    opad: 0
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    eltwise: true
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 128_2, step 1: 1x1 FusedConvBN (128 outputs) on node_128_1_convbn3.
# opad: 1 matches the ipad: 1 declared by node_128_2_convbn2.
node {
  name: "node_128_2_convbn1"
  type: "FusedConvBN"
  bottom: "node_128_1_convbn3"
  top: "node_128_2_convbn1"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 128
    ipad: 0
    mpad: 0
    opad: 1
    physical_padding: true
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 128_2, step 2: 3x3 FusedConvBN (128 outputs) on node_128_2_convbn1.
# ipad/mpad are 1 and opad is 0.
node {
  name: "node_128_2_convbn2"
  type: "FusedConvBN"
  bottom: "node_128_2_convbn1"
  top: "node_128_2_convbn2"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 128
    ipad: 1
    mpad: 1
    opad: 0
    physical_padding: true
    kernel_size: 3
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 128_2, step 3: 1x1 FusedConvBN (512 outputs) on node_128_2_convbn2 with eltwise: true.
# The second bottom, node_128_1_convbn3, is presumably the residual operand — confirm.
node {
  name: "node_128_2_convbn3"
  type: "FusedConvBN"
  bottom: "node_128_2_convbn2"
  bottom: "node_128_1_convbn3"
  top: "node_128_2_convbn3"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 512
    ipad: 0
    mpad: 0
    opad: 0
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    eltwise: true
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 128_3, step 1: 1x1 FusedConvBN (128 outputs) on node_128_2_convbn3.
# opad: 1 matches the ipad: 1 declared by node_128_3_convbn2.
node {
  name: "node_128_3_convbn1"
  type: "FusedConvBN"
  bottom: "node_128_2_convbn3"
  top: "node_128_3_convbn1"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 128
    ipad: 0
    mpad: 0
    opad: 1
    physical_padding: true
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 128_3, step 2: 3x3 FusedConvBN (128 outputs) on node_128_3_convbn1.
# ipad/mpad are 1 and opad is 0.
node {
  name: "node_128_3_convbn2"
  type: "FusedConvBN"
  bottom: "node_128_3_convbn1"
  top: "node_128_3_convbn2"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 128
    ipad: 1
    mpad: 1
    opad: 0
    physical_padding: true
    kernel_size: 3
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 128_3, step 3: 1x1 FusedConvBN (512 outputs) on node_128_3_convbn2 with eltwise: true.
# The second bottom, node_128_2_convbn3, is presumably the residual operand — confirm.
node {
  name: "node_128_3_convbn3"
  type: "FusedConvBN"
  bottom: "node_128_3_convbn2"
  bottom: "node_128_2_convbn3"
  top: "node_128_3_convbn3"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 512
    ipad: 0
    mpad: 0
    opad: 0
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    eltwise: true
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 128_4, step 1: 1x1 FusedConvBN (128 outputs) on node_128_3_convbn3.
# opad: 1 matches the ipad: 1 declared by node_128_4_convbn2.
node {
  name: "node_128_4_convbn1"
  type: "FusedConvBN"
  bottom: "node_128_3_convbn3"
  top: "node_128_4_convbn1"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 128
    ipad: 0
    mpad: 0
    opad: 1
    physical_padding: true
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 128_4, step 2: 3x3 FusedConvBN (128 outputs) on node_128_4_convbn1.
# ipad/mpad are 1 and opad is 0.
node {
  name: "node_128_4_convbn2"
  type: "FusedConvBN"
  bottom: "node_128_4_convbn1"
  top: "node_128_4_convbn2"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 128
    ipad: 1
    mpad: 1
    opad: 0
    physical_padding: true
    kernel_size: 3
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 128_4, step 3: 1x1 FusedConvBN (512 outputs) on node_128_4_convbn2 with eltwise: true;
# second bottom is node_128_3_convbn3 (presumably the residual operand — confirm).
# bn_stride is 2 here (1 in blocks 128_1..128_3) — presumably the downsampling point
# ahead of the node_256_* group; confirm.
node {
  name: "node_128_4_convbn3"
  type: "FusedConvBN"
  bottom: "node_128_4_convbn2"
  bottom: "node_128_3_convbn3"
  top: "node_128_4_convbn3"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 512
    ipad: 0
    mpad: 0
    opad: 0
    kernel_size: 1
    c_stride: 1
    bn_stride: 2
    eltwise: true
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 256_1, side branch: 1x1 FusedConvBN (1024 outputs) on node_128_4_convbn3 with relu_fwd/relu_bwd off.
# Its top is the second bottom of node_256_1_convbn3.
node {
  name: "node_256_1_convbn4"
  type: "FusedConvBN"
  bottom: "node_128_4_convbn3"
  top: "node_256_1_convbn4"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 1024
    ipad: 0
    mpad: 0
    opad: 0
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    relu_fwd: false
    relu_bwd: false
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 256_1, step 1: 1x1 FusedConvBN (256 outputs) on node_128_4_convbn3.
# opad: 1 matches the ipad: 1 declared by node_256_1_convbn2.
node {
  name: "node_256_1_convbn1"
  type: "FusedConvBN"
  bottom: "node_128_4_convbn3"
  top: "node_256_1_convbn1"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 256
    ipad: 0
    mpad: 0
    opad: 1
    physical_padding: true
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 256_1, step 2: 3x3 FusedConvBN (256 outputs) on node_256_1_convbn1.
# ipad/mpad are 1 and opad is 0.
node {
  name: "node_256_1_convbn2"
  type: "FusedConvBN"
  bottom: "node_256_1_convbn1"
  top: "node_256_1_convbn2"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 256
    ipad: 1
    mpad: 1
    opad: 0
    physical_padding: true
    kernel_size: 3
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 256_1, step 3: 1x1 FusedConvBN (1024 outputs) on node_256_1_convbn2 with eltwise: true.
# The second bottom, node_256_1_convbn4, is presumably the residual operand — confirm.
node {
  name: "node_256_1_convbn3"
  type: "FusedConvBN"
  bottom: "node_256_1_convbn2"
  bottom: "node_256_1_convbn4"
  top: "node_256_1_convbn3"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 1024
    ipad: 0
    mpad: 0
    opad: 0
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    eltwise: true
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 256_2, step 1: 1x1 FusedConvBN (256 outputs) on node_256_1_convbn3.
# opad: 1 matches the ipad: 1 declared by node_256_2_convbn2.
node {
  name: "node_256_2_convbn1"
  type: "FusedConvBN"
  bottom: "node_256_1_convbn3"
  top: "node_256_2_convbn1"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 256
    ipad: 0
    mpad: 0
    opad: 1
    physical_padding: true
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 256_2, step 2: 3x3 FusedConvBN (256 outputs) on node_256_2_convbn1.
# ipad/mpad are 1 and opad is 0.
node {
  name: "node_256_2_convbn2"
  type: "FusedConvBN"
  bottom: "node_256_2_convbn1"
  top: "node_256_2_convbn2"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 256
    ipad: 1
    mpad: 1
    opad: 0
    physical_padding: true
    kernel_size: 3
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 256_2, step 3: 1x1 FusedConvBN (1024 outputs) on node_256_2_convbn2 with eltwise: true.
# The second bottom, node_256_1_convbn3, is presumably the residual operand — confirm.
node {
  name: "node_256_2_convbn3"
  type: "FusedConvBN"
  bottom: "node_256_2_convbn2"
  bottom: "node_256_1_convbn3"
  top: "node_256_2_convbn3"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 1024
    ipad: 0
    mpad: 0
    opad: 0
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    eltwise: true
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 256_3, step 1: 1x1 FusedConvBN (256 outputs) on node_256_2_convbn3.
# opad: 1 matches the ipad: 1 declared by node_256_3_convbn2.
node {
  name: "node_256_3_convbn1"
  type: "FusedConvBN"
  bottom: "node_256_2_convbn3"
  top: "node_256_3_convbn1"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 256
    ipad: 0
    mpad: 0
    opad: 1
    physical_padding: true
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 256_3, step 2: 3x3 FusedConvBN (256 outputs) on node_256_3_convbn1.
# ipad/mpad are 1 and opad is 0.
node {
  name: "node_256_3_convbn2"
  type: "FusedConvBN"
  bottom: "node_256_3_convbn1"
  top: "node_256_3_convbn2"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 256
    ipad: 1
    mpad: 1
    opad: 0
    physical_padding: true
    kernel_size: 3
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 256_3, step 3: 1x1 FusedConvBN (1024 outputs) on node_256_3_convbn2 with eltwise: true.
# The second bottom, node_256_2_convbn3, is presumably the residual operand — confirm.
node {
  name: "node_256_3_convbn3"
  type: "FusedConvBN"
  bottom: "node_256_3_convbn2"
  bottom: "node_256_2_convbn3"
  top: "node_256_3_convbn3"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 1024
    ipad: 0
    mpad: 0
    opad: 0
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    eltwise: true
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 256_4, step 1: 1x1 FusedConvBN (256 outputs) on node_256_3_convbn3.
# opad: 1 matches the ipad: 1 declared by node_256_4_convbn2.
node {
  name: "node_256_4_convbn1"
  type: "FusedConvBN"
  bottom: "node_256_3_convbn3"
  top: "node_256_4_convbn1"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 256
    ipad: 0
    mpad: 0
    opad: 1
    physical_padding: true
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 256_4, step 2: 3x3 FusedConvBN (256 outputs) on node_256_4_convbn1.
# ipad/mpad are 1 and opad is 0.
node {
  name: "node_256_4_convbn2"
  type: "FusedConvBN"
  bottom: "node_256_4_convbn1"
  top: "node_256_4_convbn2"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 256
    ipad: 1
    mpad: 1
    opad: 0
    physical_padding: true
    kernel_size: 3
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 256_4, step 3: 1x1 FusedConvBN (1024 outputs) on node_256_4_convbn2 with eltwise: true.
# The second bottom, node_256_3_convbn3, is presumably the residual operand — confirm.
node {
  name: "node_256_4_convbn3"
  type: "FusedConvBN"
  bottom: "node_256_4_convbn2"
  bottom: "node_256_3_convbn3"
  top: "node_256_4_convbn3"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 1024
    ipad: 0
    mpad: 0
    opad: 0
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    eltwise: true
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 256_5, step 1: 1x1 FusedConvBN (256 outputs) on node_256_4_convbn3.
# opad: 1 matches the ipad: 1 declared by node_256_5_convbn2.
node {
  name: "node_256_5_convbn1"
  type: "FusedConvBN"
  bottom: "node_256_4_convbn3"
  top: "node_256_5_convbn1"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 256
    ipad: 0
    mpad: 0
    opad: 1
    physical_padding: true
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 256_5, step 2: 3x3 FusedConvBN (256 outputs) on node_256_5_convbn1.
# ipad/mpad are 1 and opad is 0.
node {
  name: "node_256_5_convbn2"
  type: "FusedConvBN"
  bottom: "node_256_5_convbn1"
  top: "node_256_5_convbn2"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 256
    ipad: 1
    mpad: 1
    opad: 0
    physical_padding: true
    kernel_size: 3
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 256_5, step 3: 1x1 FusedConvBN (1024 outputs) on node_256_5_convbn2 with eltwise: true.
# The second bottom, node_256_4_convbn3, is presumably the residual operand — confirm.
node {
  name: "node_256_5_convbn3"
  type: "FusedConvBN"
  bottom: "node_256_5_convbn2"
  bottom: "node_256_4_convbn3"
  top: "node_256_5_convbn3"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 1024
    ipad: 0
    mpad: 0
    opad: 0
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    eltwise: true
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 256_6, step 1: 1x1 FusedConvBN (256 outputs) on node_256_5_convbn3.
# opad: 1 matches the ipad: 1 declared by node_256_6_convbn2.
node {
  name: "node_256_6_convbn1"
  type: "FusedConvBN"
  bottom: "node_256_5_convbn3"
  top: "node_256_6_convbn1"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 256
    ipad: 0
    mpad: 0
    opad: 1
    physical_padding: true
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 256_6, step 2: 3x3 FusedConvBN (256 outputs) on node_256_6_convbn1.
# ipad/mpad are 1 and opad is 0.
node {
  name: "node_256_6_convbn2"
  type: "FusedConvBN"
  bottom: "node_256_6_convbn1"
  top: "node_256_6_convbn2"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 256
    ipad: 1
    mpad: 1
    opad: 0
    physical_padding: true
    kernel_size: 3
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 256_6, step 3: 1x1 FusedConvBN (1024 outputs) on node_256_6_convbn2 with eltwise: true;
# second bottom is node_256_5_convbn3 (presumably the residual operand — confirm).
# bn_stride is 2 here (1 in blocks 256_1..256_5) — presumably the downsampling point
# ahead of the node_512_* group; confirm.
node {
  name: "node_256_6_convbn3"
  type: "FusedConvBN"
  bottom: "node_256_6_convbn2"
  bottom: "node_256_5_convbn3"
  top: "node_256_6_convbn3"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 1024
    ipad: 0
    mpad: 0
    opad: 0
    kernel_size: 1
    c_stride: 1
    bn_stride: 2
    eltwise: true
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 512_1, side branch: 1x1 FusedConvBN (2048 outputs) on node_256_6_convbn3 with relu_fwd/relu_bwd off.
# Its top is the second bottom of node_512_1_convbn3.
node {
  name: "node_512_1_convbn4"
  type: "FusedConvBN"
  bottom: "node_256_6_convbn3"
  top: "node_512_1_convbn4"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 2048
    ipad: 0
    mpad: 0
    opad: 0
    relu_fwd: false
    relu_bwd: false
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 512_1, step 1: 1x1 FusedConvBN (512 outputs) on node_256_6_convbn3.
# opad: 1 matches the ipad: 1 declared by node_512_1_convbn2.
node {
  name: "node_512_1_convbn1"
  type: "FusedConvBN"
  bottom: "node_256_6_convbn3"
  top: "node_512_1_convbn1"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 512
    ipad: 0
    mpad: 0
    opad: 1
    physical_padding: true
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 512_1, step 2: 3x3 FusedConvBN (512 outputs) on node_512_1_convbn1.
# ipad/mpad are 1 and opad is 0.
node {
  name: "node_512_1_convbn2"
  type: "FusedConvBN"
  bottom: "node_512_1_convbn1"
  top: "node_512_1_convbn2"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 512
    ipad: 1
    mpad: 1
    opad: 0
    physical_padding: true
    kernel_size: 3
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 512_1, step 3: 1x1 FusedConvBN (2048 outputs) on node_512_1_convbn2 with eltwise: true.
# The second bottom, node_512_1_convbn4, is presumably the residual operand — confirm.
node {
  name: "node_512_1_convbn3"
  type: "FusedConvBN"
  bottom: "node_512_1_convbn2"
  bottom: "node_512_1_convbn4"
  top: "node_512_1_convbn3"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 2048
    ipad: 0
    mpad: 0
    opad: 0
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    eltwise: true
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 512_2, step 1: 1x1 FusedConvBN (512 outputs) on node_512_1_convbn3.
# opad: 1 matches the ipad: 1 declared by node_512_2_convbn2.
node {
  name: "node_512_2_convbn1"
  type: "FusedConvBN"
  bottom: "node_512_1_convbn3"
  top: "node_512_2_convbn1"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 512
    ipad: 0
    mpad: 0
    opad: 1
    physical_padding: true
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 512_2, step 2: 3x3 FusedConvBN (512 outputs) on node_512_2_convbn1.
# ipad/mpad are 1 and opad is 0.
node {
  name: "node_512_2_convbn2"
  type: "FusedConvBN"
  bottom: "node_512_2_convbn1"
  top: "node_512_2_convbn2"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 512
    ipad: 1
    mpad: 1
    opad: 0
    physical_padding: true
    kernel_size: 3
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 512_2, step 3: 1x1 FusedConvBN (2048 outputs) on node_512_2_convbn2 with eltwise: true.
# The second bottom, node_512_1_convbn3, is presumably the residual operand — confirm.
node {
  name: "node_512_2_convbn3"
  type: "FusedConvBN"
  bottom: "node_512_2_convbn2"
  bottom: "node_512_1_convbn3"
  top: "node_512_2_convbn3"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 2048
    ipad: 0
    mpad: 0
    opad: 0
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    eltwise: true
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 512_3, step 1: 1x1 FusedConvBN (512 outputs) on node_512_2_convbn3.
# opad: 1 matches the ipad: 1 declared by node_512_3_convbn2.
node {
  name: "node_512_3_convbn1"
  type: "FusedConvBN"
  bottom: "node_512_2_convbn3"
  top: "node_512_3_convbn1"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 512
    ipad: 0
    mpad: 0
    opad: 1
    physical_padding: true
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 512_3, step 2: 3x3 FusedConvBN (512 outputs) on node_512_3_convbn1.
# ipad/mpad are 1 and opad is 0.
node {
  name: "node_512_3_convbn2"
  type: "FusedConvBN"
  bottom: "node_512_3_convbn1"
  top: "node_512_3_convbn2"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 512
    ipad: 1
    mpad: 1
    opad: 0
    physical_padding: true
    kernel_size: 3
    c_stride: 1
    bn_stride: 1
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# Block 512_3, step 3: 1x1 FusedConvBN (2048 outputs) on node_512_3_convbn2 with eltwise: true.
# Second bottom is node_512_2_convbn3 (presumably the residual operand — confirm); the top feeds pool5.
node {
  name: "node_512_3_convbn3"
  type: "FusedConvBN"
  bottom: "node_512_3_convbn2"
  bottom: "node_512_2_convbn3"
  top: "node_512_3_convbn3"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  param {
    lr_mult: 1.0
    decay_mult: 0.0
  }
  fused_conv_bn_param {
    data_type: BF16
    engine: XSMM
    num_output: 2048
    ipad: 0
    mpad: 0
    opad: 0
    kernel_size: 1
    c_stride: 1
    bn_stride: 1
    eltwise: true
    weight_filler {
      type: "msra"
      variance_norm: FAN_OUT
    }
  }
}
# 7x7 average pooling (stride 1) over node_512_3_convbn3; its top feeds fc1000.
node {
  name: "pool5"
  type: "Pooling"
  bottom: "node_512_3_convbn3"
  top: "pool5"
  pooling_param {
    data_type: BF16
    engine: XSMM
    pool: AVE
    kernel_size: 7
    stride: 1
  }
}
# Fully connected layer with 1000 outputs and no bias term, reading pool5.
# Unlike the BF16 nodes above, this node declares data_type: FLOAT.
node {
  name: "fc1000"
  type: "FullyConnected"
  bottom: "pool5"
  top: "fc1000"
  param {
    lr_mult: 1.0
    decay_mult: 1.0
  }
  fc_param {
    data_type: FLOAT
    num_output: 1000
    engine: XSMM
    bias_term: false
    weight_filler {
      type: "Gaussian"
      std: 0.01
    }
  }
}
# Loss node: SoftmaxWithLoss over fc1000 and the "label" blob, with loss_weight 1.
node {
  name: "prob"
  type: "SoftmaxWithLoss"
  bottom: "fc1000"
  bottom: "label"
  top: "prob"
  loss_weight: 1
}
# Accuracy node with top_k: 1, comparing fc1000 against the "label" blob.
node {
  name: "accuracy1"
  type: "Accuracy"
  bottom: "fc1000"
  bottom: "label"
  top: "accuracy1"
  propagate_down: false
  accuracy_param {
    top_k: 1
  }
}
# Accuracy node with top_k: 5, comparing fc1000 against the "label" blob.
node {
  name: "accuracy5"
  type: "Accuracy"
  bottom: "fc1000"
  bottom: "label"
  top: "accuracy5"
  propagate_down: false
  accuracy_param {
    top_k: 5
  }
}