Skip to content
Snippets Groups Projects
Commit ca084eba authored by Akash Kothari's avatar Akash Kothari
Browse files

Adding dev time soc results

parent f5e0ad39
No related branches found
No related tags found
No related merge requests found
Showing
with 10585 additions and 0 deletions
1114.3009809999999
+++++
conf1 1 1 84.98 0.0
1 gpu conv fp32 11 add fp32 1 tanh fp32 1
2 gpu conv fp32 11 add fp32 1 tanh fp32 1 pool_max fp32 1
3 gpu conv fp32 11 add fp32 1 tanh fp32 1
4 gpu conv fp32 11 add fp32 1 tanh fp32 1 pool_max fp32 1
5 gpu conv fp32 11 add fp32 1 tanh fp32 1
6 gpu conv fp32 11 add fp32 1 tanh fp32 1 pool_max fp32 1
7 gpu mul fp32 11 add fp32 1
8 gpu softmax fp32 1
-----
+++++
conf2 2.4248748377353113 2.0815908534183163 84.5 0.480000000000004
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 154 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv fp16 12 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 157 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf3 2.4055188425519614 2.0586265720811823 84.48 0.5
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 154 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 266 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 269 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 157 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf4 2.4156140842962985 2.0617867479342706 84.28 0.7000000000000028
1 gpu conv perf_fp16 157 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 153 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 267 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 268 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 163 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf5 2.396416918342732 2.0506214971794585 84.02 0.960000000000008
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 151 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv fp16 12 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 157 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf6 2.463002582910052 2.1171077568609458 83.84 1.1400000000000006
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 154 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 266 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 167 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf7 2.360283215266004 2.0255245321874304 83.78 1.2000000000000028
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 154 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv fp16 12 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv samp_fp16 268 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 157 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf8 2.4140791541736157 2.0671513522247653 83.74000000000001 1.2399999999999949
1 gpu conv fp16 11 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 154 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 267 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 268 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 160 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf9 2.457753689612079 2.1086250651240137 83.7 1.2800000000000011
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 154 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 266 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 163 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf10 2.459170454055443 2.1111925341396343 83.7 1.2800000000000011
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 154 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 266 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 164 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf11 2.4135986141645764 2.060453960420927 83.62 1.3599999999999994
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 154 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 267 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 266 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 157 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf12 2.4631278039012106 2.1092094797926637 83.58 1.4000000000000057
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 154 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 266 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 157 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf13 2.535761391794481 2.16998336112692 83.58 1.4000000000000057
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 154 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 266 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 157 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf14 2.289006193945062 1.961240158652051 83.54 1.4399999999999977
1 gpu conv perf_fp16 167 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 155 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 268 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 157 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf15 2.4257674844112573 2.0808440756495563 83.5 1.480000000000004
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 153 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv fp16 12 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 261 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 161 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf16 2.458122368488622 2.109531159729078 83.48 1.5
1 gpu conv fp16 11 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 154 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 268 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 162 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf17 2.281072202152105 1.9539314420536427 83.46000000000001 1.519999999999996
1 gpu conv fp16 11 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 160 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 268 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 160 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf18 2.4572171342078444 2.1088933553775697 83.46000000000001 1.519999999999996
1 gpu conv fp16 11 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 154 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 268 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 163 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf19 2.3017607719030058 1.9782265708150768 83.42 1.5600000000000023
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 162 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 261 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 162 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf20 2.379206814483014 2.047909200292713 83.39999999999999 1.5800000000000125
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 154 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv fp16 12 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 266 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 151 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf21 2.4636282705302537 2.1162281156388527 83.39999999999999 1.5800000000000125
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 154 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 268 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 160 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf22 2.461590101374146 2.1108493881199184 83.22 1.7600000000000051
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 154 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 266 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 161 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf23 2.537054645442804 2.167568834938183 83.22 1.7600000000000051
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 153 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 266 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 157 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf24 2.4631604723407885 2.1099694757102845 83.17999999999999 1.8000000000000114
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 154 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 267 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 157 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf25 2.4636282705302537 2.1162281156388527 83.14 1.8400000000000034
1 gpu conv fp16 11 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 154 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 268 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 160 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf26 2.462588899729088 2.109477918791931 83.14 1.8400000000000034
1 gpu conv fp16 11 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 154 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 268 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 157 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf27 2.4638085754689025 2.1071960926343603 83.1 1.8800000000000097
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 153 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 268 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 157 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf28 2.4640079766123635 2.110326453157297 83.08 1.9000000000000057
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 154 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 261 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv fp16 12 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf29 2.459337622764853 2.107249218450713 83.06 1.9200000000000017
1 gpu conv fp16 11 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 153 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 268 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 162 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf30 2.538176340059405 2.173287257415721 83.02000000000001 1.9599999999999937
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 153 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 268 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 261 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 164 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf31 2.3905426931959846 2.044333576277581 83.02000000000001 1.9599999999999937
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 160 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 261 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 157 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf32 2.459337622764853 2.107249218450713 83.0 1.980000000000004
1 gpu conv fp16 11 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 153 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 268 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 162 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf33 2.458968579288317 2.1063450826631396 82.89999999999999 2.0800000000000125
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 153 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 266 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 163 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf34 2.2912974651603877 1.9670210508860688 82.8 2.180000000000007
1 gpu conv perf_fp16 168 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 155 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 268 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 160 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf35 2.4648489763056327 2.113931670664391 82.66 2.3200000000000074
1 gpu conv fp16 11 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 153 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 268 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 160 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf36 2.4599076869402854 2.1077397371200193 82.6 2.3800000000000097
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 153 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 267 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 162 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf37 2.4636282705302537 2.1162281156388527 82.54 2.4399999999999977
1 gpu conv fp16 11 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 154 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 268 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 160 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
+++++
conf38 2.591814267389778 2.222680944458784 82.26 2.719999999999999
1 gpu conv fp16 12 add fp16 1 tanh fp16 1
2 gpu conv perf_fp16 154 add fp16 1 tanh fp16 1 pool_max fp16 1
3 gpu conv samp_fp16 261 add fp16 1 tanh fp16 1
4 gpu conv samp_fp16 262 add fp16 1 tanh fp16 1 pool_max fp16 1
5 gpu conv fp16 12 add fp16 1 tanh fp16 1
6 gpu conv perf_fp16 157 add fp16 1 tanh fp16 1 pool_max fp16 1
7 gpu mul fp16 12 add fp16 1
8 gpu softmax fp32 1
-----
2739.950736
+++++
conf1 1 1 56.3 0.0
1 gpu conv fp32 11 add fp32 1 relu fp32 1 pool_max fp32 1
2 gpu conv fp32 11 add fp32 1 relu fp32 1 pool_max fp32 1
3 gpu conv fp32 11 add fp32 1 relu fp32 1
4 gpu conv fp32 11 add fp32 1 relu fp32 1
5 gpu conv fp32 11 add fp32 1 relu fp32 1 pool_max fp32 1
6 gpu mul fp32 11 add fp32 1 relu fp32 1
7 gpu mul fp32 11 add fp32 1 relu fp32 1
8 gpu mul fp32 11 add fp32 1
9 gpu softmax fp32 1
-----
+++++
conf2 1.802133644103582 1.8186433204507424 55.76 0.5399999999999991
1 gpu conv fp16 12 add fp16 1 relu fp16 1 pool_max fp16 1
2 gpu conv fp16 12 add fp16 1 relu fp16 1 pool_max fp16 1
3 gpu conv fp16 12 add fp16 1 relu fp16 1
4 gpu conv fp16 12 add fp16 1 relu fp16 1
5 gpu conv perf_fp16 157 add fp16 1 relu fp16 1 pool_max fp16 1
6 gpu mul fp16 12 add fp16 1 relu fp16 1
7 gpu mul fp16 12 add fp16 1 relu fp16 1
8 gpu mul fp16 12 add fp16 1
9 gpu softmax fp32 1
-----
+++++
conf3 1.7574572103878898 1.7673706184460103 55.58 0.7199999999999989
1 gpu conv fp16 12 add fp16 1 relu fp16 1 pool_max fp16 1
2 gpu conv fp16 12 add fp16 1 relu fp16 1 pool_max fp16 1
3 gpu conv fp16 12 add fp16 1 relu fp16 1
4 gpu conv fp16 12 add fp16 1 relu fp16 1
5 gpu conv samp_fp16 268 add fp16 1 relu fp16 1 pool_max fp16 1
6 gpu mul fp16 12 add fp16 1 relu fp16 1
7 gpu mul fp16 12 add fp16 1 relu fp16 1
8 gpu mul fp16 12 add fp16 1
9 gpu softmax fp32 1
-----
+++++
conf4 2.0227701930718065 2.043112495268932 55.42 0.8799999999999955
1 gpu conv fp16 12 add fp16 1 relu fp16 1 pool_max fp16 1
2 gpu conv perf_fp16 166 add fp16 1 relu fp16 1 pool_max fp16 1
3 gpu conv fp16 12 add fp16 1 relu fp16 1
4 gpu conv fp16 12 add fp16 1 relu fp16 1
5 gpu conv perf_fp16 157 add fp16 1 relu fp16 1 pool_max fp16 1
6 gpu mul fp16 12 add fp16 1 relu fp16 1
7 gpu mul fp16 12 add fp16 1 relu fp16 1
8 gpu mul fp16 12 add fp16 1
9 gpu softmax fp32 1
-----
+++++
conf5 1.9872634777043927 2.002789650227035 55.120000000000005 1.1799999999999926
1 gpu conv fp16 12 add fp16 1 relu fp16 1 pool_max fp16 1
2 gpu conv perf_fp16 164 add fp16 1 relu fp16 1 pool_max fp16 1
3 gpu conv fp16 12 add fp16 1 relu fp16 1
4 gpu conv fp16 12 add fp16 1 relu fp16 1
5 gpu conv perf_fp16 157 add fp16 1 relu fp16 1 pool_max fp16 1
6 gpu mul fp16 12 add fp16 1 relu fp16 1
7 gpu mul fp16 12 add fp16 1 relu fp16 1
8 gpu mul fp16 12 add fp16 1
9 gpu softmax fp32 1
-----
+++++
conf6 1.8204253918445088 1.843736069756362 54.84 1.4599999999999937
1 gpu conv fp16 12 add fp16 1 relu fp16 1 pool_max fp16 1
2 gpu conv fp16 12 add fp16 1 relu fp16 1 pool_max fp16 1
3 gpu conv fp16 12 add fp16 1 relu fp16 1
4 gpu conv perf_fp16 164 add fp16 1 relu fp16 1
5 gpu conv perf_fp16 154 add fp16 1 relu fp16 1 pool_max fp16 1
6 gpu mul fp16 12 add fp16 1 relu fp16 1
7 gpu mul fp16 12 add fp16 1 relu fp16 1
8 gpu mul fp16 12 add fp16 1
9 gpu softmax fp32 1
-----
+++++
conf7 1.9308336510645352 1.934889049414224 54.74 1.5599999999999952
1 gpu conv fp16 12 add fp16 1 relu fp16 1 pool_max fp16 1
2 gpu conv perf_fp16 168 add fp16 1 relu fp16 1 pool_max fp16 1
3 gpu conv fp16 12 add fp16 1 relu fp16 1
4 gpu conv perf_fp16 163 add fp16 1 relu fp16 1
5 gpu conv fp16 12 add fp16 1 relu fp16 1 pool_max fp16 1
6 gpu mul fp16 12 add fp16 1 relu fp16 1
7 gpu mul fp16 12 add fp16 1 relu fp16 1
8 gpu mul fp16 12 add fp16 1
9 gpu softmax fp32 1
-----
+++++
conf8 2.0146435217865446 2.0367475358800102 54.58 1.7199999999999989
1 gpu conv fp16 12 add fp16 1 relu fp16 1 pool_max fp16 1
2 gpu conv perf_fp16 162 add fp16 1 relu fp16 1 pool_max fp16 1
3 gpu conv fp16 12 add fp16 1 relu fp16 1
4 gpu conv fp16 12 add fp16 1 relu fp16 1
5 gpu conv perf_fp16 157 add fp16 1 relu fp16 1 pool_max fp16 1
6 gpu mul fp16 12 add fp16 1 relu fp16 1
7 gpu mul fp16 12 add fp16 1 relu fp16 1
8 gpu mul fp16 12 add fp16 1
9 gpu softmax fp32 1
-----
+++++
conf9 2.0101709494490696 2.0329911158023064 54.400000000000006 1.8999999999999915
1 gpu conv fp16 12 add fp16 1 relu fp16 1 pool_max fp16 1
2 gpu conv perf_fp16 164 add fp16 1 relu fp16 1 pool_max fp16 1
3 gpu conv fp16 12 add fp16 1 relu fp16 1
4 gpu conv perf_fp16 163 add fp16 1 relu fp16 1
5 gpu conv perf_fp16 152 add fp16 1 relu fp16 1 pool_max fp16 1
6 gpu mul fp16 12 add fp16 1 relu fp16 1
7 gpu mul fp16 12 add fp16 1 relu fp16 1
8 gpu mul fp16 12 add fp16 1
9 gpu softmax fp32 1
-----
+++++
conf10 2.0052132441967916 2.0284931705407003 54.300000000000004 1.999999999999993
1 gpu conv fp16 12 add fp16 1 relu fp16 1 pool_max fp16 1
2 gpu conv perf_fp16 168 add fp16 1 relu fp16 1 pool_max fp16 1
3 gpu conv fp16 12 add fp16 1 relu fp16 1
4 gpu conv perf_fp16 163 add fp16 1 relu fp16 1
5 gpu conv perf_fp16 157 add fp16 1 relu fp16 1 pool_max fp16 1
6 gpu mul fp16 12 add fp16 1 relu fp16 1
7 gpu mul fp16 12 add fp16 1 relu fp16 1
8 gpu mul fp16 12 add fp16 1
9 gpu softmax fp32 1
-----
+++++
conf11 2.010827434817262 2.036001862538864 54.2 2.0999999999999943
1 gpu conv fp16 12 add fp16 1 relu fp16 1 pool_max fp16 1
2 gpu conv perf_fp16 164 add fp16 1 relu fp16 1 pool_max fp16 1
3 gpu conv fp16 12 add fp16 1 relu fp16 1
4 gpu conv perf_fp16 163 add fp16 1 relu fp16 1
5 gpu conv perf_fp16 154 add fp16 1 relu fp16 1 pool_max fp16 1
6 gpu mul fp16 12 add fp16 1 relu fp16 1
7 gpu mul fp16 12 add fp16 1 relu fp16 1
8 gpu mul fp16 12 add fp16 1
9 gpu softmax fp32 1
-----
+++++
conf12 2.019868378233057 2.0433540129730265 54.17999999999999 2.1200000000000045
1 gpu conv fp16 12 add fp16 1 relu fp16 1 pool_max fp16 1
2 gpu conv perf_fp16 162 add fp16 1 relu fp16 1 pool_max fp16 1
3 gpu conv fp16 12 add fp16 1 relu fp16 1
4 gpu conv perf_fp16 163 add fp16 1 relu fp16 1
5 gpu conv perf_fp16 157 add fp16 1 relu fp16 1 pool_max fp16 1
6 gpu mul fp16 12 add fp16 1 relu fp16 1
7 gpu mul fp16 12 add fp16 1 relu fp16 1
8 gpu mul fp16 12 add fp16 1
9 gpu softmax fp32 1
-----
+++++
conf13 1.9923471030291253 2.009177323959059 54.120000000000005 2.1799999999999926
1 gpu conv fp16 12 add fp16 1 relu fp16 1 pool_max fp16 1
2 gpu conv perf_fp16 164 add fp16 1 relu fp16 1 pool_max fp16 1
3 gpu conv fp16 12 add fp16 1 relu fp16 1
4 gpu conv perf_fp16 163 add fp16 1 relu fp16 1
5 gpu conv perf_fp16 157 add fp16 1 relu fp16 1 pool_max fp16 1
6 gpu mul fp16 12 add fp16 1 relu fp16 1
7 gpu mul fp16 12 add fp16 1 relu fp16 1
8 gpu mul fp16 12 add fp16 1
9 gpu softmax fp32 1
-----
+++++
conf14 1.9923471030291253 2.009177323959059 54.120000000000005 2.1799999999999926
1 gpu conv fp16 12 add fp16 1 relu fp16 1 pool_max fp16 1
2 gpu conv perf_fp16 164 add fp16 1 relu fp16 1 pool_max fp16 1
3 gpu conv fp16 12 add fp16 1 relu fp16 1
4 gpu conv perf_fp16 163 add fp16 1 relu fp16 1
5 gpu conv perf_fp16 157 add fp16 1 relu fp16 1 pool_max fp16 1
6 gpu mul fp16 12 add fp16 1 relu fp16 1
7 gpu mul fp16 12 add fp16 1 relu fp16 1
8 gpu mul fp16 12 add fp16 1
9 gpu softmax fp32 1
-----
+++++
conf15 2.028037341700216 2.049760395549724 54.0 2.299999999999997
1 gpu conv fp16 12 add fp16 1 relu fp16 1 pool_max fp16 1
2 gpu conv perf_fp16 166 add fp16 1 relu fp16 1 pool_max fp16 1
3 gpu conv fp16 12 add fp16 1 relu fp16 1
4 gpu conv perf_fp16 163 add fp16 1 relu fp16 1
5 gpu conv perf_fp16 157 add fp16 1 relu fp16 1 pool_max fp16 1
6 gpu mul fp16 12 add fp16 1 relu fp16 1
7 gpu mul fp16 12 add fp16 1 relu fp16 1
8 gpu mul fp16 12 add fp16 1
9 gpu softmax fp32 1
-----
+++++
conf16 1.9910730364852436 2.006510848093771 53.54 2.759999999999998
1 gpu conv fp16 12 add fp16 1 relu fp16 1 pool_max fp16 1
2 gpu conv perf_fp16 164 add fp16 1 relu fp16 1 pool_max fp16 1
3 gpu conv fp16 12 add fp16 1 relu fp16 1
4 gpu conv perf_fp16 164 add fp16 1 relu fp16 1
5 gpu conv perf_fp16 157 add fp16 1 relu fp16 1 pool_max fp16 1
6 gpu mul fp16 12 add fp16 1 relu fp16 1
7 gpu mul fp16 12 add fp16 1 relu fp16 1
8 gpu mul fp16 12 add fp16 1
9 gpu softmax fp32 1
-----
+++++
conf17 2.1567475543719614 2.159142310265706 53.300000000000004 2.999999999999993
1 gpu conv perf_fp16 164 add fp16 1 relu fp16 1 pool_max fp16 1
2 gpu conv perf_fp16 166 add fp16 1 relu fp16 1 pool_max fp16 1
3 gpu conv fp16 12 add fp16 1 relu fp16 1
4 gpu conv perf_fp16 163 add fp16 1 relu fp16 1
5 gpu conv perf_fp16 157 add fp16 1 relu fp16 1 pool_max fp16 1
6 gpu mul fp16 12 add fp16 1 relu fp16 1
7 gpu mul fp16 12 add fp16 1 relu fp16 1
8 gpu mul fp16 12 add fp16 1
9 gpu softmax fp32 1
-----
+++++
conf18 2.1567475543719614 2.159142310265706 53.300000000000004 2.999999999999993
1 gpu conv perf_fp16 164 add fp16 1 relu fp16 1 pool_max fp16 1
2 gpu conv perf_fp16 166 add fp16 1 relu fp16 1 pool_max fp16 1
3 gpu conv fp16 12 add fp16 1 relu fp16 1
4 gpu conv perf_fp16 163 add fp16 1 relu fp16 1
5 gpu conv perf_fp16 157 add fp16 1 relu fp16 1 pool_max fp16 1
6 gpu mul fp16 12 add fp16 1 relu fp16 1
7 gpu mul fp16 12 add fp16 1 relu fp16 1
8 gpu mul fp16 12 add fp16 1
9 gpu softmax fp32 1
-----
+++++
conf19 2.0232690820426464 2.0527698121318476 53.300000000000004 2.999999999999993
1 gpu conv fp16 12 add fp16 1 relu fp16 1 pool_max fp16 1
2 gpu conv perf_fp16 168 add fp16 1 relu fp16 1 pool_max fp16 1
3 gpu conv fp16 11 add fp16 1 relu fp16 1
4 gpu conv perf_fp16 163 add fp16 1 relu fp16 1
5 gpu conv perf_fp16 152 add fp16 1 relu fp16 1 pool_max fp16 1
6 gpu mul fp16 12 add fp16 1 relu fp16 1
7 gpu mul fp16 12 add fp16 1 relu fp16 1
8 gpu mul fp16 12 add fp16 1
9 gpu softmax fp32 1
-----
282.5141369999999
+++++
conf1 1 1 98.7 0.0
1 gpu conv fp32 11 add fp32 1 pool_max fp32 1 tanh fp32 1
2 gpu conv fp32 11 add fp32 1 pool_max fp32 1 tanh fp32 1
3 gpu mul fp32 11 add fp32 1 tanh fp32 1
4 gpu mul fp32 11 add fp32 1 tanh fp32 1
5 gpu softmax fp32 1
-----
+++++
conf2 1.828613181003043 2.071721708828981 98.65 0.04999999999999716
1 gpu conv perf_fp16 156 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 261 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf3 1.8936889628815377 2.139779619692146 98.65 0.04999999999999716
1 gpu conv perf_fp16 152 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf4 1.8936889628815377 2.139779619692146 98.65 0.04999999999999716
1 gpu conv perf_fp16 152 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf5 1.8936889628815377 2.139779619692146 98.65 0.04999999999999716
1 gpu conv perf_fp16 152 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf6 1.8247639611533713 2.0227145446958756 98.64 0.060000000000002274
1 gpu conv fp16 11 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 261 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf7 1.8247639611533713 2.0227145446958756 98.64 0.060000000000002274
1 gpu conv fp16 11 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 261 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf8 1.8406161850501603 2.037849502542524 98.64 0.060000000000002274
1 gpu conv fp16 11 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf9 1.8406161850501603 2.037849502542524 98.64 0.060000000000002274
1 gpu conv fp16 11 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf10 1.8406161850501603 2.037849502542524 98.64 0.060000000000002274
1 gpu conv fp16 11 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf11 1.8663357888260776 2.115790921611576 98.64 0.060000000000002274
1 gpu conv perf_fp16 155 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf12 1.8663357888260776 2.115790921611576 98.64 0.060000000000002274
1 gpu conv perf_fp16 155 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf13 1.8663357888260776 2.115790921611576 98.64 0.060000000000002274
1 gpu conv perf_fp16 155 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf14 1.8645645142051612 2.1037012333044935 98.61999999999999 0.0800000000000125
1 gpu conv perf_fp16 167 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf15 1.8645645142051612 2.1037012333044935 98.61999999999999 0.0800000000000125
1 gpu conv perf_fp16 167 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf16 1.8645645142051612 2.1037012333044935 98.61999999999999 0.0800000000000125
1 gpu conv perf_fp16 167 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf17 2.2168527051833635 2.453341076720038 98.61999999999999 0.0800000000000125
1 gpu conv samp_fp16 264 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf18 2.2168527051833635 2.453341076720038 98.61999999999999 0.0800000000000125
1 gpu conv samp_fp16 264 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf19 2.2168527051833635 2.453341076720038 98.61999999999999 0.0800000000000125
1 gpu conv samp_fp16 264 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf20 1.8406161850501603 2.037849502542524 98.6 0.10000000000000853
1 gpu conv fp16 12 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf21 1.8406161850501603 2.037849502542524 98.6 0.10000000000000853
1 gpu conv fp16 12 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf22 1.8406161850501603 2.037849502542524 98.6 0.10000000000000853
1 gpu conv fp16 12 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf23 1.8406161850501603 2.037849502542524 98.6 0.10000000000000853
1 gpu conv fp16 11 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf24 1.8406161850501603 2.037849502542524 98.6 0.10000000000000853
1 gpu conv fp16 11 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf25 1.8406161850501603 2.037849502542524 98.6 0.10000000000000853
1 gpu conv fp16 11 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf26 2.200653361151419 2.425091789360736 98.6 0.10000000000000853
1 gpu conv samp_fp16 266 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf27 2.200653361151419 2.425091789360736 98.6 0.10000000000000853
1 gpu conv samp_fp16 266 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf28 1.8406161850501603 2.037849502542524 98.58 0.12000000000000455
1 gpu conv fp16 11 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf29 1.8406161850501603 2.037849502542524 98.58 0.12000000000000455
1 gpu conv fp16 11 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf30 1.8406161850501603 2.037849502542524 98.58 0.12000000000000455
1 gpu conv fp16 11 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf31 1.8445326456180258 2.087601822059355 98.58 0.12000000000000455
1 gpu conv perf_fp16 156 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf32 1.8445326456180258 2.087601822059355 98.58 0.12000000000000455
1 gpu conv perf_fp16 156 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf33 1.8445326456180258 2.087601822059355 98.58 0.12000000000000455
1 gpu conv perf_fp16 156 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf34 1.8916677984300285 2.155437579874673 98.58 0.12000000000000455
1 gpu conv perf_fp16 158 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf35 1.8916677984300285 2.155437579874673 98.58 0.12000000000000455
1 gpu conv perf_fp16 158 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf36 1.8916677984300285 2.155437579874673 98.58 0.12000000000000455
1 gpu conv perf_fp16 158 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf37 1.8649226857257986 2.1076025277601325 98.56 0.14000000000000057
1 gpu conv perf_fp16 168 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf38 1.8649226857257986 2.1076025277601325 98.56 0.14000000000000057
1 gpu conv perf_fp16 168 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf39 1.8649226857257986 2.1076025277601325 98.56 0.14000000000000057
1 gpu conv perf_fp16 168 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf40 1.8463058650555446 2.067271423078985 98.56 0.14000000000000057
1 gpu conv perf_fp16 157 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf41 1.8463058650555446 2.067271423078985 98.56 0.14000000000000057
1 gpu conv perf_fp16 157 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf42 1.8463058650555446 2.067271423078985 98.56 0.14000000000000057
1 gpu conv perf_fp16 157 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf43 1.9234076467497994 2.1864740913112275 98.56 0.14000000000000057
1 gpu conv perf_fp16 153 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf44 1.9234076467497994 2.1864740913112275 98.56 0.14000000000000057
1 gpu conv perf_fp16 153 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf45 1.9234076467497994 2.1864740913112275 98.56 0.14000000000000057
1 gpu conv perf_fp16 153 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf46 1.8698191484268973 2.13979218727595 98.54 0.1599999999999966
1 gpu conv perf_fp16 159 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf47 1.8698191484268973 2.13979218727595 98.54 0.1599999999999966
1 gpu conv perf_fp16 159 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf48 1.8575043605938137 2.092057786757256 98.52 0.18000000000000682
1 gpu conv perf_fp16 165 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf49 1.8575043605938137 2.092057786757256 98.52 0.18000000000000682
1 gpu conv perf_fp16 165 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf50 1.8575043605938137 2.092057786757256 98.52 0.18000000000000682
1 gpu conv perf_fp16 165 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 262 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
+++++
conf51 1.8534621507951072 2.1231113105788597 98.44000000000001 0.2599999999999909
1 gpu conv perf_fp16 159 add fp16 1 pool_max fp16 1 tanh fp16 1
2 gpu conv samp_fp16 261 add fp16 1 pool_max fp16 1 tanh fp16 1
3 gpu mul fp16 12 add fp16 1 tanh fp16 1
4 gpu mul fp16 12 add fp16 1 tanh fp16 1
5 gpu softmax fp32 1
-----
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment