From f8577472c4b4c9ba1445520c6b0dfc843c78bfa2 Mon Sep 17 00:00:00 2001
From: hsharif3 <ubuntu@ip-172-31-14-218.us-east-2.compute.internal>
Date: Sun, 17 Nov 2019 23:29:57 +0000
Subject: [PATCH] Adding pareto confs for LeNet

---
 .../tuner_pareto_confs_batch220.txt           | 904 ++++++++++++++++++
 1 file changed, 904 insertions(+)
 create mode 100644 llvm/test/VISC/DNN_Benchmarks/benchmarks/lenet/data/autotuner_data/tuner_pareto_confs_batch220.txt

diff --git a/llvm/test/VISC/DNN_Benchmarks/benchmarks/lenet/data/autotuner_data/tuner_pareto_confs_batch220.txt b/llvm/test/VISC/DNN_Benchmarks/benchmarks/lenet/data/autotuner_data/tuner_pareto_confs_batch220.txt
new file mode 100644
index 0000000000..20b92832d4
--- /dev/null
+++ b/llvm/test/VISC/DNN_Benchmarks/benchmarks/lenet/data/autotuner_data/tuner_pareto_confs_batch220.txt
@@ -0,0 +1,904 @@
++++++
+conf1 1 0 99.69 0
+1 gpu conv fp32 1 add fp32 1 pool_max fp32 1 tanh fp32 1 
+2 gpu conv fp32 1 add fp32 1 pool_max fp32 1 tanh fp32 1 
+3 gpu mul fp32 1 add fp32 1 tanh fp32 1 
+4 gpu mul fp32 1 add fp32 1 tanh fp32 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf1 2.01610051566 0 99.400002 0.6899979999999971
+1 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf2 2.01610051566 0 99.040001 0.974998499999991
+1 gpu conv perf 26 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf3 2.00016617632 0 99.68 0.4099999999999909
+1 gpu conv perf 23 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf4 2.00016617632 0 99.660004 0.42999599999999705
+1 gpu conv perf 29 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf5 1.97610564729 0 99.599998 0.4900019999999984
+1 gpu conv fp16 1 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf6 2.00016617632 0 99.599998 0.4900019999999984
+1 gpu conv perf 25 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf7 2.00016617632 0 99.080002 0.9149970000000067
+1 gpu conv perf 30 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf8 2.00016617632 0 99.239998 0.6750029999999967
+1 gpu conv perf 30 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf9 2.00016617632 0 99.199997 0.7350045000000023
+1 gpu conv perf 28 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf10 1.99590274244 0 99.099998 0.8850029999999975
+1 gpu conv samp 36 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf11 2.01610051566 0 99.559998 0.5300020000000046
+1 gpu conv perf 27 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf12 1.99590274244 0 99.540001 0.549998999999994
+1 gpu conv samp 33 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf13 2.00016617632 0 99.639999 0.45000099999999466
+1 gpu conv perf 30 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf14 1.99590274244 0 99.580002 0.5099980000000045
+1 gpu conv samp 33 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf15 2.01610051566 0 99.099998 0.8850029999999975
+1 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf16 2.01610051566 0 99.160004 0.7949939999999955
+1 gpu conv perf 27 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf17 2.00016617632 0 99.379997 0.46500449999999205
+1 gpu conv perf 29 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf18 1.99590274244 0 99.639999 0.45000099999999466
+1 gpu conv samp 36 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf19 2.01610051566 0 99.580002 0.5099980000000045
+1 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf20 1.97610564729 0 99.660004 0.42999599999999705
+1 gpu conv fp16 1 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf21 1.99590274244 0 99.440002 0.6499979999999909
+1 gpu conv samp 33 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf22 1.99590274244 0 99.260002 0.6449969999999965
+1 gpu conv samp 36 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf23 2.00016617632 0 99.360001 0.49499850000000123
+1 gpu conv perf 23 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf24 2.01610051566 0 99.32 0.5550000000000068
+1 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf25 2.00016617632 0 99.519997 0.5700029999999942
+1 gpu conv perf 30 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf26 1.97610564729 0 99.379997 0.46500449999999205
+1 gpu conv fp16 1 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf27 2.01610051566 0 99.68 0.4099999999999909
+1 gpu conv perf 27 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf28 2.00016617632 0 99.559998 0.5300020000000046
+1 gpu conv perf 23 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf29 2.00016617632 0 99.080002 0.9149970000000067
+1 gpu conv perf 23 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf30 1.97610564729 0 99.660004 0.42999599999999705
+1 gpu conv fp16 1 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf31 2.01610051566 0 99.599998 0.4900019999999984
+1 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf32 1.97610564729 0 99.080002 0.9149970000000067
+1 gpu conv fp16 1 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf33 2.01610051566 0 99.620003 0.4699970000000008
+1 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf34 2.00016617632 0 99.620003 0.4699970000000008
+1 gpu conv perf 28 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf35 2.00016617632 0 99.599998 0.4900019999999984
+1 gpu conv perf 25 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf36 1.99590274244 0 99.599998 0.4900019999999984
+1 gpu conv samp 36 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf37 2.01610051566 0 99.540001 0.549998999999994
+1 gpu conv perf 26 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf38 2.00016617632 0 99.339996 0.5250059999999976
+1 gpu conv perf 25 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf39 2.00016617632 0 99.599998 0.4900019999999984
+1 gpu conv perf 24 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf40 1.97610564729 0 99.379997 0.46500449999999205
+1 gpu conv fp16 1 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf41 2.00016617632 0 99.559998 0.5300020000000046
+1 gpu conv perf 28 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf42 1.99590274244 0 99.459999 0.6300010000000015
+1 gpu conv samp 34 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf43 1.99590274244 0 99.400002 0.6899979999999971
+1 gpu conv samp 34 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf44 2.00016617632 0 99.599998 0.4900019999999984
+1 gpu conv perf 29 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf45 2.01610051566 0 99.599998 0.4900019999999984
+1 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf46 2.01610051566 0 99.080002 0.9149970000000067
+1 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf47 2.01610051566 0 99.660004 0.42999599999999705
+1 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf48 2.00016617632 0 99.639999 0.45000099999999466
+1 gpu conv perf 24 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf49 2.01610051566 0 99.480003 0.6099970000000013
+1 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf50 2.00016617632 0 98.400002 1.9349969999999956
+1 gpu conv perf 23 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 26 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf51 2.01610051566 0 98.540001 1.724998499999991
+1 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 26 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf52 2.01610051566 0 99.080002 0.9149970000000067
+1 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf53 2.00016617632 0 99.660004 0.42999599999999705
+1 gpu conv perf 29 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf54 2.01610051566 0 99.660004 0.42999599999999705
+1 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf55 1.97610564729 0 99.599998 0.4900019999999984
+1 gpu conv fp16 1 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf56 2.01610051566 0 98.900002 1.1849969999999956
+1 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf57 1.99590274244 0 99.099998 0.8850029999999975
+1 gpu conv samp 36 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf58 2.01610051566 0 99.580002 0.5099980000000045
+1 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf59 1.97610564729 0 99.080002 0.9149970000000067
+1 gpu conv fp16 1 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf60 2.01610051566 0 98.959999 1.0950015000000022
+1 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf61 2.01610051566 0 99.220001 0.7049985000000021
+1 gpu conv perf 26 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf62 2.01610051566 0 98.839996 1.2750059999999976
+1 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf63 1.99590274244 0 98.940002 1.1249969999999863
+1 gpu conv samp 34 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf64 1.97610564729 0 99.379997 0.46500449999999205
+1 gpu conv fp16 1 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf65 2.00016617632 0 99.559998 0.5300020000000046
+1 gpu conv perf 23 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf66 2.00016617632 0 99.239998 0.6750029999999967
+1 gpu conv perf 30 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf67 2.01610051566 0 99.459999 0.6300010000000015
+1 gpu conv perf 26 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf68 2.00016617632 0 99.360001 0.49499850000000123
+1 gpu conv perf 24 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf69 2.01610051566 0 99.559998 0.5300020000000046
+1 gpu conv perf 27 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf70 1.99590274244 0 99.440002 0.6499979999999909
+1 gpu conv samp 33 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf71 2.00016617632 0 99.339996 0.5250059999999976
+1 gpu conv perf 25 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf72 2.01610051566 0 99.32 0.5550000000000068
+1 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf73 1.97610564729 0 99.379997 0.46500449999999205
+1 gpu conv fp16 1 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf74 2.00016617632 0 99.019997 1.0050044999999912
+1 gpu conv perf 29 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf75 1.99590274244 0 99.260002 0.6449969999999965
+1 gpu conv samp 36 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf76 2.01610051566 0 99.099998 0.8850029999999975
+1 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf77 1.97610564729 0 98.440002 1.8749969999999863
+1 gpu conv fp16 1 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 27 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf78 2.01610051566 0 98.440002 1.8749969999999863
+1 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 27 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf79 2.01610051566 0 99.160004 0.7949939999999955
+1 gpu conv perf 27 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf80 1.97610564729 0 98.480003 1.814995500000002
+1 gpu conv fp16 1 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 26 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf81 2.00016617632 0 99.360001 0.49499850000000123
+1 gpu conv perf 23 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf82 1.97610564729 0 99.660004 0.42999599999999705
+1 gpu conv fp16 1 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf83 1.99590274244 0 99.540001 0.549998999999994
+1 gpu conv samp 33 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf84 2.00016617632 0 99.199997 0.7350045000000023
+1 gpu conv perf 28 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf85 1.97610564729 0 98.440002 1.8749969999999863
+1 gpu conv fp16 1 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 27 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf86 2.00016617632 0 99.0 1.0349999999999966
+1 gpu conv perf 28 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf87 1.99590274244 0 98.519997 1.7550044999999912
+1 gpu conv samp 35 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf88 2.01610051566 0 99.400002 0.6899979999999971
+1 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf89 2.01610051566 0 97.760002 2.8949969999999965
+1 gpu conv perf 26 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 26 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf90 2.01610051566 0 99.519997 0.5700029999999942
+1 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf91 2.01610051566 0 99.32 0.5550000000000068
+1 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf92 2.01610051566 0 99.580002 0.5099980000000045
+1 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf93 2.01610051566 0 99.480003 0.6099970000000013
+1 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf94 2.01610051566 0 98.480003 1.814995500000002
+1 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf95 2.01610051566 0 98.540001 1.724998499999991
+1 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 26 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf96 2.01610051566 0 97.82 2.805000000000007
+1 gpu conv perf 27 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 26 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf97 2.01610051566 0 98.959999 1.0950015000000022
+1 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf98 2.01610051566 0 98.459999 1.8450015000000022
+1 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 26 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf99 2.01610051566 0 99.660004 0.42999599999999705
+1 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf100 2.01610051566 0 99.620003 0.4699970000000008
+1 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf101 2.01610051566 0 97.699997 2.9850045000000023
+1 gpu conv perf 27 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 27 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf102 2.01610051566 0 99.040001 0.974998499999991
+1 gpu conv perf 26 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf103 2.01610051566 0 98.0 2.5349999999999966
+1 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 27 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf104 2.01610051566 0 99.160004 0.7949939999999955
+1 gpu conv perf 27 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf105 2.01610051566 0 99.540001 0.549998999999994
+1 gpu conv perf 26 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf106 2.01610051566 0 99.519997 0.5700029999999942
+1 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf107 2.01610051566 0 99.099998 0.8850029999999975
+1 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 21 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf108 2.01610051566 0 98.120003 2.354995500000001
+1 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 26 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf109 2.01610051566 0 99.459999 0.6300010000000015
+1 gpu conv perf 26 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 31 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf110 2.01610051566 0 99.68 0.4099999999999909
+1 gpu conv perf 27 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf111 2.01610051566 0 98.839996 1.2750059999999976
+1 gpu conv samp 32 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
++++++
+conf112 2.01610051566 0 98.18 2.2649999999999864
+1 gpu conv perf 22 add fp16 1 tanh fp16 1 pool_max fp16 1 
+2 gpu conv perf 27 add fp16 1 tanh fp16 1 pool_max fp16 1 
+3 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+4 gpu mul fp16 1 add fp16 1 tanh fp16 1 
+5 gpu softmax fp32 1
+-----
-- 
GitLab