&&&& RUNNING TensorRT.trtexec # /home/ubuntu/klass_fr/tensorrt-5.1.6.0/aarch64-linux-gnu/samples/trtexec/build/trtexec --uff=./libs/klass_fr/tensor_rt/data/ssrnet_nchw.uff --uffInput=input_1,3,64,64 --output=ssr_function/mul_9 [I] uff: ./libs/klass_fr/tensor_rt/data/ssrnet_nchw.uff [I] uffInput: input_1,3,64,64 [I] output: ssr_function/mul_9 conv2d_7/Conv2D 0.097ms activation_7/Tanh 0.141ms max_pooling2d/MaxPool 0.071ms conv2d_8/Conv2D 0.079ms activation_8/Tanh 0.146ms conv2d_9/Conv2D 0.096ms activation_9/Tanh 0.132ms max_pooling2d_1/MaxPool 0.069ms conv2d_10/Conv2D 0.070ms activation_10/Tanh 0.149ms conv2d_11/Conv2D 0.071ms activation_11/Tanh 0.148ms max_pooling2d_2/MaxPool 0.072ms conv2d_12/Conv2D 0.067ms activation_12/Tanh 0.152ms conv2d_13/Conv2D 0.085ms activation_13/Tanh 0.133ms conv2d_15/Conv2D 0.072ms conv2d_15/Tanh 0.150ms max_pooling2d_3/MaxPool 0.074ms conv2d/Conv2D + activation/Relu 0.090ms average_pooling2d/AvgPool 0.051ms conv2d_1/Conv2D + activation_1/Relu 0.078ms conv2d_2/Conv2D + activation_2/Relu 0.060ms average_pooling2d_1/AvgPool 0.066ms conv2d_3/Conv2D + activation_3/Relu 0.078ms conv2d_4/Conv2D + activation_4/Relu 0.069ms average_pooling2d_2/AvgPool 0.065ms conv2d_5/Conv2D + activation_5/Relu 0.068ms conv2d_6/Conv2D + activation_6/Relu 0.083ms conv2d_14/Conv2D + conv2d_14/Relu 0.055ms average_pooling2d_3/AvgPool 0.068ms multiply/mul 0.071ms transpose + (Unnamed Layer* 165) [Shuffl 0.078ms dense_1/MatMul 0.071ms dense_1/BiasAdd + dense_1/Tanh 0.076ms offset_stage1/MatMul 0.068ms offset_stage1/BiasAdd + offset_stage1/Ta 0.074ms ssr_function/add 0.068ms conv2d_16/Conv2D 0.071ms conv2d_16/Tanh 0.152ms max_pooling2d_4/MaxPool 0.069ms conv2d_17/Conv2D + conv2d_17/Relu 0.069ms average_pooling2d_4/AvgPool 0.067ms multiply_1/mul 0.067ms transpose_1 + (Unnamed Layer* 196) [Shuf 0.073ms dense_4/MatMul 0.065ms dense_4/BiasAdd + dense_4/Tanh 0.070ms offset_stage2/MatMul 0.069ms offset_stage2/BiasAdd + offset_stage2/Ta 0.070ms ssr_function/add_1 0.069ms ssr_function/add copy 0.076ms offset_stage1/Tanh copy 0.076ms ssr_function/add_1 copy 0.078ms dense_2/MatMul 0.066ms dense_2/BiasAdd + dense_2/Relu 0.073ms reshape_1/Reshape 0.084ms ssr_function/Mul 0.068ms ssr_function/Reshape_3 0.075ms ssr_function/MatMul 0.068ms dense/MatMul 0.065ms dense/BiasAdd + dense/Tanh 0.070ms delta_stage1/MatMul 0.067ms delta_stage1/BiasAdd + delta_stage1/Tanh 0.075ms ssr_function/add_6 0.076ms ssr_function/mul_3 0.069ms ssr_function/truediv 0.067ms ssr_function/add_2 0.070ms ssr_function/add_3 0.069ms ssr_function/add_2 copy 0.073ms offset_stage2/Tanh copy 0.072ms ssr_function/add_3 copy 0.073ms dense_5/MatMul 0.068ms dense_5/BiasAdd + dense_5/Relu 0.072ms reshape_3/Reshape 0.080ms ssr_function/Mul_1 0.068ms ssr_function/Reshape_7 0.075ms ssr_function/MatMul_1 0.069ms dense_3/MatMul 0.066ms dense_3/BiasAdd + dense_3/Tanh 0.071ms delta_stage2/MatMul 0.067ms delta_stage2/BiasAdd + delta_stage2/Tanh 0.070ms ssr_function/add_7 0.069ms ssr_function/mul_4 0.067ms ssr_function/mul_6 0.070ms ssr_function/truediv_1 0.067ms ssr_function/add_9 0.068ms conv2d_18/Conv2D 0.073ms conv2d_18/Tanh 0.152ms max_pooling2d_5/MaxPool 0.073ms conv2d_19/Conv2D + conv2d_19/Relu 0.074ms average_pooling2d_5/AvgPool 0.070ms multiply_2/mul 0.068ms transpose_2 + (Unnamed Layer* 316) [Shuf 0.077ms dense_7/MatMul 0.080ms dense_7/BiasAdd + dense_7/Tanh 0.059ms offset_stage3/MatMul 0.067ms offset_stage3/BiasAdd + offset_stage3/Ta 0.072ms ssr_function/add_4 0.069ms ssr_function/add_5 0.069ms ssr_function/add_4 copy 0.075ms offset_stage3/Tanh copy 0.073ms ssr_function/add_5 copy 0.072ms dense_8/MatMul 0.078ms dense_8/BiasAdd + dense_8/Relu 0.057ms reshape_5/Reshape 0.078ms ssr_function/Mul_2 0.070ms ssr_function/Reshape_11 0.075ms ssr_function/MatMul_2 0.070ms ssr_function/mul_7 0.066ms dense_6/MatMul 0.081ms dense_6/BiasAdd + dense_6/Tanh 0.058ms delta_stage3/MatMul 0.067ms delta_stage3/BiasAdd + delta_stage3/Tanh 0.069ms ssr_function/add_8 0.070ms ssr_function/mul_5 0.075ms ssr_function/mul_8 0.067ms ssr_function/truediv_2 0.066ms ssr_function/add_10 0.065ms ssr_function/mul_9 0.069ms Time over all layers: 9.281 [I] Average over 10 runs is 10.8099 ms (host walltime is 10.8412 ms, 99% percentile time is 11.6637). conv2d_7/Conv2D 0.190ms activation_7/Tanh 0.274ms max_pooling2d/MaxPool 0.139ms conv2d_8/Conv2D 0.156ms activation_8/Tanh 0.284ms conv2d_9/Conv2D 0.186ms activation_9/Tanh 0.258ms max_pooling2d_1/MaxPool 0.141ms conv2d_10/Conv2D 0.139ms activation_10/Tanh 0.293ms conv2d_11/Conv2D 0.136ms activation_11/Tanh 0.296ms max_pooling2d_2/MaxPool 0.140ms conv2d_12/Conv2D 0.134ms activation_12/Tanh 0.300ms conv2d_13/Conv2D 0.167ms activation_13/Tanh 0.261ms conv2d_15/Conv2D 0.140ms conv2d_15/Tanh 0.295ms max_pooling2d_3/MaxPool 0.141ms conv2d/Conv2D + activation/Relu 0.182ms average_pooling2d/AvgPool 0.099ms conv2d_1/Conv2D + activation_1/Relu 0.152ms conv2d_2/Conv2D + activation_2/Relu 0.119ms average_pooling2d_1/AvgPool 0.132ms conv2d_3/Conv2D + activation_3/Relu 0.153ms conv2d_4/Conv2D + activation_4/Relu 0.135ms average_pooling2d_2/AvgPool 0.131ms conv2d_5/Conv2D + activation_5/Relu 0.134ms conv2d_6/Conv2D + activation_6/Relu 0.165ms conv2d_14/Conv2D + conv2d_14/Relu 0.105ms average_pooling2d_3/AvgPool 0.134ms multiply/mul 0.136ms transpose + (Unnamed Layer* 165) [Shuffl 0.149ms dense_1/MatMul 0.139ms dense_1/BiasAdd + dense_1/Tanh 0.145ms offset_stage1/MatMul 0.135ms offset_stage1/BiasAdd + offset_stage1/Ta 0.142ms ssr_function/add 0.139ms conv2d_16/Conv2D 0.141ms conv2d_16/Tanh 0.300ms max_pooling2d_4/MaxPool 0.137ms conv2d_17/Conv2D + conv2d_17/Relu 0.135ms average_pooling2d_4/AvgPool 0.132ms multiply_1/mul 0.131ms transpose_1 + (Unnamed Layer* 196) [Shuf 0.143ms dense_4/MatMul 0.130ms dense_4/BiasAdd + dense_4/Tanh 0.140ms offset_stage2/MatMul 0.136ms offset_stage2/BiasAdd + offset_stage2/Ta 0.137ms ssr_function/add_1 0.136ms ssr_function/add copy 0.148ms offset_stage1/Tanh copy 0.147ms ssr_function/add_1 copy 0.149ms dense_2/MatMul 0.130ms dense_2/BiasAdd + dense_2/Relu 0.141ms reshape_1/Reshape 0.163ms ssr_function/Mul 0.134ms ssr_function/Reshape_3 0.147ms ssr_function/MatMul 0.135ms dense/MatMul 0.129ms dense/BiasAdd + dense/Tanh 0.140ms delta_stage1/MatMul 0.131ms delta_stage1/BiasAdd + delta_stage1/Tanh 0.143ms ssr_function/add_6 0.143ms ssr_function/mul_3 0.136ms ssr_function/truediv 0.132ms ssr_function/add_2 0.137ms ssr_function/add_3 0.136ms ssr_function/add_2 copy 0.148ms offset_stage2/Tanh copy 0.142ms ssr_function/add_3 copy 0.143ms dense_5/MatMul 0.133ms dense_5/BiasAdd + dense_5/Relu 0.139ms reshape_3/Reshape 0.154ms ssr_function/Mul_1 0.133ms ssr_function/Reshape_7 0.150ms ssr_function/MatMul_1 0.134ms dense_3/MatMul 0.129ms dense_3/BiasAdd + dense_3/Tanh 0.138ms delta_stage2/MatMul 0.131ms delta_stage2/BiasAdd + delta_stage2/Tanh 0.138ms ssr_function/add_7 0.140ms ssr_function/mul_4 0.134ms ssr_function/mul_6 0.137ms ssr_function/truediv_1 0.131ms ssr_function/add_9 0.133ms conv2d_18/Conv2D 0.141ms conv2d_18/Tanh 0.300ms max_pooling2d_5/MaxPool 0.140ms conv2d_19/Conv2D + conv2d_19/Relu 0.142ms average_pooling2d_5/AvgPool 0.136ms multiply_2/mul 0.133ms transpose_2 + (Unnamed Layer* 316) [Shuf 0.150ms dense_7/MatMul 0.159ms dense_7/BiasAdd + dense_7/Tanh 0.116ms offset_stage3/MatMul 0.132ms offset_stage3/BiasAdd + offset_stage3/Ta 0.139ms ssr_function/add_4 0.137ms ssr_function/add_5 0.137ms ssr_function/add_4 copy 0.149ms offset_stage3/Tanh copy 0.143ms ssr_function/add_5 copy 0.142ms dense_8/MatMul 0.159ms dense_8/BiasAdd + dense_8/Relu 0.112ms reshape_5/Reshape 0.153ms ssr_function/Mul_2 0.138ms ssr_function/Reshape_11 0.149ms ssr_function/MatMul_2 0.136ms ssr_function/mul_7 0.132ms dense_6/MatMul 0.159ms dense_6/BiasAdd + dense_6/Tanh 0.112ms delta_stage3/MatMul 0.132ms delta_stage3/BiasAdd + delta_stage3/Tanh 0.137ms ssr_function/add_8 0.139ms ssr_function/mul_5 0.143ms ssr_function/mul_8 0.132ms ssr_function/truediv_2 0.133ms ssr_function/add_10 0.129ms ssr_function/mul_9 0.138ms Time over all layers: 18.233 [I] Average over 10 runs is 10.4067 ms (host walltime is 10.4342 ms, 99% percentile time is 10.7064). conv2d_7/Conv2D 0.280ms activation_7/Tanh 0.406ms max_pooling2d/MaxPool 0.206ms conv2d_8/Conv2D 0.231ms activation_8/Tanh 0.419ms conv2d_9/Conv2D 0.276ms activation_9/Tanh 0.387ms max_pooling2d_1/MaxPool 0.209ms conv2d_10/Conv2D 0.206ms activation_10/Tanh 0.441ms conv2d_11/Conv2D 0.203ms activation_11/Tanh 0.444ms max_pooling2d_2/MaxPool 0.209ms conv2d_12/Conv2D 0.201ms activation_12/Tanh 0.445ms conv2d_13/Conv2D 0.249ms activation_13/Tanh 0.390ms conv2d_15/Conv2D 0.210ms conv2d_15/Tanh 0.441ms max_pooling2d_3/MaxPool 0.209ms conv2d/Conv2D + activation/Relu 0.270ms average_pooling2d/AvgPool 0.147ms conv2d_1/Conv2D + activation_1/Relu 0.227ms conv2d_2/Conv2D + activation_2/Relu 0.179ms average_pooling2d_1/AvgPool 0.195ms conv2d_3/Conv2D + activation_3/Relu 0.229ms conv2d_4/Conv2D + activation_4/Relu 0.200ms average_pooling2d_2/AvgPool 0.196ms conv2d_5/Conv2D + activation_5/Relu 0.201ms conv2d_6/Conv2D + activation_6/Relu 0.247ms conv2d_14/Conv2D + conv2d_14/Relu 0.156ms average_pooling2d_3/AvgPool 0.199ms multiply/mul 0.206ms transpose + (Unnamed Layer* 165) [Shuffl 0.222ms dense_1/MatMul 0.207ms dense_1/BiasAdd + dense_1/Tanh 0.216ms offset_stage1/MatMul 0.200ms offset_stage1/BiasAdd + offset_stage1/Ta 0.210ms ssr_function/add 0.209ms conv2d_16/Conv2D 0.209ms conv2d_16/Tanh 0.449ms max_pooling2d_4/MaxPool 0.204ms conv2d_17/Conv2D + conv2d_17/Relu 0.200ms average_pooling2d_4/AvgPool 0.199ms multiply_1/mul 0.195ms transpose_1 + (Unnamed Layer* 196) [Shuf 0.213ms dense_4/MatMul 0.196ms dense_4/BiasAdd + dense_4/Tanh 0.208ms offset_stage2/MatMul 0.202ms offset_stage2/BiasAdd + offset_stage2/Ta 0.205ms ssr_function/add_1 0.205ms ssr_function/add copy 0.223ms offset_stage1/Tanh copy 0.218ms ssr_function/add_1 copy 0.218ms dense_2/MatMul 0.195ms dense_2/BiasAdd + dense_2/Relu 0.209ms reshape_1/Reshape 0.242ms ssr_function/Mul 0.199ms ssr_function/Reshape_3 0.228ms ssr_function/MatMul 0.201ms dense/MatMul 0.192ms dense/BiasAdd + dense/Tanh 0.208ms delta_stage1/MatMul 0.197ms delta_stage1/BiasAdd + delta_stage1/Tanh 0.211ms ssr_function/add_6 0.214ms ssr_function/mul_3 0.204ms ssr_function/truediv 0.197ms ssr_function/add_2 0.204ms ssr_function/add_3 0.206ms ssr_function/add_2 copy 0.219ms offset_stage2/Tanh copy 0.212ms ssr_function/add_3 copy 0.213ms dense_5/MatMul 0.199ms dense_5/BiasAdd + dense_5/Relu 0.209ms reshape_3/Reshape 0.230ms ssr_function/Mul_1 0.198ms ssr_function/Reshape_7 0.224ms ssr_function/MatMul_1 0.200ms dense_3/MatMul 0.194ms dense_3/BiasAdd + dense_3/Tanh 0.209ms delta_stage2/MatMul 0.199ms delta_stage2/BiasAdd + delta_stage2/Tanh 0.206ms ssr_function/add_7 0.208ms ssr_function/mul_4 0.201ms ssr_function/mul_6 0.202ms ssr_function/truediv_1 0.194ms ssr_function/add_9 0.201ms conv2d_18/Conv2D 0.209ms conv2d_18/Tanh 0.448ms max_pooling2d_5/MaxPool 0.210ms conv2d_19/Conv2D + conv2d_19/Relu 0.209ms average_pooling2d_5/AvgPool 0.204ms multiply_2/mul 0.199ms transpose_2 + (Unnamed Layer* 316) [Shuf 0.226ms dense_7/MatMul 0.239ms dense_7/BiasAdd + dense_7/Tanh 0.173ms offset_stage3/MatMul 0.197ms offset_stage3/BiasAdd + offset_stage3/Ta 0.206ms ssr_function/add_4 0.203ms ssr_function/add_5 0.204ms ssr_function/add_4 copy 0.221ms offset_stage3/Tanh copy 0.215ms ssr_function/add_5 copy 0.212ms dense_8/MatMul 0.237ms dense_8/BiasAdd + dense_8/Relu 0.166ms reshape_5/Reshape 0.228ms ssr_function/Mul_2 0.204ms ssr_function/Reshape_11 0.222ms ssr_function/MatMul_2 0.207ms ssr_function/mul_7 0.198ms dense_6/MatMul 0.238ms dense_6/BiasAdd + dense_6/Tanh 0.167ms delta_stage3/MatMul 0.197ms delta_stage3/BiasAdd + delta_stage3/Tanh 0.205ms ssr_function/add_8 0.206ms ssr_function/mul_5 0.211ms ssr_function/mul_8 0.196ms ssr_function/truediv_2 0.198ms ssr_function/add_10 0.192ms ssr_function/mul_9 0.206ms Time over all layers: 27.205 [I] Average over 10 runs is 10.4326 ms (host walltime is 10.4604 ms, 99% percentile time is 10.5315). conv2d_7/Conv2D 0.372ms activation_7/Tanh 0.537ms max_pooling2d/MaxPool 0.273ms conv2d_8/Conv2D 0.307ms activation_8/Tanh 0.556ms conv2d_9/Conv2D 0.371ms activation_9/Tanh 0.517ms max_pooling2d_1/MaxPool 0.277ms conv2d_10/Conv2D 0.272ms activation_10/Tanh 0.585ms conv2d_11/Conv2D 0.269ms activation_11/Tanh 0.589ms max_pooling2d_2/MaxPool 0.278ms conv2d_12/Conv2D 0.267ms activation_12/Tanh 0.594ms conv2d_13/Conv2D 0.332ms activation_13/Tanh 0.526ms conv2d_15/Conv2D 0.279ms conv2d_15/Tanh 0.586ms max_pooling2d_3/MaxPool 0.275ms conv2d/Conv2D + activation/Relu 0.357ms average_pooling2d/AvgPool 0.197ms conv2d_1/Conv2D + activation_1/Relu 0.301ms conv2d_2/Conv2D + activation_2/Relu 0.237ms average_pooling2d_1/AvgPool 0.262ms conv2d_3/Conv2D + activation_3/Relu 0.304ms conv2d_4/Conv2D + activation_4/Relu 0.265ms average_pooling2d_2/AvgPool 0.258ms conv2d_5/Conv2D + activation_5/Relu 0.267ms conv2d_6/Conv2D + activation_6/Relu 0.329ms conv2d_14/Conv2D + conv2d_14/Relu 0.209ms average_pooling2d_3/AvgPool 0.265ms multiply/mul 0.270ms transpose + (Unnamed Layer* 165) [Shuffl 0.294ms dense_1/MatMul 0.276ms dense_1/BiasAdd + dense_1/Tanh 0.285ms offset_stage1/MatMul 0.265ms offset_stage1/BiasAdd + offset_stage1/Ta 0.278ms ssr_function/add 0.278ms conv2d_16/Conv2D 0.276ms conv2d_16/Tanh 0.596ms max_pooling2d_4/MaxPool 0.272ms conv2d_17/Conv2D + conv2d_17/Relu 0.266ms average_pooling2d_4/AvgPool 0.264ms multiply_1/mul 0.260ms transpose_1 + (Unnamed Layer* 196) [Shuf 0.285ms dense_4/MatMul 0.264ms dense_4/BiasAdd + dense_4/Tanh 0.279ms offset_stage2/MatMul 0.267ms offset_stage2/BiasAdd + offset_stage2/Ta 0.272ms ssr_function/add_1 0.271ms ssr_function/add copy 0.296ms offset_stage1/Tanh copy 0.288ms ssr_function/add_1 copy 0.288ms dense_2/MatMul 0.259ms dense_2/BiasAdd + dense_2/Relu 0.277ms reshape_1/Reshape 0.326ms ssr_function/Mul 0.265ms ssr_function/Reshape_3 0.301ms ssr_function/MatMul 0.268ms dense/MatMul 0.260ms dense/BiasAdd + dense/Tanh 0.275ms delta_stage1/MatMul 0.262ms delta_stage1/BiasAdd + delta_stage1/Tanh 0.278ms ssr_function/add_6 0.281ms ssr_function/mul_3 0.270ms ssr_function/truediv 0.261ms ssr_function/add_2 0.270ms ssr_function/add_3 0.272ms ssr_function/add_2 copy 0.293ms offset_stage2/Tanh copy 0.282ms ssr_function/add_3 copy 0.284ms dense_5/MatMul 0.265ms dense_5/BiasAdd + dense_5/Relu 0.276ms reshape_3/Reshape 0.307ms ssr_function/Mul_1 0.266ms ssr_function/Reshape_7 0.297ms ssr_function/MatMul_1 0.265ms dense_3/MatMul 0.260ms dense_3/BiasAdd + dense_3/Tanh 0.277ms delta_stage2/MatMul 0.264ms delta_stage2/BiasAdd + delta_stage2/Tanh 0.276ms ssr_function/add_7 0.275ms ssr_function/mul_4 0.267ms ssr_function/mul_6 0.266ms ssr_function/truediv_1 0.259ms ssr_function/add_9 0.265ms conv2d_18/Conv2D 0.277ms conv2d_18/Tanh 0.597ms max_pooling2d_5/MaxPool 0.279ms conv2d_19/Conv2D + conv2d_19/Relu 0.281ms average_pooling2d_5/AvgPool 0.271ms multiply_2/mul 0.264ms transpose_2 + (Unnamed Layer* 316) [Shuf 0.297ms dense_7/MatMul 0.318ms dense_7/BiasAdd + dense_7/Tanh 0.229ms offset_stage3/MatMul 0.262ms offset_stage3/BiasAdd + offset_stage3/Ta 0.273ms ssr_function/add_4 0.270ms ssr_function/add_5 0.271ms ssr_function/add_4 copy 0.293ms offset_stage3/Tanh copy 0.285ms ssr_function/add_5 copy 0.282ms dense_8/MatMul 0.315ms dense_8/BiasAdd + dense_8/Relu 0.225ms reshape_5/Reshape 0.306ms ssr_function/Mul_2 0.272ms ssr_function/Reshape_11 0.296ms ssr_function/MatMul_2 0.273ms ssr_function/mul_7 0.263ms dense_6/MatMul 0.317ms dense_6/BiasAdd + dense_6/Tanh 0.220ms delta_stage3/MatMul 0.261ms delta_stage3/BiasAdd + delta_stage3/Tanh 0.273ms ssr_function/add_8 0.276ms ssr_function/mul_5 0.278ms ssr_function/mul_8 0.261ms ssr_function/truediv_2 0.265ms ssr_function/add_10 0.256ms ssr_function/mul_9 0.275ms Time over all layers: 36.153 [I] Average over 10 runs is 10.408 ms (host walltime is 10.4351 ms, 99% percentile time is 10.5045). conv2d_7/Conv2D 0.463ms activation_7/Tanh 0.667ms max_pooling2d/MaxPool 0.340ms conv2d_8/Conv2D 0.383ms activation_8/Tanh 0.693ms conv2d_9/Conv2D 0.461ms activation_9/Tanh 0.646ms max_pooling2d_1/MaxPool 0.343ms conv2d_10/Conv2D 0.339ms activation_10/Tanh 0.729ms conv2d_11/Conv2D 0.334ms activation_11/Tanh 0.735ms max_pooling2d_2/MaxPool 0.349ms conv2d_12/Conv2D 0.335ms activation_12/Tanh 0.739ms conv2d_13/Conv2D 0.414ms activation_13/Tanh 0.654ms conv2d_15/Conv2D 0.347ms conv2d_15/Tanh 0.731ms max_pooling2d_3/MaxPool 0.342ms conv2d/Conv2D + activation/Relu 0.446ms average_pooling2d/AvgPool 0.245ms conv2d_1/Conv2D + activation_1/Relu 0.377ms conv2d_2/Conv2D + activation_2/Relu 0.297ms average_pooling2d_1/AvgPool 0.325ms conv2d_3/Conv2D + activation_3/Relu 0.379ms conv2d_4/Conv2D + activation_4/Relu 0.332ms average_pooling2d_2/AvgPool 0.320ms conv2d_5/Conv2D + activation_5/Relu 0.333ms conv2d_6/Conv2D + activation_6/Relu 0.410ms conv2d_14/Conv2D + conv2d_14/Relu 0.258ms average_pooling2d_3/AvgPool 0.330ms multiply/mul 0.337ms transpose + (Unnamed Layer* 165) [Shuffl 0.364ms dense_1/MatMul 0.343ms dense_1/BiasAdd + dense_1/Tanh 0.353ms offset_stage1/MatMul 0.333ms offset_stage1/BiasAdd + offset_stage1/Ta 0.347ms ssr_function/add 0.345ms conv2d_16/Conv2D 0.343ms conv2d_16/Tanh 0.744ms max_pooling2d_4/MaxPool 0.339ms conv2d_17/Conv2D + conv2d_17/Relu 0.331ms average_pooling2d_4/AvgPool 0.332ms multiply_1/mul 0.326ms transpose_1 + (Unnamed Layer* 196) [Shuf 0.356ms dense_4/MatMul 0.329ms dense_4/BiasAdd + dense_4/Tanh 0.347ms offset_stage2/MatMul 0.332ms offset_stage2/BiasAdd + offset_stage2/Ta 0.339ms ssr_function/add_1 0.338ms ssr_function/add copy 0.369ms offset_stage1/Tanh copy 0.359ms ssr_function/add_1 copy 0.357ms dense_2/MatMul 0.325ms dense_2/BiasAdd + dense_2/Relu 0.346ms reshape_1/Reshape 0.411ms ssr_function/Mul 0.331ms ssr_function/Reshape_3 0.374ms ssr_function/MatMul 0.334ms dense/MatMul 0.323ms dense/BiasAdd + dense/Tanh 0.343ms delta_stage1/MatMul 0.326ms delta_stage1/BiasAdd + delta_stage1/Tanh 0.345ms ssr_function/add_6 0.348ms ssr_function/mul_3 0.337ms ssr_function/truediv 0.329ms ssr_function/add_2 0.338ms ssr_function/add_3 0.341ms ssr_function/add_2 copy 0.365ms offset_stage2/Tanh copy 0.353ms ssr_function/add_3 copy 0.354ms dense_5/MatMul 0.330ms dense_5/BiasAdd + dense_5/Relu 0.344ms reshape_3/Reshape 0.381ms ssr_function/Mul_1 0.332ms ssr_function/Reshape_7 0.373ms ssr_function/MatMul_1 0.331ms dense_3/MatMul 0.326ms dense_3/BiasAdd + dense_3/Tanh 0.345ms delta_stage2/MatMul 0.331ms delta_stage2/BiasAdd + delta_stage2/Tanh 0.344ms ssr_function/add_7 0.344ms ssr_function/mul_4 0.333ms ssr_function/mul_6 0.331ms ssr_function/truediv_1 0.324ms ssr_function/add_9 0.330ms conv2d_18/Conv2D 0.344ms conv2d_18/Tanh 0.745ms max_pooling2d_5/MaxPool 0.349ms conv2d_19/Conv2D + conv2d_19/Relu 0.349ms average_pooling2d_5/AvgPool 0.337ms multiply_2/mul 0.332ms transpose_2 + (Unnamed Layer* 316) [Shuf 0.368ms dense_7/MatMul 0.397ms dense_7/BiasAdd + dense_7/Tanh 0.286ms offset_stage3/MatMul 0.328ms offset_stage3/BiasAdd + offset_stage3/Ta 0.340ms ssr_function/add_4 0.337ms ssr_function/add_5 0.339ms ssr_function/add_4 copy 0.365ms offset_stage3/Tanh copy 0.359ms ssr_function/add_5 copy 0.352ms dense_8/MatMul 0.393ms dense_8/BiasAdd + dense_8/Relu 0.279ms reshape_5/Reshape 0.381ms ssr_function/Mul_2 0.338ms ssr_function/Reshape_11 0.369ms ssr_function/MatMul_2 0.338ms ssr_function/mul_7 0.328ms dense_6/MatMul 0.396ms dense_6/BiasAdd + dense_6/Tanh 0.276ms delta_stage3/MatMul 0.329ms delta_stage3/BiasAdd + delta_stage3/Tanh 0.341ms ssr_function/add_8 0.345ms ssr_function/mul_5 0.345ms ssr_function/mul_8 0.325ms ssr_function/truediv_2 0.329ms ssr_function/add_10 0.320ms ssr_function/mul_9 0.343ms Time over all layers: 45.088 [I] Average over 10 runs is 10.3822 ms (host walltime is 10.4095 ms, 99% percentile time is 10.5574). conv2d_7/Conv2D 0.555ms activation_7/Tanh 0.796ms max_pooling2d/MaxPool 0.407ms conv2d_8/Conv2D 0.459ms activation_8/Tanh 0.830ms conv2d_9/Conv2D 0.552ms activation_9/Tanh 0.772ms max_pooling2d_1/MaxPool 0.410ms conv2d_10/Conv2D 0.407ms activation_10/Tanh 0.874ms conv2d_11/Conv2D 0.400ms activation_11/Tanh 0.880ms max_pooling2d_2/MaxPool 0.417ms conv2d_12/Conv2D 0.403ms activation_12/Tanh 0.886ms conv2d_13/Conv2D 0.495ms activation_13/Tanh 0.783ms conv2d_15/Conv2D 0.415ms conv2d_15/Tanh 0.877ms max_pooling2d_3/MaxPool 0.409ms conv2d/Conv2D + activation/Relu 0.533ms average_pooling2d/AvgPool 0.295ms conv2d_1/Conv2D + activation_1/Relu 0.452ms conv2d_2/Conv2D + activation_2/Relu 0.355ms average_pooling2d_1/AvgPool 0.388ms conv2d_3/Conv2D + activation_3/Relu 0.459ms conv2d_4/Conv2D + activation_4/Relu 0.396ms average_pooling2d_2/AvgPool 0.382ms conv2d_5/Conv2D + activation_5/Relu 0.398ms conv2d_6/Conv2D + activation_6/Relu 0.492ms conv2d_14/Conv2D + conv2d_14/Relu 0.308ms average_pooling2d_3/AvgPool 0.396ms multiply/mul 0.403ms transpose + (Unnamed Layer* 165) [Shuffl 0.441ms dense_1/MatMul 0.411ms dense_1/BiasAdd + dense_1/Tanh 0.423ms offset_stage1/MatMul 0.397ms offset_stage1/BiasAdd + offset_stage1/Ta 0.415ms ssr_function/add 0.412ms conv2d_16/Conv2D 0.410ms conv2d_16/Tanh 0.890ms max_pooling2d_4/MaxPool 0.406ms conv2d_17/Conv2D + conv2d_17/Relu 0.396ms average_pooling2d_4/AvgPool 0.399ms multiply_1/mul 0.390ms transpose_1 + (Unnamed Layer* 196) [Shuf 0.426ms dense_4/MatMul 0.400ms dense_4/BiasAdd + dense_4/Tanh 0.416ms offset_stage2/MatMul 0.398ms offset_stage2/BiasAdd + offset_stage2/Ta 0.407ms ssr_function/add_1 0.405ms ssr_function/add copy 0.441ms offset_stage1/Tanh copy 0.430ms ssr_function/add_1 copy 0.427ms dense_2/MatMul 0.391ms dense_2/BiasAdd + dense_2/Relu 0.414ms reshape_1/Reshape 0.491ms ssr_function/Mul 0.397ms ssr_function/Reshape_3 0.447ms ssr_function/MatMul 0.399ms dense/MatMul 0.386ms dense/BiasAdd + dense/Tanh 0.412ms delta_stage1/MatMul 0.392ms delta_stage1/BiasAdd + delta_stage1/Tanh 0.414ms ssr_function/add_6 0.416ms ssr_function/mul_3 0.404ms ssr_function/truediv 0.394ms ssr_function/add_2 0.405ms ssr_function/add_3 0.411ms ssr_function/add_2 copy 0.438ms offset_stage2/Tanh copy 0.423ms ssr_function/add_3 copy 0.423ms dense_5/MatMul 0.395ms dense_5/BiasAdd + dense_5/Relu 0.412ms reshape_3/Reshape 0.456ms ssr_function/Mul_1 0.397ms ssr_function/Reshape_7 0.448ms ssr_function/MatMul_1 0.398ms dense_3/MatMul 0.391ms dense_3/BiasAdd + dense_3/Tanh 0.413ms delta_stage2/MatMul 0.397ms delta_stage2/BiasAdd + delta_stage2/Tanh 0.414ms ssr_function/add_7 0.412ms ssr_function/mul_4 0.400ms ssr_function/mul_6 0.395ms ssr_function/truediv_1 0.388ms ssr_function/add_9 0.395ms conv2d_18/Conv2D 0.412ms conv2d_18/Tanh 0.894ms max_pooling2d_5/MaxPool 0.422ms conv2d_19/Conv2D + conv2d_19/Relu 0.419ms average_pooling2d_5/AvgPool 0.406ms multiply_2/mul 0.397ms transpose_2 + (Unnamed Layer* 316) [Shuf 0.440ms dense_7/MatMul 0.475ms dense_7/BiasAdd + dense_7/Tanh 0.341ms offset_stage3/MatMul 0.393ms offset_stage3/BiasAdd + offset_stage3/Ta 0.408ms ssr_function/add_4 0.404ms ssr_function/add_5 0.406ms ssr_function/add_4 copy 0.437ms offset_stage3/Tanh copy 0.432ms ssr_function/add_5 copy 0.422ms dense_8/MatMul 0.473ms dense_8/BiasAdd + dense_8/Relu 0.336ms reshape_5/Reshape 0.456ms ssr_function/Mul_2 0.406ms ssr_function/Reshape_11 0.442ms ssr_function/MatMul_2 0.405ms ssr_function/mul_7 0.393ms dense_6/MatMul 0.474ms dense_6/BiasAdd + dense_6/Tanh 0.330ms delta_stage3/MatMul 0.396ms delta_stage3/BiasAdd + delta_stage3/Tanh 0.409ms ssr_function/add_8 0.414ms ssr_function/mul_5 0.412ms ssr_function/mul_8 0.390ms ssr_function/truediv_2 0.394ms ssr_function/add_10 0.383ms ssr_function/mul_9 0.410ms Time over all layers: 54.024 [I] Average over 10 runs is 10.3938 ms (host walltime is 10.4205 ms, 99% percentile time is 10.568). conv2d_7/Conv2D 0.646ms activation_7/Tanh 0.927ms max_pooling2d/MaxPool 0.474ms conv2d_8/Conv2D 0.536ms activation_8/Tanh 0.972ms conv2d_9/Conv2D 0.643ms activation_9/Tanh 0.905ms max_pooling2d_1/MaxPool 0.476ms conv2d_10/Conv2D 0.473ms activation_10/Tanh 1.019ms conv2d_11/Conv2D 0.466ms activation_11/Tanh 1.029ms max_pooling2d_2/MaxPool 0.486ms conv2d_12/Conv2D 0.469ms activation_12/Tanh 1.032ms conv2d_13/Conv2D 0.578ms activation_13/Tanh 0.919ms conv2d_15/Conv2D 0.483ms conv2d_15/Tanh 1.022ms max_pooling2d_3/MaxPool 0.478ms conv2d/Conv2D + activation/Relu 0.620ms average_pooling2d/AvgPool 0.345ms conv2d_1/Conv2D + activation_1/Relu 0.526ms conv2d_2/Conv2D + activation_2/Relu 0.413ms average_pooling2d_1/AvgPool 0.452ms conv2d_3/Conv2D + activation_3/Relu 0.534ms conv2d_4/Conv2D + activation_4/Relu 0.462ms average_pooling2d_2/AvgPool 0.444ms conv2d_5/Conv2D + activation_5/Relu 0.466ms conv2d_6/Conv2D + activation_6/Relu 0.575ms conv2d_14/Conv2D + conv2d_14/Relu 0.361ms average_pooling2d_3/AvgPool 0.462ms multiply/mul 0.468ms transpose + (Unnamed Layer* 165) [Shuffl 0.513ms dense_1/MatMul 0.478ms dense_1/BiasAdd + dense_1/Tanh 0.492ms offset_stage1/MatMul 0.465ms offset_stage1/BiasAdd + offset_stage1/Ta 0.483ms ssr_function/add 0.480ms conv2d_16/Conv2D 0.477ms conv2d_16/Tanh 1.038ms max_pooling2d_4/MaxPool 0.476ms conv2d_17/Conv2D + conv2d_17/Relu 0.463ms average_pooling2d_4/AvgPool 0.467ms multiply_1/mul 0.455ms transpose_1 + (Unnamed Layer* 196) [Shuf 0.496ms dense_4/MatMul 0.466ms dense_4/BiasAdd + dense_4/Tanh 0.485ms offset_stage2/MatMul 0.462ms offset_stage2/BiasAdd + offset_stage2/Ta 0.474ms ssr_function/add_1 0.472ms ssr_function/add copy 0.513ms offset_stage1/Tanh copy 0.500ms ssr_function/add_1 copy 0.497ms dense_2/MatMul 0.457ms dense_2/BiasAdd + dense_2/Relu 0.483ms reshape_1/Reshape 0.569ms ssr_function/Mul 0.467ms ssr_function/Reshape_3 0.521ms ssr_function/MatMul 0.466ms dense/MatMul 0.450ms dense/BiasAdd + dense/Tanh 0.481ms delta_stage1/MatMul 0.457ms delta_stage1/BiasAdd + delta_stage1/Tanh 0.481ms ssr_function/add_6 0.486ms ssr_function/mul_3 0.471ms ssr_function/truediv 0.458ms ssr_function/add_2 0.472ms ssr_function/add_3 0.478ms ssr_function/add_2 copy 0.509ms offset_stage2/Tanh copy 0.496ms ssr_function/add_3 copy 0.494ms dense_5/MatMul 0.461ms dense_5/BiasAdd + dense_5/Relu 0.482ms reshape_3/Reshape 0.531ms ssr_function/Mul_1 0.463ms ssr_function/Reshape_7 0.524ms ssr_function/MatMul_1 0.465ms dense_3/MatMul 0.455ms dense_3/BiasAdd + dense_3/Tanh 0.484ms delta_stage2/MatMul 0.463ms delta_stage2/BiasAdd + delta_stage2/Tanh 0.483ms ssr_function/add_7 0.480ms ssr_function/mul_4 0.467ms ssr_function/mul_6 0.460ms ssr_function/truediv_1 0.453ms ssr_function/add_9 0.460ms conv2d_18/Conv2D 0.481ms conv2d_18/Tanh 1.046ms max_pooling2d_5/MaxPool 0.490ms conv2d_19/Conv2D + conv2d_19/Relu 0.486ms average_pooling2d_5/AvgPool 0.473ms multiply_2/mul 0.462ms transpose_2 + (Unnamed Layer* 316) [Shuf 0.514ms dense_7/MatMul 0.554ms dense_7/BiasAdd + dense_7/Tanh 0.396ms offset_stage3/MatMul 0.458ms offset_stage3/BiasAdd + offset_stage3/Ta 0.474ms ssr_function/add_4 0.473ms ssr_function/add_5 0.473ms ssr_function/add_4 copy 0.512ms offset_stage3/Tanh copy 0.504ms ssr_function/add_5 copy 0.494ms dense_8/MatMul 0.551ms dense_8/BiasAdd + dense_8/Relu 0.390ms reshape_5/Reshape 0.531ms ssr_function/Mul_2 0.471ms ssr_function/Reshape_11 0.515ms ssr_function/MatMul_2 0.470ms ssr_function/mul_7 0.458ms dense_6/MatMul 0.552ms dense_6/BiasAdd + dense_6/Tanh 0.386ms delta_stage3/MatMul 0.461ms delta_stage3/BiasAdd + delta_stage3/Tanh 0.479ms ssr_function/add_8 0.482ms ssr_function/mul_5 0.479ms ssr_function/mul_8 0.456ms ssr_function/truediv_2 0.458ms ssr_function/add_10 0.448ms ssr_function/mul_9 0.478ms Time over all layers: 62.993 [I] Average over 10 runs is 10.4239 ms (host walltime is 10.4509 ms, 99% percentile time is 10.606). conv2d_7/Conv2D 0.737ms activation_7/Tanh 1.059ms max_pooling2d/MaxPool 0.541ms conv2d_8/Conv2D 0.614ms activation_8/Tanh 1.107ms conv2d_9/Conv2D 0.733ms activation_9/Tanh 1.037ms max_pooling2d_1/MaxPool 0.542ms conv2d_10/Conv2D 0.539ms activation_10/Tanh 1.164ms conv2d_11/Conv2D 0.532ms activation_11/Tanh 1.181ms max_pooling2d_2/MaxPool 0.555ms conv2d_12/Conv2D 0.535ms activation_12/Tanh 1.178ms conv2d_13/Conv2D 0.660ms activation_13/Tanh 1.047ms conv2d_15/Conv2D 0.550ms conv2d_15/Tanh 1.167ms max_pooling2d_3/MaxPool 0.546ms conv2d/Conv2D + activation/Relu 0.710ms average_pooling2d/AvgPool 0.395ms conv2d_1/Conv2D + activation_1/Relu 0.601ms conv2d_2/Conv2D + activation_2/Relu 0.470ms average_pooling2d_1/AvgPool 0.516ms conv2d_3/Conv2D + activation_3/Relu 0.610ms conv2d_4/Conv2D + activation_4/Relu 0.527ms average_pooling2d_2/AvgPool 0.505ms conv2d_5/Conv2D + activation_5/Relu 0.531ms conv2d_6/Conv2D + activation_6/Relu 0.657ms conv2d_14/Conv2D + conv2d_14/Relu 0.412ms average_pooling2d_3/AvgPool 0.527ms multiply/mul 0.532ms transpose + (Unnamed Layer* 165) [Shuffl 0.586ms dense_1/MatMul 0.546ms dense_1/BiasAdd + dense_1/Tanh 0.561ms offset_stage1/MatMul 0.530ms offset_stage1/BiasAdd + offset_stage1/Ta 0.551ms ssr_function/add 0.547ms conv2d_16/Conv2D 0.545ms conv2d_16/Tanh 1.187ms max_pooling2d_4/MaxPool 0.545ms conv2d_17/Conv2D + conv2d_17/Relu 0.530ms average_pooling2d_4/AvgPool 0.532ms multiply_1/mul 0.519ms transpose_1 + (Unnamed Layer* 196) [Shuf 0.566ms dense_4/MatMul 0.530ms dense_4/BiasAdd + dense_4/Tanh 0.552ms offset_stage2/MatMul 0.527ms offset_stage2/BiasAdd + offset_stage2/Ta 0.542ms ssr_function/add_1 0.539ms ssr_function/add copy 0.587ms offset_stage1/Tanh copy 0.570ms ssr_function/add_1 copy 0.568ms dense_2/MatMul 0.523ms dense_2/BiasAdd + dense_2/Relu 0.551ms reshape_1/Reshape 0.649ms ssr_function/Mul 0.532ms ssr_function/Reshape_3 0.594ms ssr_function/MatMul 0.531ms dense/MatMul 0.513ms dense/BiasAdd + dense/Tanh 0.548ms delta_stage1/MatMul 0.521ms delta_stage1/BiasAdd + delta_stage1/Tanh 0.548ms ssr_function/add_6 0.555ms ssr_function/mul_3 0.540ms ssr_function/truediv 0.526ms ssr_function/add_2 0.539ms ssr_function/add_3 0.544ms ssr_function/add_2 copy 0.582ms offset_stage2/Tanh copy 0.566ms ssr_function/add_3 copy 0.563ms dense_5/MatMul 0.527ms dense_5/BiasAdd + dense_5/Relu 0.550ms reshape_3/Reshape 0.606ms ssr_function/Mul_1 0.528ms ssr_function/Reshape_7 0.600ms ssr_function/MatMul_1 0.533ms dense_3/MatMul 0.519ms dense_3/BiasAdd + dense_3/Tanh 0.553ms delta_stage2/MatMul 0.529ms delta_stage2/BiasAdd + delta_stage2/Tanh 0.550ms ssr_function/add_7 0.548ms ssr_function/mul_4 0.533ms ssr_function/mul_6 0.524ms ssr_function/truediv_1 0.517ms ssr_function/add_9 0.524ms conv2d_18/Conv2D 0.551ms conv2d_18/Tanh 1.194ms max_pooling2d_5/MaxPool 0.557ms conv2d_19/Conv2D + conv2d_19/Relu 0.557ms average_pooling2d_5/AvgPool 0.539ms multiply_2/mul 0.527ms transpose_2 + (Unnamed Layer* 316) [Shuf 0.585ms dense_7/MatMul 0.634ms dense_7/BiasAdd + dense_7/Tanh 0.451ms offset_stage3/MatMul 0.524ms offset_stage3/BiasAdd + offset_stage3/Ta 0.541ms ssr_function/add_4 0.542ms ssr_function/add_5 0.543ms ssr_function/add_4 copy 0.584ms offset_stage3/Tanh copy 0.574ms ssr_function/add_5 copy 0.565ms dense_8/MatMul 0.629ms dense_8/BiasAdd + dense_8/Relu 0.444ms reshape_5/Reshape 0.606ms ssr_function/Mul_2 0.537ms ssr_function/Reshape_11 0.588ms ssr_function/MatMul_2 0.536ms ssr_function/mul_7 0.524ms dense_6/MatMul 0.630ms dense_6/BiasAdd + dense_6/Tanh 0.443ms delta_stage3/MatMul 0.526ms delta_stage3/BiasAdd + delta_stage3/Tanh 0.549ms ssr_function/add_8 0.550ms ssr_function/mul_5 0.546ms ssr_function/mul_8 0.521ms ssr_function/truediv_2 0.522ms ssr_function/add_10 0.512ms ssr_function/mul_9 0.545ms Time over all layers: 71.921 [I] Average over 10 runs is 10.379 ms (host walltime is 10.4065 ms, 99% percentile time is 10.6149). conv2d_7/Conv2D 0.831ms activation_7/Tanh 1.192ms max_pooling2d/MaxPool 0.608ms conv2d_8/Conv2D 0.692ms activation_8/Tanh 1.246ms conv2d_9/Conv2D 0.824ms activation_9/Tanh 1.164ms max_pooling2d_1/MaxPool 0.608ms conv2d_10/Conv2D 0.606ms activation_10/Tanh 1.308ms conv2d_11/Conv2D 0.602ms activation_11/Tanh 1.327ms max_pooling2d_2/MaxPool 0.624ms conv2d_12/Conv2D 0.601ms activation_12/Tanh 1.326ms conv2d_13/Conv2D 0.744ms activation_13/Tanh 1.182ms conv2d_15/Conv2D 0.619ms conv2d_15/Tanh 1.316ms max_pooling2d_3/MaxPool 0.613ms conv2d/Conv2D + activation/Relu 0.797ms average_pooling2d/AvgPool 0.442ms conv2d_1/Conv2D + activation_1/Relu 0.676ms conv2d_2/Conv2D + activation_2/Relu 0.528ms average_pooling2d_1/AvgPool 0.580ms conv2d_3/Conv2D + activation_3/Relu 0.688ms conv2d_4/Conv2D + activation_4/Relu 0.594ms average_pooling2d_2/AvgPool 0.568ms conv2d_5/Conv2D + activation_5/Relu 0.599ms conv2d_6/Conv2D + activation_6/Relu 0.739ms conv2d_14/Conv2D + conv2d_14/Relu 0.464ms average_pooling2d_3/AvgPool 0.594ms multiply/mul 0.600ms transpose + (Unnamed Layer* 165) [Shuffl 0.657ms dense_1/MatMul 0.614ms dense_1/BiasAdd + dense_1/Tanh 0.631ms offset_stage1/MatMul 0.595ms offset_stage1/BiasAdd + offset_stage1/Ta 0.620ms ssr_function/add 0.614ms conv2d_16/Conv2D 0.613ms conv2d_16/Tanh 1.336ms max_pooling2d_4/MaxPool 0.612ms conv2d_17/Conv2D + conv2d_17/Relu 0.597ms average_pooling2d_4/AvgPool 0.598ms multiply_1/mul 0.583ms transpose_1 + (Unnamed Layer* 196) [Shuf 0.637ms dense_4/MatMul 0.596ms dense_4/BiasAdd + dense_4/Tanh 0.622ms offset_stage2/MatMul 0.596ms offset_stage2/BiasAdd + offset_stage2/Ta 0.613ms ssr_function/add_1 0.607ms ssr_function/add copy 0.659ms offset_stage1/Tanh copy 0.640ms ssr_function/add_1 copy 0.640ms dense_2/MatMul 0.588ms dense_2/BiasAdd + dense_2/Relu 0.623ms reshape_1/Reshape 0.728ms ssr_function/Mul 0.599ms ssr_function/Reshape_3 0.668ms ssr_function/MatMul 0.597ms dense/MatMul 0.577ms dense/BiasAdd + dense/Tanh 0.619ms delta_stage1/MatMul 0.587ms delta_stage1/BiasAdd + delta_stage1/Tanh 0.616ms ssr_function/add_6 0.623ms ssr_function/mul_3 0.607ms ssr_function/truediv 0.591ms ssr_function/add_2 0.607ms ssr_function/add_3 0.614ms ssr_function/add_2 copy 0.654ms offset_stage2/Tanh copy 0.637ms ssr_function/add_3 copy 0.635ms dense_5/MatMul 0.594ms dense_5/BiasAdd + dense_5/Relu 0.619ms reshape_3/Reshape 0.685ms ssr_function/Mul_1 0.593ms ssr_function/Reshape_7 0.673ms ssr_function/MatMul_1 0.599ms dense_3/MatMul 0.582ms dense_3/BiasAdd + dense_3/Tanh 0.621ms delta_stage2/MatMul 0.594ms delta_stage2/BiasAdd + delta_stage2/Tanh 0.618ms ssr_function/add_7 0.615ms ssr_function/mul_4 0.601ms ssr_function/mul_6 0.589ms ssr_function/truediv_1 0.581ms ssr_function/add_9 0.589ms conv2d_18/Conv2D 0.619ms conv2d_18/Tanh 1.348ms max_pooling2d_5/MaxPool 0.626ms conv2d_19/Conv2D + conv2d_19/Relu 0.624ms average_pooling2d_5/AvgPool 0.607ms multiply_2/mul 0.592ms transpose_2 + (Unnamed Layer* 316) [Shuf 0.657ms dense_7/MatMul 0.712ms dense_7/BiasAdd + dense_7/Tanh 0.506ms offset_stage3/MatMul 0.589ms offset_stage3/BiasAdd + offset_stage3/Ta 0.610ms ssr_function/add_4 0.610ms ssr_function/add_5 0.610ms ssr_function/add_4 copy 0.656ms offset_stage3/Tanh copy 0.645ms ssr_function/add_5 copy 0.637ms dense_8/MatMul 0.708ms dense_8/BiasAdd + dense_8/Relu 0.502ms reshape_5/Reshape 0.682ms ssr_function/Mul_2 0.603ms ssr_function/Reshape_11 0.664ms ssr_function/MatMul_2 0.602ms ssr_function/mul_7 0.589ms dense_6/MatMul 0.711ms dense_6/BiasAdd + dense_6/Tanh 0.498ms delta_stage3/MatMul 0.591ms delta_stage3/BiasAdd + delta_stage3/Tanh 0.617ms ssr_function/add_8 0.617ms ssr_function/mul_5 0.614ms ssr_function/mul_8 0.586ms ssr_function/truediv_2 0.587ms ssr_function/add_10 0.579ms ssr_function/mul_9 0.614ms Time over all layers: 80.918 [I] Average over 10 runs is 10.455 ms (host walltime is 10.4822 ms, 99% percentile time is 10.6618). conv2d_7/Conv2D 0.923ms activation_7/Tanh 1.329ms max_pooling2d/MaxPool 0.675ms conv2d_8/Conv2D 0.768ms activation_8/Tanh 1.381ms conv2d_9/Conv2D 0.914ms activation_9/Tanh 1.291ms max_pooling2d_1/MaxPool 0.674ms conv2d_10/Conv2D 0.676ms activation_10/Tanh 1.457ms conv2d_11/Conv2D 0.668ms activation_11/Tanh 1.472ms max_pooling2d_2/MaxPool 0.692ms conv2d_12/Conv2D 0.668ms activation_12/Tanh 1.472ms conv2d_13/Conv2D 0.826ms activation_13/Tanh 1.315ms conv2d_15/Conv2D 0.687ms conv2d_15/Tanh 1.461ms max_pooling2d_3/MaxPool 0.681ms conv2d/Conv2D + activation/Relu 0.884ms average_pooling2d/AvgPool 0.491ms conv2d_1/Conv2D + activation_1/Relu 0.751ms conv2d_2/Conv2D + activation_2/Relu 0.586ms average_pooling2d_1/AvgPool 0.644ms conv2d_3/Conv2D + activation_3/Relu 0.763ms conv2d_4/Conv2D + activation_4/Relu 0.658ms average_pooling2d_2/AvgPool 0.629ms conv2d_5/Conv2D + activation_5/Relu 0.667ms conv2d_6/Conv2D + activation_6/Relu 0.826ms conv2d_14/Conv2D + conv2d_14/Relu 0.516ms average_pooling2d_3/AvgPool 0.659ms multiply/mul 0.666ms transpose + (Unnamed Layer* 165) [Shuffl 0.729ms dense_1/MatMul 0.681ms dense_1/BiasAdd + dense_1/Tanh 0.701ms offset_stage1/MatMul 0.660ms offset_stage1/BiasAdd + offset_stage1/Ta 0.687ms ssr_function/add 0.684ms conv2d_16/Conv2D 0.682ms conv2d_16/Tanh 1.484ms max_pooling2d_4/MaxPool 0.679ms conv2d_17/Conv2D + conv2d_17/Relu 0.663ms average_pooling2d_4/AvgPool 0.664ms multiply_1/mul 0.648ms transpose_1 + (Unnamed Layer* 196) [Shuf 0.707ms dense_4/MatMul 0.663ms dense_4/BiasAdd + dense_4/Tanh 0.691ms offset_stage2/MatMul 0.663ms offset_stage2/BiasAdd + offset_stage2/Ta 0.684ms ssr_function/add_1 0.675ms ssr_function/add copy 0.732ms offset_stage1/Tanh copy 0.711ms ssr_function/add_1 copy 0.710ms dense_2/MatMul 0.653ms dense_2/BiasAdd + dense_2/Relu 0.691ms reshape_1/Reshape 0.806ms ssr_function/Mul 0.664ms ssr_function/Reshape_3 0.741ms ssr_function/MatMul 0.663ms dense/MatMul 0.641ms dense/BiasAdd + dense/Tanh 0.692ms delta_stage1/MatMul 0.652ms delta_stage1/BiasAdd + delta_stage1/Tanh 0.684ms ssr_function/add_6 0.692ms ssr_function/mul_3 0.675ms ssr_function/truediv 0.656ms ssr_function/add_2 0.674ms ssr_function/add_3 0.681ms ssr_function/add_2 copy 0.725ms offset_stage2/Tanh copy 0.706ms ssr_function/add_3 copy 0.705ms dense_5/MatMul 0.660ms dense_5/BiasAdd + dense_5/Relu 0.690ms reshape_3/Reshape 0.760ms ssr_function/Mul_1 0.659ms ssr_function/Reshape_7 0.746ms ssr_function/MatMul_1 0.666ms dense_3/MatMul 0.646ms dense_3/BiasAdd + dense_3/Tanh 0.691ms delta_stage2/MatMul 0.658ms delta_stage2/BiasAdd + delta_stage2/Tanh 0.686ms ssr_function/add_7 0.682ms ssr_function/mul_4 0.668ms ssr_function/mul_6 0.655ms ssr_function/truediv_1 0.646ms ssr_function/add_9 0.656ms conv2d_18/Conv2D 0.687ms conv2d_18/Tanh 1.496ms max_pooling2d_5/MaxPool 0.692ms conv2d_19/Conv2D + conv2d_19/Relu 0.691ms average_pooling2d_5/AvgPool 0.674ms multiply_2/mul 0.657ms transpose_2 + (Unnamed Layer* 316) [Shuf 0.728ms dense_7/MatMul 0.792ms dense_7/BiasAdd + dense_7/Tanh 0.565ms offset_stage3/MatMul 0.654ms offset_stage3/BiasAdd + offset_stage3/Ta 0.676ms ssr_function/add_4 0.677ms ssr_function/add_5 0.676ms ssr_function/add_4 copy 0.728ms offset_stage3/Tanh copy 0.715ms ssr_function/add_5 copy 0.706ms dense_8/MatMul 0.786ms dense_8/BiasAdd + dense_8/Relu 0.556ms reshape_5/Reshape 0.758ms ssr_function/Mul_2 0.673ms ssr_function/Reshape_11 0.738ms ssr_function/MatMul_2 0.668ms ssr_function/mul_7 0.654ms dense_6/MatMul 0.789ms dense_6/BiasAdd + dense_6/Tanh 0.552ms delta_stage3/MatMul 0.655ms delta_stage3/BiasAdd + delta_stage3/Tanh 0.685ms ssr_function/add_8 0.685ms ssr_function/mul_5 0.681ms ssr_function/mul_8 0.650ms ssr_function/truediv_2 0.651ms ssr_function/add_10 0.642ms ssr_function/mul_9 0.684ms Time over all layers: 89.854 [I] Average over 10 runs is 10.3865 ms (host walltime is 10.4138 ms, 99% percentile time is 10.5859). &&&& PASSED TensorRT.trtexec # /home/ubuntu/klass_fr/tensorrt-5.1.6.0/aarch64-linux-gnu/samples/trtexec/build/trtexec --uff=./libs/klass_fr/tensor_rt/data/ssrnet_nchw.uff --uffInput=input_1,3,64,64 --output=ssr_function/mul_9