forked from octoml/qualcomm
-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathonnx_yolo_v3.float16.acc32.autotvm.log
31 lines (31 loc) · 23 KB
/
onnx_yolo_v3.float16.acc32.autotvm.log
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 3, 416, 416], "float16"], ["TENSOR", [32, 3, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 267, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 0], ["tile_y", "sp", [-1, 1, 8]], ["tile_x", "sp", [-1, 4, 4]], ["tile_rc", "sp", [-1, 1]]]}, "result": [[1000000000.0], 6, 15, 1690814668.390537], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 32, 416, 416], "float16"], ["TENSOR", [64, 32, 3, 3], "float16"], [2, 2], [1, 1, 0, 0], [1, 1], "float32"], {}], "config": {"index": 157208, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 8]], ["tile_y", "sp", [-1, 4, 2]], ["tile_x", "sp", [-1, 2, 4]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.0029332992000000004], 0, 30.25938105583191, 1690825087.441299], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 64, 208, 208], "float16"], ["TENSOR", [32, 64, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 1876, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 4]], ["tile_y", "sp", [-1, 4, 2]], ["tile_x", "sp", [-1, 1, 16]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 0]]}, "result": [[0.0007079321600000001], 0, 7.315176963806152, 1690829384.4008389], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 32, 208, 208], "float16"], ["TENSOR", [64, 32, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 170169, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 16]], ["tile_y", "sp", [-1, 4, 2]], ["tile_x", "sp", [-1, 2, 4]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.00215195136], 0, 72.7067060470581, 1690834264.227191], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 64, 208, 208], "float16"], ["TENSOR", [128, 64, 3, 3], "float16"], [2, 2], [1, 1, 0, 0], [1, 1], "float32"], {}], "config": {"index": 217853, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 32]], ["tile_y", "sp", [-1, 4, 2]], ["tile_x", "sp", [-1, 2, 2]], ["tile_rcc", "sp", [-1, 16]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.00241504768], 0, 56.67399787902832, 1690844045.893238], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 128, 104, 104], "float16"], ["TENSOR", [64, 128, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 35049, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 16]], ["tile_y", "sp", [-1, 1, 2]], ["tile_x", "sp", [-1, 4, 13]], ["tile_rcc", "sp", [-1, 32]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 1500], ["unroll_explicit", "ot", 0]]}, "result": [[0.00053093888], 0, 93.50106596946716, 1690852661.2861829], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 128, 104, 104], "float16"], ["TENSOR", [256, 128, 3, 3], "float16"], [2, 2], [1, 1, 0, 0], [1, 1], "float32"], {}], "config": {"index": 132546, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 16]], ["tile_y", "sp", [-1, 2, 1]], ["tile_x", "sp", [-1, 4, 13]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.0027640524799999997], 0, 45.50786781311035, 1690870120.003805], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 52, 52], "float16"], ["TENSOR", [128, 256, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 7041, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 32]], ["tile_y", "sp", [-1, 2, 13]], ["tile_x", "sp", [-1, 2, 1]], ["tile_rcc", "sp", [-1, 64]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 0]]}, "result": [[0.00047753728], 0, 6.669731616973877, 1690875019.0118248], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 128, 52, 52], "float16"], ["TENSOR", [256, 128, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 120835, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 2]], ["tile_y", "sp", [-1, 4, 13]], ["tile_x", "sp", [-1, 2, 13]], ["tile_rcc", "sp", [-1, 16]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.00249423872], 0, 28.215243101119995, 1690877953.09937], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 128, 52, 52], "float16"], ["TENSOR", [256, 128, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 221, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 16], ["tile_y", "sp", [-1, 2, 32]], ["tile_x", "sp", [-1, 13, 2]], ["tile_rc", "sp", [-1, 1]]]}, "result": [[0.0027899801600000003], 0, 126.55899000167847, 1690883398.779171], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 52, 52], "float16"], ["TENSOR", [512, 256, 3, 3], "float16"], [2, 2], [1, 1, 0, 0], [1, 1], "float32"], {}], "config": {"index": 426083, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 8]], ["tile_y", "sp", [-1, 2, 2]], ["tile_x", "sp", [-1, 4, 7]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.00292285952], 0, 41.66624116897583, 1690889107.494447], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 3, 416, 416], "float16"], ["TENSOR", [32, 3, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 38459, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 8]], ["tile_y", "sp", [-1, 1, 2]], ["tile_x", "sp", [-1, 8, 4]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.00073589248], 0, 91.71014308929443, 1691018875.762337], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 512, 26, 26], "float16"], ["TENSOR", [256, 512, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 163039, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 16]], ["tile_y", "sp", [-1, 2, 14]], ["tile_x", "sp", [-1, 4, 1]], ["tile_rcc", "sp", [-1, 64]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 1500], ["unroll_explicit", "ot", 1]]}, "result": [[0.0003975168], 0, 44.48691368103027, 1691029331.843828], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 26, 26], "float16"], ["TENSOR", [512, 256, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 394512, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 8]], ["tile_y", "sp", [-1, 1, 14]], ["tile_x", "sp", [-1, 7, 2]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.00261305856], 0, 7.017369031906128, 1691032857.581459], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 256, 26, 26], "float16"], ["TENSOR", [512, 256, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 1913, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 16], ["tile_y", "sp", [-1, 2, 64]], ["tile_x", "sp", [-1, 13, 1]], ["tile_rc", "sp", [-1, 32]]]}, "result": [[0.00194985984], 0, 7.836325168609619, 1691035718.447256], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 512, 26, 26], "float16"], ["TENSOR", [1024, 512, 3, 3], "float16"], [2, 2], [1, 1, 0, 0], [1, 1], "float32"], {}], "config": {"index": 620066, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 32]], ["tile_y", "sp", [-1, 1, 4]], ["tile_x", "sp", [-1, 8, 2]], ["tile_rcc", "sp", [-1, 64]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.0028223180800000004], 0, 73.82217812538147, 1691041407.473459], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 1024, 13, 13], "float16"], ["TENSOR", [512, 1024, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 178767, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 32]], ["tile_y", "sp", [-1, 2, 2]], ["tile_x", "sp", [-1, 4, 2]], ["tile_rcc", "sp", [-1, 32]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 512], ["unroll_explicit", "ot", 1]]}, "result": [[0.0004279808], 0, 53.54822134971619, 1691044104.540429], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 512, 13, 13], "float16"], ["TENSOR", [1024, 512, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 721641, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 32]], ["tile_y", "sp", [-1, 1, 8]], ["tile_x", "sp", [-1, 8, 1]], ["tile_rcc", "sp", [-1, 8]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 512], ["unroll_explicit", "ot", 1]]}, "result": [[0.0027130214400000003], 0, 48.0325140953064, 1691051534.4182558], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 512, 13, 13], "float16"], ["TENSOR", [1024, 512, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 3547, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 4], ["tile_y", "sp", [-1, 2, 64]], ["tile_x", "sp", [-1, 7, 1]], ["tile_rc", "sp", [-1, 128]]]}, "result": [[0.0027378688], 0, 13.648095607757568, 1691057200.157311], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 512, 13, 13], "float16"], ["TENSOR", [256, 512, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 119146, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 4]], ["tile_y", "sp", [-1, 1, 8]], ["tile_x", "sp", [-1, 4, 4]], ["tile_rcc", "sp", [-1, 2]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 512], ["unroll_explicit", "ot", 1]]}, "result": [[0.00014060032], 0, 17.736218452453613, 1691061020.1556292], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 768, 26, 26], "float16"], ["TENSOR", [256, 768, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 253038, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 16]], ["tile_y", "sp", [-1, 2, 1]], ["tile_x", "sp", [-1, 2, 7]], ["tile_rcc", "sp", [-1, 2]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 1500], ["unroll_explicit", "ot", 1]]}, "result": [[0.0006355302399999999], 0, 6.875800132751465, 1691062052.7584362], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 26, 26], "float16"], ["TENSOR", [128, 256, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 16808, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 8]], ["tile_y", "sp", [-1, 2, 7]], ["tile_x", "sp", [-1, 2, 1]], ["tile_rcc", "sp", [-1, 64]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 0]]}, "result": [[0.00013243904], 0, 36.61856460571289, 1691069623.9450722], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 384, 52, 52], "float16"], ["TENSOR", [128, 384, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 70907, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 16]], ["tile_y", "sp", [-1, 1, 13]], ["tile_x", "sp", [-1, 2, 2]], ["tile_rcc", "sp", [-1, 3]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 1500], ["unroll_explicit", "ot", 1]]}, "result": [[0.0007732326399999999], 0, 12.771561861038208, 1691071200.4426088], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 52, 52], "float16"], ["TENSOR", [255, 256, 3, 3], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 158786, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 8]], ["tile_y", "sp", [-1, 2, 1]], ["tile_x", "sp", [-1, 4, 13]], ["tile_rcc", "sp", [-1, 8]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.00423665664], 0, 48.57140398025513, 1691076997.756667], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 256, 52, 52], "float16"], ["TENSOR", [255, 256, 3, 3], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 2398, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 4], ["tile_y", "sp", [-1, 1, 64]], ["tile_x", "sp", [-1, 5, 1]], ["tile_rc", "sp", [-1, 32]]]}, "result": [[0.0040536832], 0, 87.6362476348877, 1691081843.272956], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 512, 26, 26], "float16"], ["TENSOR", [255, 512, 3, 3], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 1277224, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 32]], ["tile_y", "sp", [-1, 3, 1]], ["tile_x", "sp", [-1, 2, 12]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.00185388544], 0, 58.60425090789795, 1691091529.977343], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 512, 26, 26], "float16"], ["TENSOR", [255, 512, 3, 3], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 12435, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 0], ["tile_y", "sp", [-1, 2, 16]], ["tile_x", "sp", [-1, 6, 4]], ["tile_rc", "sp", [-1, 16]]]}, "result": [[0.00148004864], 0, 50.377469062805176, 1691095418.441068], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 1024, 13, 13], "float16"], ["TENSOR", [255, 1024, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 131019, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 32]], ["tile_y", "sp", [-1, 2, 8]], ["tile_x", "sp", [-1, 2, 1]], ["tile_rcc", "sp", [-1, 2]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 512], ["unroll_explicit", "ot", 1]]}, "result": [[0.00026634752], 0, 67.68352127075195, 1691100144.5741272], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 32, 208, 208], "float16"], ["TENSOR", [64, 32, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 2159, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 16], ["tile_y", "sp", [-1, 1, 16]], ["tile_x", "sp", [-1, 4, 4]], ["tile_rc", "sp", [-1, 4]]]}, "result": [[0.004093742080000001], 0, 36.043375968933105, 1691418573.319615], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 64, 104, 104], "float16"], ["TENSOR", [128, 64, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 212365, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 32]], ["tile_y", "sp", [-1, 4, 2]], ["tile_x", "sp", [-1, 2, 2]], ["tile_rcc", "sp", [-1, 4]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.0021057638399999998], 0, 30.009414434432983, 1691422698.221246], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 64, 104, 104], "float16"], ["TENSOR", [128, 64, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 1241, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 16], ["tile_y", "sp", [-1, 8, 4]], ["tile_x", "sp", [-1, 4, 13]], ["tile_rc", "sp", [-1, 4]]]}, "result": [[0.00260759552], 0, 67.13081622123718, 1691427169.212605], "version": 0.2, "tvm_version": "0.14.dev0"}