forked from octoml/qualcomm
-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathonnx_ssd_resnet34.float32.autotvm.log
34 lines (34 loc) · 25.5 KB
/
onnx_ssd_resnet34.float32.autotvm.log
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 3, 1200, 1200], "float32"], ["TENSOR", [64, 3, 7, 7], "float32"], [2, 2], [3, 3, 3, 3], [1, 1], "float32"], {}], "config": {"index": 297518, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 8]], ["tile_y", "sp", [-1, 1, 4]], ["tile_x", "sp", [-1, 6, 4]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 7]], ["tile_rx", "sp", [-1, 7]], ["auto_unroll_max_step", "ot", 1500], ["unroll_explicit", "ot", 0]]}, "result": [[0.01327192064], 0, 55.35299491882324, 1688392962.229266], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 64, 300, 300], "float32"], ["TENSOR", [64, 64, 3, 3], "float32"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 78739, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 16]], ["tile_y", "sp", [-1, 2, 2]], ["tile_x", "sp", [-1, 5, 4]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 0]]}, "result": [[0.009892096], 0, 46.69255232810974, 1688395332.1541839], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 128, 150, 150], "float32"], ["TENSOR", [256, 128, 3, 3], "float32"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 85840, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 32]], ["tile_y", "sp", [-1, 2, 4]], ["tile_x", "sp", [-1, 4, 2]], ["tile_rcc", "sp", [-1, 32]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 512], ["unroll_explicit", "ot", 0]]}, "result": [[0.01768662528], 0, 8.310285806655884, 1689515619.246023], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 128, 150, 150], "float32"], ["TENSOR", [256, 128, 3, 3], "float32"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 4722, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 0], ["tile_y", "sp", [-1, 1, 64]], ["tile_x", "sp", [-1, 9, 1]], ["tile_rc", "sp", [-1, 8]]]}, "result": [[0.021760645119999998], 0, 55.300305128097534, 1689517676.3759391], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 256, 150, 150], "float32"], ["TENSOR", [256, 256, 3, 3], "float32"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 9224, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 16], ["tile_y", "sp", [-1, 1, 64]], ["tile_x", "sp", [-1, 9, 1]], ["tile_rc", "sp", [-1, 64]]]}, "result": [[0.03994763264], 0, 27.873415231704712, 1689530862.205327], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 150, 150], "float32"], ["TENSOR", [256, 256, 3, 3], "float32"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 151915, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 16]], ["tile_y", "sp", [-1, 1, 8]], ["tile_x", "sp", [-1, 8, 1]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.036356357119999995], 0, 11.544915676116943, 1689534972.405212], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 3, 416, 416], "float32"], ["TENSOR", [32, 3, 3, 3], "float32"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 28229, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 8]], ["tile_y", "sp", [-1, 1, 1]], ["tile_x", "sp", [-1, 4, 8]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 1500], ["unroll_explicit", "ot", 0]]}, "result": [[0.0009668044800000001], 0, 7.085740089416504, 1690504424.1229172], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 32, 416, 416], "float32"], ["TENSOR", [64, 32, 3, 3], "float32"], [2, 2], [1, 1, 0, 0], [1, 1], "float32"], {}], "config": {"index": 46708, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 8]], ["tile_y", "sp", [-1, 1, 4]], ["tile_x", "sp", [-1, 8, 2]], ["tile_rcc", "sp", [-1, 4]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 0]]}, "result": [[0.00344335872], 0, 67.38153100013733, 1690512105.406295], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 64, 208, 208], "float32"], ["TENSOR", [32, 64, 1, 1], "float32"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 23237, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 8]], ["tile_y", "sp", [-1, 4, 1]], ["tile_x", "sp", [-1, 1, 16]], ["tile_rcc", "sp", [-1, 2]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 1500], ["unroll_explicit", "ot", 0]]}, "result": [[0.0010171392], 0, 69.91663408279419, 1690514187.714591], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 32, 208, 208], "float32"], ["TENSOR", [64, 32, 3, 3], "float32"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 44308, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 8]], ["tile_y", "sp", [-1, 4, 1]], ["tile_x", "sp", [-1, 2, 8]], ["tile_rcc", "sp", [-1, 2]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 0]]}, "result": [[0.00238115328], 0, 43.60479211807251, 1690522025.3913522], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 64, 208, 208], "float32"], ["TENSOR", [128, 64, 3, 3], "float32"], [2, 2], [1, 1, 0, 0], [1, 1], "float32"], {}], "config": {"index": 163714, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 16]], ["tile_y", "sp", [-1, 8, 1]], ["tile_x", "sp", [-1, 1, 8]], ["tile_rcc", "sp", [-1, 16]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 1500], ["unroll_explicit", "ot", 0]]}, "result": [[0.00280019968], 0, 66.05893087387085, 1690526809.3885179], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 128, 104, 104], "float32"], ["TENSOR", [64, 128, 1, 1], "float32"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 20788, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 8]], ["tile_y", "sp", [-1, 4, 2]], ["tile_x", "sp", [-1, 2, 4]], ["tile_rcc", "sp", [-1, 16]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 512], ["unroll_explicit", "ot", 0]]}, "result": [[0.0006497791999999999], 0, 14.802577018737793, 1690532721.836989], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 64, 104, 104], "float32"], ["TENSOR", [128, 64, 3, 3], "float32"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 17190, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 16]], ["tile_y", "sp", [-1, 1, 8]], ["tile_x", "sp", [-1, 8, 1]], ["tile_rcc", "sp", [-1, 2]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 0]]}, "result": [[0.00230388224], 0, 71.52445602416992, 1690538673.585098], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 128, 104, 104], "float32"], ["TENSOR", [256, 128, 3, 3], "float32"], [2, 2], [1, 1, 0, 0], [1, 1], "float32"], {}], "config": {"index": 53674, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 32]], ["tile_y", "sp", [-1, 4, 1]], ["tile_x", "sp", [-1, 2, 13]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 512], ["unroll_explicit", "ot", 0]]}, "result": [[0.003381248], 0, 72.11251401901245, 1690543420.674318], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 52, 52], "float32"], ["TENSOR", [128, 256, 1, 1], "float32"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 21905, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 8]], ["tile_y", "sp", [-1, 2, 13]], ["tile_x", "sp", [-1, 4, 1]], ["tile_rcc", "sp", [-1, 32]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 1500], ["unroll_explicit", "ot", 0]]}, "result": [[0.0006062336000000001], 0, 14.144606828689575, 1690548321.011746], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 128, 52, 52], "float32"], ["TENSOR", [256, 128, 3, 3], "float32"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 45069, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 32]], ["tile_y", "sp", [-1, 2, 1]], ["tile_x", "sp", [-1, 4, 13]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 512], ["unroll_explicit", "ot", 0]]}, "result": [[0.0026471424000000005], 0, 42.7782723903656, 1690554088.838741], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 128, 52, 52], "float32"], ["TENSOR", [256, 128, 3, 3], "float32"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 3072, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 0], ["tile_y", "sp", [-1, 1, 64]], ["tile_x", "sp", [-1, 4, 1]], ["tile_rc", "sp", [-1, 32]]]}, "result": [[0.0031269990400000004], 0, 62.18325734138489, 1690557511.017538], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 52, 52], "float32"], ["TENSOR", [512, 256, 3, 3], "float32"], [2, 2], [1, 1, 0, 0], [1, 1], "float32"], {}], "config": {"index": 31389, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 32]], ["tile_y", "sp", [-1, 1, 14]], ["tile_x", "sp", [-1, 7, 1]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 0]]}, "result": [[0.00304577536], 0, 7.796635150909424, 1690566035.70511], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 512, 26, 26], "float32"], ["TENSOR", [256, 512, 1, 1], "float32"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 22297, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 16]], ["tile_y", "sp", [-1, 7, 2]], ["tile_x", "sp", [-1, 1, 2]], ["tile_rcc", "sp", [-1, 64]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 0]]}, "result": [[0.00039231488], 0, 62.29633164405823, 1690571802.978019], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 26, 26], "float32"], ["TENSOR", [512, 256, 3, 3], "float32"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 62994, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 8]], ["tile_y", "sp", [-1, 1, 4]], ["tile_x", "sp", [-1, 7, 4]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 0]]}, "result": [[0.0026364416], 0, 23.647432804107666, 1690575186.73526], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 256, 26, 26], "float32"], ["TENSOR", [512, 256, 3, 3], "float32"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 2257, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 4], ["tile_y", "sp", [-1, 1, 64]], ["tile_x", "sp", [-1, 13, 1]], ["tile_rc", "sp", [-1, 64]]]}, "result": [[0.00309674496], 0, 52.16355895996094, 1690582450.9915469], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 512, 26, 26], "float32"], ["TENSOR", [1024, 512, 3, 3], "float32"], [2, 2], [1, 1, 0, 0], [1, 1], "float32"], {}], "config": {"index": 355791, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 32]], ["tile_y", "sp", [-1, 8, 2]], ["tile_x", "sp", [-1, 1, 4]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 1500], ["unroll_explicit", "ot", 0]]}, "result": [[0.00325700608], 0, 87.11975407600403, 1690589062.8006861], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 1024, 13, 13], "float32"], ["TENSOR", [512, 1024, 1, 1], "float32"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 72543, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 8]], ["tile_y", "sp", [-1, 8, 2]], ["tile_x", "sp", [-1, 1, 8]], ["tile_rcc", "sp", [-1, 128]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 512], ["unroll_explicit", "ot", 0]]}, "result": [[0.00044862464000000005], 0, 14.508693933486938, 1690598651.426668], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 512, 13, 13], "float32"], ["TENSOR", [1024, 512, 3, 3], "float32"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 610384, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 8]], ["tile_y", "sp", [-1, 1, 16]], ["tile_x", "sp", [-1, 8, 2]], ["tile_rcc", "sp", [-1, 16]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.0033044172799999998], 0, 9.12758994102478, 1690608888.185184], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 512, 13, 13], "float32"], ["TENSOR", [1024, 512, 3, 3], "float32"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 1624, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 4], ["tile_y", "sp", [-1, 1, 64]], ["tile_x", "sp", [-1, 7, 1]], ["tile_rc", "sp", [-1, 8]]]}, "result": [[0.00401268736], 0, 16.535113096237183, 1690610263.636968], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 512, 13, 13], "float32"], ["TENSOR", [256, 512, 1, 1], "float32"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 74227, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 16]], ["tile_y", "sp", [-1, 8, 2]], ["tile_x", "sp", [-1, 1, 1]], ["tile_rcc", "sp", [-1, 32]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 1500], ["unroll_explicit", "ot", 0]]}, "result": [[0.00016873984], 0, 15.364300727844238, 1690615913.6174998], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 768, 26, 26], "float32"], ["TENSOR", [256, 768, 1, 1], "float32"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 36970, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 32]], ["tile_y", "sp", [-1, 1, 7]], ["tile_x", "sp", [-1, 7, 2]], ["tile_rcc", "sp", [-1, 48]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 0]]}, "result": [[0.00058591232], 0, 76.40829110145569, 1690621487.1020281], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 26, 26], "float32"], ["TENSOR", [128, 256, 1, 1], "float32"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 35107, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 8]], ["tile_y", "sp", [-1, 2, 1]], ["tile_x", "sp", [-1, 4, 7]], ["tile_rcc", "sp", [-1, 32]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 512], ["unroll_explicit", "ot", 0]]}, "result": [[0.00014014976], 0, 21.095643281936646, 1690628131.7152262], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 384, 52, 52], "float32"], ["TENSOR", [128, 384, 1, 1], "float32"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 22580, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 16]], ["tile_y", "sp", [-1, 2, 1]], ["tile_x", "sp", [-1, 4, 13]], ["tile_rcc", "sp", [-1, 16]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 512], ["unroll_explicit", "ot", 0]]}, "result": [[0.0008935526400000001], 0, 24.156691074371338, 1690631711.464622], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 52, 52], "float32"], ["TENSOR", [255, 256, 3, 3], "float32"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 103389, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 32]], ["tile_y", "sp", [-1, 2, 1]], ["tile_x", "sp", [-1, 4, 13]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 1500], ["unroll_explicit", "ot", 0]]}, "result": [[0.0049573785600000005], 0, 50.42989492416382, 1690635167.561766], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 256, 52, 52], "float32"], ["TENSOR", [255, 256, 3, 3], "float32"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 2984, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 16], ["tile_y", "sp", [-1, 1, 16]], ["tile_x", "sp", [-1, 5, 5]], ["tile_rc", "sp", [-1, 64]]]}, "result": [[0.0082428928], 0, 37.08215117454529, 1690640190.431162], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 512, 26, 26], "float32"], ["TENSOR", [255, 512, 3, 3], "float32"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 497615, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 4]], ["tile_y", "sp", [-1, 2, 2]], ["tile_x", "sp", [-1, 3, 8]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 512], ["unroll_explicit", "ot", 0]]}, "result": [[0.0018803609599999998], 0, 64.11218452453613, 1690648223.607679], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 512, 26, 26], "float32"], ["TENSOR", [255, 512, 3, 3], "float32"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 17988, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 0], ["tile_y", "sp", [-1, 4, 16]], ["tile_x", "sp", [-1, 6, 4]], ["tile_rc", "sp", [-1, 64]]]}, "result": [[0.0019487436799999998], 0, 15.87750792503357, 1690656292.635991], "version": 0.2, "tvm_version": "0.13.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 1024, 13, 13], "float32"], ["TENSOR", [255, 1024, 1, 1], "float32"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 23013, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 8]], ["tile_y", "sp", [-1, 1, 2]], ["tile_x", "sp", [-1, 8, 2]], ["tile_rcc", "sp", [-1, 64]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 0]]}, "result": [[0.00032522751999999996], 0, 15.912687063217163, 1690658895.1638908], "version": 0.2, "tvm_version": "0.13.dev0"}