forked from octoml/qualcomm
-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathonnx_faster_rcnn.float16.acc32.autotvm.log
40 lines (40 loc) · 30 KB
/
onnx_faster_rcnn.float16.acc32.autotvm.log
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 3, 1200, 1200], "float16"], ["TENSOR", [64, 3, 7, 7], "float16"], [2, 2], [3, 3, 3, 3], [1, 1], "float32"], {}], "config": {"index": 399947, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 8]], ["tile_y", "sp", [-1, 4, 2]], ["tile_x", "sp", [-1, 2, 4]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 7]], ["tile_rx", "sp", [-1, 7]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.012531138559999998], 0, 117.355792760849, 1690808725.9362528], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 3, 800, 800], "float16"], ["TENSOR", [64, 3, 7, 7], "float16"], [2, 2], [3, 3, 3, 3], [1, 1], "float32"], {}], "config": {"index": 115485, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 4]], ["tile_y", "sp", [-1, 2, 2]], ["tile_x", "sp", [-1, 5, 8]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 7]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.005417922559999999], 0, 81.05212998390198, 1690829942.689881], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 64, 200, 200], "float16"], ["TENSOR", [64, 64, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 52059, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 16]], ["tile_y", "sp", [-1, 4, 2]], ["tile_x", "sp", [-1, 1, 10]], ["tile_rcc", "sp", [-1, 16]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 512], ["unroll_explicit", "ot", 0]]}, "result": [[0.0010156032000000002], 0, 61.683496952056885, 1690841219.386687], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 64, 200, 200], "float16"], ["TENSOR", [64, 64, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 1799, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 16], ["tile_y", "sp", [-1, 1, 16]], ["tile_x", "sp", [-1, 5, 4]], ["tile_rc", "sp", [-1, 4]]]}, "result": [[1000000000.0], 6, 15, 1690852842.11992], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 64, 200, 200], "float16"], ["TENSOR", [256, 64, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 91330, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 32]], ["tile_y", "sp", [-1, 2, 5]], ["tile_x", "sp", [-1, 2, 5]], ["tile_rcc", "sp", [-1, 16]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 512], ["unroll_explicit", "ot", 0]]}, "result": [[0.0031435417599999997], 0, 48.588428258895874, 1690859340.690151], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 200, 200], "float16"], ["TENSOR", [128, 256, 1, 1], "float16"], [2, 2], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 23365, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 32]], ["tile_y", "sp", [-1, 1, 2]], ["tile_x", "sp", [-1, 5, 4]], ["tile_rcc", "sp", [-1, 64]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 0]]}, "result": [[0.00260593152], 0, 7.822289228439331, 1690866014.0500422], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 128, 100, 100], "float16"], ["TENSOR", [512, 128, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 27910, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 4, 16]], ["tile_y", "sp", [-1, 1, 2]], ["tile_x", "sp", [-1, 5, 10]], ["tile_rcc", "sp", [-1, 16]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 0]]}, "result": [[0.00244603392], 0, 76.52547597885132, 1690879664.086293], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 200, 200], "float16"], ["TENSOR", [512, 256, 1, 1], "float16"], [2, 2], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 148344, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 64]], ["tile_y", "sp", [-1, 5, 2]], ["tile_x", "sp", [-1, 2, 2]], ["tile_rcc", "sp", [-1, 32]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.0054083225600000005], 0, 48.775254249572754, 1690884011.084386], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 512, 100, 100], "float16"], ["TENSOR", [128, 512, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 37530, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 4, 8]], ["tile_y", "sp", [-1, 5, 4]], ["tile_x", "sp", [-1, 1, 4]], ["tile_rcc", "sp", [-1, 4]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 512], ["unroll_explicit", "ot", 0]]}, "result": [[0.0028484505599999997], 0, 7.470408916473389, 1690898606.335825], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 512, 100, 100], "float16"], ["TENSOR", [256, 512, 1, 1], "float16"], [2, 2], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 22604, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 4, 16]], ["tile_y", "sp", [-1, 2, 2]], ["tile_x", "sp", [-1, 2, 2]], ["tile_rcc", "sp", [-1, 128]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 512], ["unroll_explicit", "ot", 0]]}, "result": [[0.0018066380799999998], 0, 96.34204006195068, 1690903197.804775], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 50, 50], "float16"], ["TENSOR", [1024, 256, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 42189, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 4, 16]], ["tile_y", "sp", [-1, 2, 2]], ["tile_x", "sp", [-1, 2, 13]], ["tile_rcc", "sp", [-1, 64]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 1500], ["unroll_explicit", "ot", 0]]}, "result": [[0.00215273472], 0, 39.23888278007507, 1690922252.465035], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 512, 100, 100], "float16"], ["TENSOR", [1024, 512, 1, 1], "float16"], [2, 2], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 32021, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 64]], ["tile_y", "sp", [-1, 4, 1]], ["tile_x", "sp", [-1, 2, 13]], ["tile_rcc", "sp", [-1, 128]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 512], ["unroll_explicit", "ot", 0]]}, "result": [[0.005327749119999999], 0, 63.85982418060303, 1690924800.66927], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 1024, 50, 50], "float16"], ["TENSOR", [256, 1024, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 31352, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 4, 16]], ["tile_y", "sp", [-1, 2, 2]], ["tile_x", "sp", [-1, 2, 2]], ["tile_rcc", "sp", [-1, 8]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 1500], ["unroll_explicit", "ot", 0]]}, "result": [[0.0027207935999999998], 0, 38.93503499031067, 1690931724.929806], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 1024, 50, 50], "float16"], ["TENSOR", [512, 1024, 1, 1], "float16"], [2, 2], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 145715, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 8]], ["tile_y", "sp", [-1, 2, 1]], ["tile_x", "sp", [-1, 4, 7]], ["tile_rcc", "sp", [-1, 64]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.0016177715200000001], 0, 7.785043954849243, 1690937002.49911], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 512, 25, 25], "float16"], ["TENSOR", [512, 512, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 532386, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 8]], ["tile_y", "sp", [-1, 1, 4]], ["tile_x", "sp", [-1, 7, 2]], ["tile_rcc", "sp", [-1, 8]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.00465138176], 0, 61.261369943618774, 1690945307.137028], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 512, 25, 25], "float16"], ["TENSOR", [512, 512, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 1565, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 16], ["tile_y", "sp", [-1, 2, 64]], ["tile_x", "sp", [-1, 13, 1]], ["tile_rc", "sp", [-1, 16]]]}, "result": [[0.0036266752000000003], 0, 25.54634380340576, 1690947608.80124], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 512, 25, 25], "float16"], ["TENSOR", [2048, 512, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 125641, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 4, 8]], ["tile_y", "sp", [-1, 2, 2]], ["tile_x", "sp", [-1, 2, 7]], ["tile_rcc", "sp", [-1, 128]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 1500], ["unroll_explicit", "ot", 0]]}, "result": [[0.00264667136], 0, 55.753520011901855, 1690955879.572128], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 1024, 50, 50], "float16"], ["TENSOR", [2048, 1024, 1, 1], "float16"], [2, 2], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 47295, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 4, 32]], ["tile_y", "sp", [-1, 2, 1]], ["tile_x", "sp", [-1, 2, 14]], ["tile_rcc", "sp", [-1, 256]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 0]]}, "result": [[0.005655055359999999], 0, 59.887123107910156, 1690962316.2670138], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 2048, 25, 25], "float16"], ["TENSOR", [512, 2048, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 237764, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 4, 8]], ["tile_y", "sp", [-1, 2, 14]], ["tile_x", "sp", [-1, 2, 1]], ["tile_rcc", "sp", [-1, 32]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 1500], ["unroll_explicit", "ot", 1]]}, "result": [[0.00305049088], 0, 56.29743003845215, 1690965935.712203], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 2048, 25, 25], "float16"], ["TENSOR", [256, 2048, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 127996, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 32]], ["tile_y", "sp", [-1, 1, 14]], ["tile_x", "sp", [-1, 7, 1]], ["tile_rcc", "sp", [-1, 64]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.0016343500800000002], 0, 66.79692101478577, 1690974745.60696], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 512, 100, 100], "float16"], ["TENSOR", [256, 512, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 139804, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 32]], ["tile_y", "sp", [-1, 5, 2]], ["tile_x", "sp", [-1, 2, 2]], ["tile_rcc", "sp", [-1, 64]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.00463796224], 0, 88.1339602470398, 1690982035.237529], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 200, 200], "float16"], ["TENSOR", [256, 256, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 126064, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 4, 8]], ["tile_y", "sp", [-1, 5, 4]], ["tile_x", "sp", [-1, 1, 2]], ["tile_rcc", "sp", [-1, 64]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 512], ["unroll_explicit", "ot", 0]]}, "result": [[0.010390215679999999], 0, 8.813768148422241, 1690994387.078926], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 256, 100, 100], "float16"], ["TENSOR", [256, 256, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 8096, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 16], ["tile_y", "sp", [-1, 2, 32]], ["tile_x", "sp", [-1, 5, 4]], ["tile_rc", "sp", [-1, 64]]]}, "result": [[0.01353478144], 0, 18.41515588760376, 1691008839.2957299], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 25, 25], "float16"], ["TENSOR", [256, 256, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 345900, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 16]], ["tile_y", "sp", [-1, 7, 4]], ["tile_x", "sp", [-1, 1, 1]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.0012570931199999999], 0, 71.55911087989807, 1691027397.61183], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 256, 25, 25], "float16"], ["TENSOR", [256, 256, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 147, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 0], ["tile_y", "sp", [-1, 1, 64]], ["tile_x", "sp", [-1, 13, 1]], ["tile_rc", "sp", [-1, 1]]]}, "result": [[1000000000.0], 6, 15, 1691030731.461725], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 13, 13], "float16"], ["TENSOR", [256, 256, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 322964, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 8]], ["tile_y", "sp", [-1, 1, 4]], ["tile_x", "sp", [-1, 8, 2]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.00045295616000000003], 0, 22.340291023254395, 1691039159.1600928], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 256, 13, 13], "float16"], ["TENSOR", [256, 256, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 1028, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 16], ["tile_y", "sp", [-1, 4, 8]], ["tile_x", "sp", [-1, 7, 7]], ["tile_rc", "sp", [-1, 4]]]}, "result": [[1000000000.0], 6, 15, 1691042119.17616], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 50, 50], "float16"], ["TENSOR", [256, 256, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 134058, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 16]], ["tile_y", "sp", [-1, 2, 2]], ["tile_x", "sp", [-1, 4, 13]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.0042351104], 0, 16.482624530792236, 1691057614.3114948], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 256, 50, 50], "float16"], ["TENSOR", [256, 256, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 2538, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 0], ["tile_y", "sp", [-1, 4, 16]], ["tile_x", "sp", [-1, 5, 5]], ["tile_rc", "sp", [-1, 32]]]}, "result": [[0.0055552358400000005], 0, 87.85729908943176, 1691075334.409717], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 100, 100], "float16"], ["TENSOR", [256, 256, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 421737, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 32]], ["tile_y", "sp", [-1, 2, 2]], ["tile_x", "sp", [-1, 5, 4]], ["tile_rcc", "sp", [-1, 1]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.01381415936], 0, 11.902816772460938, 1691086522.219925], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 200, 200], "float16"], ["TENSOR", [256, 256, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 1061239, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 2, 16]], ["tile_y", "sp", [-1, 5, 2]], ["tile_x", "sp", [-1, 2, 4]], ["tile_rcc", "sp", [-1, 64]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.05619669504], 0, 80.3374400138855, 1691106234.012202], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 13, 13], "float16"], ["TENSOR", [12, 256, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 14082, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 1]], ["tile_y", "sp", [-1, 1, 2]], ["tile_x", "sp", [-1, 1, 16]], ["tile_rcc", "sp", [-1, 4]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[3.487232e-05], 0, 21.557316780090332, 1691111243.9526248], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 25, 25], "float16"], ["TENSOR", [12, 256, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 14049, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 1]], ["tile_y", "sp", [-1, 1, 4]], ["tile_x", "sp", [-1, 1, 14]], ["tile_rcc", "sp", [-1, 4]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[4.687871999999999e-05], 0, 5.870274066925049, 1691115639.4748101], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 50, 50], "float16"], ["TENSOR", [12, 256, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 7265, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 3]], ["tile_y", "sp", [-1, 1, 1]], ["tile_x", "sp", [-1, 4, 13]], ["tile_rcc", "sp", [-1, 2]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 512], ["unroll_explicit", "ot", 1]]}, "result": [[0.00011686400000000001], 0, 20.78677797317505, 1691117394.260454], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 100, 100], "float16"], ["TENSOR", [12, 256, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 31409, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 3]], ["tile_y", "sp", [-1, 2, 2]], ["tile_x", "sp", [-1, 2, 10]], ["tile_rcc", "sp", [-1, 32]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 1500], ["unroll_explicit", "ot", 1]]}, "result": [[0.00045357568], 0, 43.95883107185364, 1691120559.903743], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 256, 200, 200], "float16"], ["TENSOR", [12, 256, 1, 1], "float16"], [1, 1], [0, 0, 0, 0], [1, 1], "float32"], {}], "config": {"index": 46952, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 3]], ["tile_y", "sp", [-1, 2, 4]], ["tile_x", "sp", [-1, 2, 5]], ["tile_rcc", "sp", [-1, 2]], ["tile_ry", "sp", [-1, 1]], ["tile_rx", "sp", [-1, 1]], ["auto_unroll_max_step", "ot", 512], ["unroll_explicit", "ot", 1]]}, "result": [[0.0017081088], 0, 14.853874921798706, 1691123289.654478], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 64, 200, 200], "float16"], ["TENSOR", [64, 64, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 408899, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 16]], ["tile_y", "sp", [-1, 5, 8]], ["tile_x", "sp", [-1, 2, 2]], ["tile_rcc", "sp", [-1, 4]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.00389012992], 0, 6.645724058151245, 1691408575.745703], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchwc.image2d", [["TENSOR", [1, 128, 100, 100], "float16"], ["TENSOR", [128, 128, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 338113, "code_hash": null, "entity": [["tile_fc", "sp", [-1, 1, 32]], ["tile_y", "sp", [-1, 5, 2]], ["tile_x", "sp", [-1, 2, 2]], ["tile_rcc", "sp", [-1, 16]], ["tile_ry", "sp", [-1, 3]], ["tile_rx", "sp", [-1, 3]], ["auto_unroll_max_step", "ot", 0], ["unroll_explicit", "ot", 1]]}, "result": [[0.0036743014399999996], 0, 58.662723779678345, 1691418318.854497], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 128, 100, 100], "float16"], ["TENSOR", [128, 128, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 355, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 4], ["tile_y", "sp", [-1, 2, 16]], ["tile_x", "sp", [-1, 5, 4]], ["tile_rc", "sp", [-1, 1]]]}, "result": [[0.0043690496], 0, 52.75086975097656, 1691421427.373715], "version": 0.2, "tvm_version": "0.14.dev0"}
{"input": ["opencl -keys=adreno,opencl,gpu -device=adreno -max_function_args=128 -max_num_threads=256 -max_shared_memory_per_block=16384 -max_threads_per_block=256 -texture_spatial_limit=16384 -thread_warp_size=1", "conv2d_nchw_winograd.image2d", [["TENSOR", [1, 256, 200, 200], "float16"], ["TENSOR", [256, 256, 3, 3], "float16"], [1, 1], [1, 1, 1, 1], [1, 1], "float32"], {}], "config": {"index": 4123, "code_hash": null, "entity": [["auto_unroll_max_step", "ot", 4], ["tile_y", "sp", [-1, 1, 64]], ["tile_x", "sp", [-1, 5, 2]], ["tile_rc", "sp", [-1, 8]]]}, "result": [[0.03937955328], 0, 19.30817675590515, 1691433103.8666408], "version": 0.2, "tvm_version": "0.14.dev0"}