From 102b9b44039beed13ce48a8d6aea04403804a2d9 Mon Sep 17 00:00:00 2001 From: Thierry Moreau Date: Mon, 29 Jul 2019 22:16:01 -0700 Subject: [PATCH] batch vta schedules --- tophub/vta_v0.06.log | 11 +++++++++++ 1 file changed, 11 insertions(+) diff --git a/tophub/vta_v0.06.log b/tophub/vta_v0.06.log index f60fd14..be65b41 100644 --- a/tophub/vta_v0.06.log +++ b/tophub/vta_v0.06.log @@ -9,5 +9,16 @@ {"i": ["ext_dev -device=vta -keys=cpu -model=pynq_1x16_i8w8a32_15_15_18_17", "topi_nn_conv2d", [["TENSOR", [1, 4, 56, 56, 1, 16], "int8"], ["TENSOR", [8, 4, 1, 1, 16, 16], "int8"], [2, 2], [0, 0], [1, 1], "NCHW1n16c", "int32"], {}, ["conv2d", [1, 4, 56, 56, 1, 16, "int8"], [8, 4, 1, 1, 16, 16, "int8"], [2, 2], [0, 0], [1, 1], "NCHW1n16c", "int32"], {"i": 1113, "e": [["tile_b", "sp", [1, 1]], ["tile_h", "sp", [4, 7]], ["tile_w", "sp", [1, 28]], ["tile_ci", "sp", [4, 1]], ["tile_co", "sp", [2, 4]], ["oc_nthread", "ot", 1], ["h_nthread", "ot", 2]], "c": null, "t": "direct"}], "v": 0.1, "r": [[0.0013487228], 0, 7.647406816482544, 1562814719.0447638]} {"i": ["ext_dev -device=vta -keys=cpu -model=pynq_1x16_i8w8a32_15_15_18_17", "topi_nn_conv2d", [["TENSOR", [1, 8, 28, 28, 1, 16], "int8"], ["TENSOR", [16, 8, 1, 1, 16, 16], "int8"], [2, 2], [0, 0], [1, 1], "NCHW1n16c", "int32"], {}, ["conv2d", [1, 8, 28, 28, 1, 16, "int8"], [16, 8, 1, 1, 16, 16, "int8"], [2, 2], [0, 0], [1, 1], "NCHW1n16c", "int32"], {"i": 526, "e": [["tile_b", "sp", [1, 1]], ["tile_h", "sp", [2, 7]], ["tile_w", "sp", [1, 14]], ["tile_ci", "sp", [8, 1]], ["tile_co", "sp", [2, 8]], ["oc_nthread", "ot", 2], ["h_nthread", "ot", 1]], "c": null, "t": "direct"}], "v": 0.1, "r": [[0.0010287707999999999], 0, 7.80133843421936, 1562815291.6689675]} {"i": ["ext_dev -device=vta -keys=cpu -model=pynq_1x16_i8w8a32_15_15_18_17", "topi_nn_conv2d", [["TENSOR", [1, 16, 14, 14, 1, 16], "int8"], ["TENSOR", [32, 16, 1, 1, 16, 16], "int8"], [2, 2], [0, 0], [1, 1], "NCHW1n16c", "int32"], {}, ["conv2d", [1, 16, 14, 14, 1, 16, "int8"], [32, 16, 1, 1, 16, 16, "int8"], [2, 2], [0, 0], [1, 1], "NCHW1n16c", "int32"], {"i": 203, "e": [["tile_b", "sp", [1, 1]], ["tile_h", "sp", [1, 7]], ["tile_w", "sp", [1, 7]], ["tile_ci", "sp", [16, 1]], ["tile_co", "sp", [2, 16]], ["oc_nthread", "ot", 2], ["h_nthread", "ot", 1]], "c": null, "t": "direct"}], "v": 0.1, "r": [[0.0010809022], 0, 8.027522563934326, 1562816721.1013265]} +# Resnet-18 - pynq_4x8_i8w8a32_15_16_16_18 +{"r": [[0.0213515438], 0, 8.106715679168701, 1564446226.7772598], "i": ["ext_dev -device=vta -keys=cpu -model=pynq_4x8_i8w8a32_15_16_16_18", "conv2d", [4, 64, 56, 56, 64, 3, 3, [1, 1], [1, 1], [1, 1], "int8", "int32"], {}, ["conv2d", [1, 8, 56, 56, 4, 8, "int8"], [8, 8, 3, 3, 8, 8, "int8"], [1, 1], [1, 1], [1, 1], "NCHW4n8c", "int32"], {"t": "direct", "c": null, "e": [["tile_b", "sp", [1, 1]], ["tile_h", "sp", [28, 2]], ["tile_w", "sp", [1, 56]], ["tile_ci", "sp", [8, 1]], ["tile_co", "sp", [1, 8]], ["oc_nthread", "ot", 1], ["h_nthread", "ot", 2]], "i": 2873}], "v": 0.1} +{"r": [[0.011107803400000001], 0, 8.049933910369873, 1564446582.3308542], "i": ["ext_dev -device=vta -keys=cpu -model=pynq_4x8_i8w8a32_15_16_16_18", "conv2d", [4, 64, 56, 56, 128, 3, 3, [2, 2], [1, 1], [1, 1], "int8", "int32"], {}, ["conv2d", [1, 8, 56, 56, 4, 8, "int8"], [16, 8, 3, 3, 8, 8, "int8"], [2, 2], [1, 1], [1, 1], "NCHW4n8c", "int32"], {"t": "direct", "c": null, "e": [["tile_b", "sp", [1, 1]], ["tile_h", "sp", [4, 7]], ["tile_w", "sp", [1, 28]], ["tile_ci", "sp", [8, 1]], ["tile_co", "sp", [4, 4]], ["oc_nthread", "ot", 2], ["h_nthread", "ot", 1]], "i": 1041}], "v": 0.1} +{"r": [[0.0028389246], 0, 7.821471214294434, 1564447111.1809626], "i": ["ext_dev -device=vta -keys=cpu -model=pynq_4x8_i8w8a32_15_16_16_18", "conv2d", [4, 64, 56, 56, 128, 1, 1, [2, 2], [0, 0], [1, 1], "int8", "int32"], {}, ["conv2d", [1, 8, 56, 56, 4, 8, "int8"], [16, 8, 1, 1, 8, 8, "int8"], [2, 2], [0, 0], [1, 1], "NCHW4n8c", "int32"], {"t": "direct", "c": null, "e": [["tile_b", "sp", [1, 1]], ["tile_h", "sp", [28, 1]], ["tile_w", "sp", [1, 28]], ["tile_ci", "sp", [1, 8]], ["tile_co", "sp", [1, 16]], ["oc_nthread", "ot", 1], ["h_nthread", "ot", 2]], "i": 2154}], "v": 0.1} +{"r": [[0.0199354676], 0, 7.8180694580078125, 1564447409.5572493], "i": ["ext_dev -device=vta -keys=cpu -model=pynq_4x8_i8w8a32_15_16_16_18", "conv2d", [4, 128, 28, 28, 128, 3, 3, [1, 1], [1, 1], [1, 1], "int8", "int32"], {}, ["conv2d", [1, 16, 28, 28, 4, 8, "int8"], [16, 16, 3, 3, 8, 8, "int8"], [1, 1], [1, 1], [1, 1], "NCHW4n8c", "int32"], {"t": "direct", "c": null, "e": [["tile_b", "sp", [1, 1]], ["tile_h", "sp", [14, 2]], ["tile_w", "sp", [1, 28]], ["tile_ci", "sp", [16, 1]], ["tile_co", "sp", [1, 16]], ["oc_nthread", "ot", 1], ["h_nthread", "ot", 2]], "i": 2551}], "v": 0.1} +{"r": [[0.0100571334], 0, 7.83553671836853, 1564447896.8268821], "i": ["ext_dev -device=vta -keys=cpu -model=pynq_4x8_i8w8a32_15_16_16_18", "conv2d", [4, 128, 28, 28, 256, 3, 3, [2, 2], [1, 1], [1, 1], "int8", "int32"], {}, ["conv2d", [1, 16, 28, 28, 4, 8, "int8"], [32, 16, 3, 3, 8, 8, "int8"], [2, 2], [1, 1], [1, 1], "NCHW4n8c", "int32"], {"t": "direct", "c": null, "e": [["tile_b", "sp", [1, 1]], ["tile_h", "sp", [2, 7]], ["tile_w", "sp", [1, 14]], ["tile_ci", "sp", [16, 1]], ["tile_co", "sp", [4, 8]], ["oc_nthread", "ot", 1], ["h_nthread", "ot", 2]], "i": 1214}], "v": 0.1} +{"r": [[0.0021991859999999997], 0, 7.632226943969727, 1564448677.6960063], "i": ["ext_dev -device=vta -keys=cpu -model=pynq_4x8_i8w8a32_15_16_16_18", "conv2d", [4, 128, 28, 28, 256, 1, 1, [2, 2], [0, 0], [1, 1], "int8", "int32"], {}, ["conv2d", [1, 16, 28, 28, 4, 8, "int8"], [32, 16, 1, 1, 8, 8, "int8"], [2, 2], [0, 0], [1, 1], "NCHW4n8c", "int32"], {"t": "direct", "c": null, "e": [["tile_b", "sp", [1, 1]], ["tile_h", "sp", [14, 1]], ["tile_w", "sp", [1, 14]], ["tile_ci", "sp", [1, 16]], ["tile_co", "sp", [1, 32]], ["oc_nthread", "ot", 1], ["h_nthread", "ot", 2]], "i": 1436}], "v": 0.1} +{"r": [[0.0192200492], 0, 8.020992279052734, 1564449175.1251886], "i": ["ext_dev -device=vta -keys=cpu -model=pynq_4x8_i8w8a32_15_16_16_18", "conv2d", [4, 256, 14, 14, 256, 3, 3, [1, 1], [1, 1], [1, 1], "int8", "int32"], {}, ["conv2d", [1, 32, 14, 14, 4, 8, "int8"], [32, 32, 3, 3, 8, 8, "int8"], [1, 1], [1, 1], [1, 1], "NCHW4n8c", "int32"], {"t": "direct", "c": null, "e": [["tile_b", "sp", [1, 1]], ["tile_h", "sp", [1, 14]], ["tile_w", "sp", [1, 14]], ["tile_ci", "sp", [32, 1]], ["tile_co", "sp", [8, 4]], ["oc_nthread", "ot", 2], ["h_nthread", "ot", 1]], "i": 783}], "v": 0.1} +{"r": [[0.0096910504], 0, 7.9031407833099365, 1564449491.4272587], "i": ["ext_dev -device=vta -keys=cpu -model=pynq_4x8_i8w8a32_15_16_16_18", "conv2d", [4, 256, 14, 14, 512, 3, 3, [2, 2], [1, 1], [1, 1], "int8", "int32"], {}, ["conv2d", [1, 32, 14, 14, 4, 8, "int8"], [64, 32, 3, 3, 8, 8, "int8"], [2, 2], [1, 1], [1, 1], "NCHW4n8c", "int32"], {"t": "direct", "c": null, "e": [["tile_b", "sp", [1, 1]], ["tile_h", "sp", [1, 7]], ["tile_w", "sp", [1, 7]], ["tile_ci", "sp", [32, 1]], ["tile_co", "sp", [4, 16]], ["oc_nthread", "ot", 2], ["h_nthread", "ot", 1]], "i": 267}], "v": 0.1} +{"r": [[0.002754953], 0, 7.411137580871582, 1564449689.4525118], "i": ["ext_dev -device=vta -keys=cpu -model=pynq_4x8_i8w8a32_15_16_16_18", "conv2d", [4, 256, 14, 14, 512, 1, 1, [2, 2], [0, 0], [1, 1], "int8", "int32"], {}, ["conv2d", [1, 32, 14, 14, 4, 8, "int8"], [64, 32, 1, 1, 8, 8, "int8"], [2, 2], [0, 0], [1, 1], "NCHW4n8c", "int32"], {"t": "direct", "c": null, "e": [["tile_b", "sp", [1, 1]], ["tile_h", "sp", [7, 1]], ["tile_w", "sp", [1, 7]], ["tile_ci", "sp", [2, 16]], ["tile_co", "sp", [2, 32]], ["oc_nthread", "ot", 2], ["h_nthread", "ot", 1]], "i": 306}], "v": 0.1} +{"r": [[0.018922625800000002], 0, 8.592109680175781, 1564450414.7716956], "i": ["ext_dev -device=vta -keys=cpu -model=pynq_4x8_i8w8a32_15_16_16_18", "conv2d", [4, 512, 7, 7, 512, 3, 3, [1, 1], [1, 1], [1, 1], "int8", "int32"], {}, ["conv2d", [1, 64, 7, 7, 4, 8, "int8"], [64, 64, 3, 3, 8, 8, "int8"], [1, 1], [1, 1], [1, 1], "NCHW4n8c", "int32"], {"t": "direct", "c": null, "e": [["tile_b", "sp", [1, 1]], ["tile_h", "sp", [1, 7]], ["tile_w", "sp", [1, 7]], ["tile_ci", "sp", [64, 1]], ["tile_co", "sp", [4, 16]], ["oc_nthread", "ot", 2], ["h_nthread", "ot", 1]], "i": 311}], "v": 0.1} # Resnet-18 layer 0 - arm_cpu {"i": ["llvm -device=arm_cpu -model=pynq, -target=armv7a-linux-eabi", "topi_nn_conv2d", [["TENSOR", [1, 3, 224, 224], "int8"], ["TENSOR", [64, 3, 7, 7], "int8"], [2, 2], [3, 3], [1, 1], "NCHW", "int32"], {}, ["conv2d", [1, 3, 224, 224, "int8"], [64, 3, 7, 7, "int8"], [2, 2], [3, 3], [1, 1], "NCHW", "int32"], {"i": 72880, "c": null, "e": [["tile_co", "sp", [8, 4]], ["tile_oh", "sp", [56, 1]], ["tile_ow", "sp", [56, 8]], ["reorder_0", "re", [0, 1, 2, 3, 4, 5, 6, 7, 8, 9]], ["ann_reduce", "an", ["none", "none"]], ["ann_spatial", "an", ["unroll", "unroll", "vec"]]], "t": "direct"}], "r": [[0.105920721], 0, 0.729074239730835, 1533135908.2729535], "v": 0.1}