Skip to content

Instantly share code, notes, and snippets.

@yzhliu
Created November 2, 2018 03:37
Show Gist options
  • Save yzhliu/c287798592f7568c6e624b33727576a5 to your computer and use it in GitHub Desktop.
Save yzhliu/c287798592f7568c6e624b33727576a5 to your computer and use it in GitHub Desktop.
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_conv2d", [["TENSOR", [1, 1024, 7, 7], "float32"], ["TENSOR", [1024, 1024, 1, 1], "float32"], [1, 1], [0, 0], "NCHW", "float32"], {}, ["conv2d", [1, 1024, 7, 7, "float32"], [1024, 1024, 1, 1, "float32"], [1, 1], [0, 0], "NCHW", "float32"], {"i": 416, "c": null, "e": [["tile_ic", "sp", [2, 512]], ["tile_oc", "sp", [64, 16]], ["tile_ow", "sp", [1, 7]], ["tile_oh", "ot", 2]], "t": "direct"}], "r": [[0.0012855558738853504], 0, 1.3173747062683105, 1541097220.10334], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_depthwise_conv2d_nchw", [["TENSOR", [1, 1024, 7, 7], "float32"], ["TENSOR", [1024, 1, 3, 3], "float32"], [1, 1], [1, 1], "float32"], {}, ["depthwise_conv2d_nchw", [1, 1024, 7, 7, "float32"], [1024, 1, 3, 3, "float32"], [1, 1], [1, 1], "float32"], {"i": 354673, "c": null, "e": [["tile_co", "sp", [1024, 1]], ["tile_oh", "sp", [1, 7]], ["tile_ow", "sp", [1, 7]], ["reorder_0", "re", [0, 1, 2, 3, 4, 5, 6, 7, 8]], ["reorder_1", "re", [0, 1, 2, 3, 6, 4, 5]], ["ann_reduce", "an", ["unroll", "unroll"]], ["ann_spatial", "an", ["unroll", "vec", "unroll"]], ["data_pad_inline", "ot", 1], ["data_vec_inline", "ot", 3], ["conv_inline", "ot", 0]], "t": "direct"}], "r": [[6.834159044951495e-05], 0, 1.2607789039611816, 1541099813.971948], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_conv2d", [["TENSOR", [1, 512, 7, 7], "float32"], ["TENSOR", [1024, 512, 1, 1], "float32"], [1, 1], [0, 0], "NCHW", "float32"], {}, ["conv2d", [1, 512, 7, 7, "float32"], [1024, 512, 1, 1, "float32"], [1, 1], [0, 0], "NCHW", "float32"], {"i": 379, "c": null, "e": [["tile_ic", "sp", [1, 512]], ["tile_oc", "sp", [64, 16]], ["tile_ow", "sp", [1, 7]], ["tile_oh", "ot", 2]], "t": "direct"}], "r": [[0.000638318708596713], 0, 1.32138991355896, 1541101002.158124], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_depthwise_conv2d_nchw", [["TENSOR", [1, 512, 14, 14], "float32"], ["TENSOR", [512, 1, 3, 3], "float32"], [2, 2], [1, 1], "float32"], {}, ["depthwise_conv2d_nchw", [1, 512, 14, 14, "float32"], [512, 1, 3, 3, "float32"], [2, 2], [1, 1], "float32"], {"i": 212080, "c": null, "e": [["tile_co", "sp", [512, 1]], ["tile_oh", "sp", [7, 1]], ["tile_ow", "sp", [7, 1]], ["reorder_0", "re", [0, 1, 2, 3, 4, 5, 6, 7, 8]], ["reorder_1", "re", [0, 1, 2, 3, 4, 6, 5]], ["ann_reduce", "an", ["unroll", "unroll"]], ["ann_spatial", "an", ["none", "none", "none"]], ["data_pad_inline", "ot", 1], ["data_vec_inline", "ot", 2], ["conv_inline", "ot", 0]], "t": "direct"}], "r": [[7.075995428531054e-05], 0, 1.2892718315124512, 1541103787.705293], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_conv2d", [["TENSOR", [1, 512, 14, 14], "float32"], ["TENSOR", [512, 512, 1, 1], "float32"], [1, 1], [0, 0], "NCHW", "float32"], {}, ["conv2d", [1, 512, 14, 14, "float32"], [512, 512, 1, 1, "float32"], [1, 1], [0, 0], "NCHW", "float32"], {"i": 748, "c": null, "e": [["tile_ic", "sp", [2, 256]], ["tile_oc", "sp", [32, 16]], ["tile_ow", "sp", [1, 14]], ["tile_oh", "ot", 2]], "t": "direct"}], "r": [[0.000885081691696113], 0, 1.3590340614318848, 1541104373.547855], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_depthwise_conv2d_nchw", [["TENSOR", [1, 512, 14, 14], "float32"], ["TENSOR", [512, 1, 3, 3], "float32"], [1, 1], [1, 1], "float32"], {}, ["depthwise_conv2d_nchw", [1, 512, 14, 14, "float32"], [512, 1, 3, 3, "float32"], [1, 1], [1, 1], "float32"], {"i": 537410, "c": null, "e": [["tile_co", "sp", [512, 1]], ["tile_oh", "sp", [7, 2]], ["tile_ow", "sp", [1, 14]], ["reorder_0", "re", [0, 1, 2, 3, 4, 5, 6, 7, 8]], ["reorder_1", "re", [0, 1, 2, 3, 4, 6, 5]], ["ann_reduce", "an", ["unroll", "unroll"]], ["ann_spatial", "an", ["vec", "unroll", "unroll"]], ["data_pad_inline", "ot", 1], ["data_vec_inline", "ot", 1], ["conv_inline", "ot", 0]], "t": "direct"}], "r": [[0.0001803038339906777], 0, 1.6480019092559814, 1541106442.294467], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_conv2d", [["TENSOR", [1, 256, 14, 14], "float32"], ["TENSOR", [512, 256, 1, 1], "float32"], [1, 1], [0, 0], "NCHW", "float32"], {}, ["conv2d", [1, 256, 14, 14, "float32"], [512, 256, 1, 1, "float32"], [1, 1], [0, 0], "NCHW", "float32"], {"i": 674, "c": null, "e": [["tile_ic", "sp", [1, 256]], ["tile_oc", "sp", [32, 16]], ["tile_ow", "sp", [1, 14]], ["tile_oh", "ot", 2]], "t": "direct"}], "r": [[0.0004854025510879849], 0, 1.348909854888916, 1541107340.295816], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_depthwise_conv2d_nchw", [["TENSOR", [1, 256, 28, 28], "float32"], ["TENSOR", [256, 1, 3, 3], "float32"], [2, 2], [1, 1], "float32"], {}, ["depthwise_conv2d_nchw", [1, 256, 28, 28, "float32"], [256, 1, 3, 3, "float32"], [2, 2], [1, 1], "float32"], {"i": 815085, "c": null, "e": [["tile_co", "sp", [256, 1]], ["tile_oh", "sp", [7, 2]], ["tile_ow", "sp", [7, 2]], ["reorder_0", "re", [0, 1, 2, 3, 4, 5, 6, 7, 8]], ["reorder_1", "re", [0, 1, 2, 3, 6, 4, 5]], ["ann_reduce", "an", ["unroll", "unroll"]], ["ann_spatial", "an", ["unroll", "vec", "unroll"]], ["data_pad_inline", "ot", 1], ["data_vec_inline", "ot", 2], ["conv_inline", "ot", 0]], "t": "direct"}], "r": [[0.00010908774640209334], 0, 1.2660508155822754, 1541110088.94157], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_conv2d", [["TENSOR", [1, 256, 28, 28], "float32"], ["TENSOR", [256, 256, 1, 1], "float32"], [1, 1], [0, 0], "NCHW", "float32"], {}, ["conv2d", [1, 256, 28, 28, "float32"], [256, 256, 1, 1, "float32"], [1, 1], [0, 0], "NCHW", "float32"], {"i": 219, "c": null, "e": [["tile_ic", "sp", [32, 8]], ["tile_oc", "sp", [4, 64]], ["tile_ow", "sp", [7, 4]], ["tile_oh", "ot", 1]], "t": "direct"}], "r": [[0.0010078490658025922], 0, 1.5808501243591309, 1541110875.83389], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_depthwise_conv2d_nchw", [["TENSOR", [1, 256, 28, 28], "float32"], ["TENSOR", [256, 1, 3, 3], "float32"], [1, 1], [1, 1], "float32"], {}, ["depthwise_conv2d_nchw", [1, 256, 28, 28, "float32"], [256, 1, 3, 3, "float32"], [1, 1], [1, 1], "float32"], {"i": 1865763, "c": null, "e": [["tile_co", "sp", [256, 1]], ["tile_oh", "sp", [14, 2]], ["tile_ow", "sp", [4, 7]], ["reorder_0", "re", [0, 1, 2, 3, 4, 5, 6, 7, 8]], ["reorder_1", "re", [0, 1, 2, 3, 4, 6, 5]], ["ann_reduce", "an", ["unroll", "unroll"]], ["ann_spatial", "an", ["vec", "unroll", "unroll"]], ["data_pad_inline", "ot", 1], ["data_vec_inline", "ot", 2], ["conv_inline", "ot", 0]], "t": "direct"}], "r": [[0.0003885519321249518], 0, 1.3752059936523438, 1541112319.192314], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_conv2d", [["TENSOR", [1, 128, 28, 28], "float32"], ["TENSOR", [256, 128, 1, 1], "float32"], [1, 1], [0, 0], "NCHW", "float32"], {}, ["conv2d", [1, 128, 28, 28, "float32"], [256, 128, 1, 1, "float32"], [1, 1], [0, 0], "NCHW", "float32"], {"i": 261, "c": null, "e": [["tile_ic", "sp", [4, 32]], ["tile_oc", "sp", [8, 32]], ["tile_ow", "sp", [4, 7]], ["tile_oh", "ot", 1]], "t": "direct"}], "r": [[0.0005010874967709885], 0, 1.4124279022216797, 1541112996.942117], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_depthwise_conv2d_nchw", [["TENSOR", [1, 128, 56, 56], "float32"], ["TENSOR", [128, 1, 3, 3], "float32"], [2, 2], [1, 1], "float32"], {}, ["depthwise_conv2d_nchw", [1, 128, 56, 56, "float32"], [128, 1, 3, 3, "float32"], [2, 2], [1, 1], "float32"], {"i": 1598208, "c": null, "e": [["tile_co", "sp", [128, 1]], ["tile_oh", "sp", [28, 1]], ["tile_ow", "sp", [7, 4]], ["reorder_0", "re", [0, 1, 2, 3, 4, 5, 8, 6, 7]], ["reorder_1", "re", [0, 1, 2, 3, 4, 6, 5]], ["ann_reduce", "an", ["none", "none"]], ["ann_spatial", "an", ["unroll", "unroll", "none"]], ["data_pad_inline", "ot", 1], ["data_vec_inline", "ot", 2], ["conv_inline", "ot", 0]], "t": "direct"}], "r": [[0.000214896734719078], 0, 1.2821760177612305, 1541114351.022547], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_conv2d", [["TENSOR", [1, 128, 56, 56], "float32"], ["TENSOR", [128, 128, 1, 1], "float32"], [1, 1], [0, 0], "NCHW", "float32"], {}, ["conv2d", [1, 128, 56, 56, "float32"], [128, 128, 1, 1, "float32"], [1, 1], [0, 0], "NCHW", "float32"], {"i": 179, "c": null, "e": [["tile_ic", "sp", [16, 8]], ["tile_oc", "sp", [2, 64]], ["tile_ow", "sp", [14, 4]], ["tile_oh", "ot", 1]], "t": "direct"}], "r": [[0.0011927223289786223], 0, 1.5646419525146484, 1541115180.410259], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_depthwise_conv2d_nchw", [["TENSOR", [1, 128, 56, 56], "float32"], ["TENSOR", [128, 1, 3, 3], "float32"], [1, 1], [1, 1], "float32"], {}, ["depthwise_conv2d_nchw", [1, 128, 56, 56, "float32"], [128, 1, 3, 3, "float32"], [1, 1], [1, 1], "float32"], {"i": 2885384, "c": null, "e": [["tile_co", "sp", [128, 1]], ["tile_oh", "sp", [28, 2]], ["tile_ow", "sp", [7, 8]], ["reorder_0", "re", [0, 1, 2, 3, 4, 5, 8, 6, 7]], ["reorder_1", "re", [0, 1, 2, 3, 4, 5, 6]], ["ann_reduce", "an", ["unroll", "unroll"]], ["ann_spatial", "an", ["unroll", "vec", "none"]], ["data_pad_inline", "ot", 1], ["data_vec_inline", "ot", 2], ["conv_inline", "ot", 0]], "t": "direct"}], "r": [[0.0007198469814152966], 0, 1.2987592220306396, 1541116461.177921], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_conv2d", [["TENSOR", [1, 64, 56, 56], "float32"], ["TENSOR", [128, 64, 1, 1], "float32"], [1, 1], [0, 0], "NCHW", "float32"], {}, ["conv2d", [1, 64, 56, 56, "float32"], [128, 64, 1, 1, "float32"], [1, 1], [0, 0], "NCHW", "float32"], {"i": 206, "c": null, "e": [["tile_ic", "sp", [8, 8]], ["tile_oc", "sp", [4, 32]], ["tile_ow", "sp", [8, 7]], ["tile_oh", "ot", 1]], "t": "direct"}], "r": [[0.0006921729174001355], 0, 1.4132380485534668, 1541117387.827645], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_depthwise_conv2d_nchw", [["TENSOR", [1, 64, 112, 112], "float32"], ["TENSOR", [64, 1, 3, 3], "float32"], [2, 2], [1, 1], "float32"], {}, ["depthwise_conv2d_nchw", [1, 64, 112, 112, "float32"], [64, 1, 3, 3, "float32"], [2, 2], [1, 1], "float32"], {"i": 2495472, "c": null, "e": [["tile_co", "sp", [64, 1]], ["tile_oh", "sp", [56, 1]], ["tile_ow", "sp", [14, 4]], ["reorder_0", "re", [0, 1, 2, 3, 4, 5, 6, 7, 8]], ["reorder_1", "re", [0, 1, 2, 3, 6, 4, 5]], ["ann_reduce", "an", ["none", "none"]], ["ann_spatial", "an", ["unroll", "unroll", "unroll"]], ["data_pad_inline", "ot", 1], ["data_vec_inline", "ot", 2], ["conv_inline", "ot", 0]], "t": "direct"}], "r": [[0.00044570696675302245], 0, 1.3406379222869873, 1541118966.558775], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_conv2d", [["TENSOR", [1, 32, 112, 112], "float32"], ["TENSOR", [64, 32, 1, 1], "float32"], [1, 1], [0, 0], "NCHW", "float32"], {}, ["conv2d", [1, 32, 112, 112, "float32"], [64, 32, 1, 1, "float32"], [1, 1], [0, 0], "NCHW", "float32"], {"i": 151, "c": null, "e": [["tile_ic", "sp", [16, 2]], ["tile_oc", "sp", [4, 16]], ["tile_ow", "sp", [16, 7]], ["tile_oh", "ot", 1]], "t": "direct"}], "r": [[0.0010983103128430298], 0, 1.3156898021697998, 1541119987.544479], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_depthwise_conv2d_nchw", [["TENSOR", [1, 32, 112, 112], "float32"], ["TENSOR", [32, 1, 3, 3], "float32"], [1, 1], [1, 1], "float32"], {}, ["depthwise_conv2d_nchw", [1, 32, 112, 112, "float32"], [32, 1, 3, 3, "float32"], [1, 1], [1, 1], "float32"], {"i": 3396246, "c": null, "e": [["tile_co", "sp", [32, 1]], ["tile_oh", "sp", [56, 2]], ["tile_ow", "sp", [14, 8]], ["reorder_0", "re", [0, 1, 2, 3, 4, 5, 6, 7, 8]], ["reorder_1", "re", [0, 1, 2, 3, 6, 4, 5]], ["ann_reduce", "an", ["unroll", "unroll"]], ["ann_spatial", "an", ["unroll", "vec", "unroll"]], ["data_pad_inline", "ot", 1], ["data_vec_inline", "ot", 2], ["conv_inline", "ot", 0]], "t": "direct"}], "r": [[0.0007260540542691752], 0, 1.302393913269043, 1541121289.114512], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_conv2d", [["TENSOR", [1, 3, 224, 224], "float32"], ["TENSOR", [32, 3, 3, 3], "float32"], [2, 2], [1, 1], "NCHW", "float32"], {}, ["conv2d", [1, 3, 224, 224, "float32"], [32, 3, 3, 3, "float32"], [2, 2], [1, 1], "NCHW", "float32"], {"i": 188, "c": null, "e": [["tile_ic", "sp", [3, 1]], ["tile_oc", "sp", [2, 16]], ["tile_ow", "sp", [7, 16]], ["unroll_kw", "ot", false]], "t": "direct"}], "r": [[0.0005389010258481421], 0, 1.3655979633331299, 1541122085.422816], "v": 0.1}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment