Skip to content

Instantly share code, notes, and snippets.

@yzhliu
Created November 2, 2018 21:07
Show Gist options
  • Save yzhliu/c5b4ad171c0d8b862fe30bdad09434b3 to your computer and use it in GitHub Desktop.
Save yzhliu/c5b4ad171c0d8b862fe30bdad09434b3 to your computer and use it in GitHub Desktop.
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_conv2d", [["TENSOR", [1, 1024, 7, 7], "float32"], ["TENSOR", [1024, 1024, 1, 1], "float32"], [1, 1], [0, 0], "NCHW", "float32"], {}, ["conv2d", [1, 1024, 7, 7, "float32"], [1024, 1024, 1, 1, "float32"], [1, 1], [0, 0], "NCHW", "float32"], {"i": 417, "c": null, "e": [["tile_ic", "sp", [1, 1024]], ["tile_oc", "sp", [64, 16]], ["tile_ow", "sp", [1, 7]], ["tile_oh", "ot", 2]], "t": "direct"}], "r": [[0.00010386519659715739], 0, 1.2961008548736572, 1541133775.742406], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_depthwise_conv2d_nchw", [["TENSOR", [1, 1024, 7, 7], "float32"], ["TENSOR", [1024, 1, 3, 3], "float32"], [1, 1], [1, 1], "float32"], {}, ["depthwise_conv2d_nchw", [1, 1024, 7, 7, "float32"], [1024, 1, 3, 3, "float32"], [1, 1], [1, 1], "float32"], {"i": 777271, "c": null, "e": [["tile_co", "sp", [1024, 1]], ["tile_oh", "sp", [1, 7]], ["tile_ow", "sp", [7, 1]], ["reorder_0", "re", [0, 1, 2, 3, 4, 5, 8, 6, 7]], ["reorder_1", "re", [0, 1, 2, 3, 4, 5, 6]], ["ann_reduce", "an", ["none", "none"]], ["ann_spatial", "an", ["vec", "none", "none"]], ["data_pad_inline", "ot", 1], ["data_vec_inline", "ot", 3], ["conv_inline", "ot", 1]], "t": "direct"}], "r": [[1.3592455556007427e-05], 0, 1.220390796661377, 1541136835.442611], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_conv2d", [["TENSOR", [1, 512, 7, 7], "float32"], ["TENSOR", [1024, 512, 1, 1], "float32"], [1, 1], [0, 0], "NCHW", "float32"], {}, ["conv2d", [1, 512, 7, 7, "float32"], [1024, 512, 1, 1, "float32"], [1, 1], [0, 0], "NCHW", "float32"], {"i": 379, "c": null, "e": [["tile_ic", "sp", [1, 512]], ["tile_oc", "sp", [64, 16]], ["tile_ow", "sp", [1, 7]], ["tile_oh", "ot", 2]], "t": "direct"}], "r": [[5.4070532632146703e-05], 0, 1.3067660331726074, 1541139391.440993], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_depthwise_conv2d_nchw", [["TENSOR", [1, 512, 14, 14], "float32"], ["TENSOR", [512, 1, 3, 3], "float32"], [2, 2], [1, 1], "float32"], {}, ["depthwise_conv2d_nchw", [1, 512, 14, 14, "float32"], [512, 1, 3, 3, "float32"], [2, 2], [1, 1], "float32"], {"i": 1271020, "c": null, "e": [["tile_co", "sp", [512, 1]], ["tile_oh", "sp", [7, 1]], ["tile_ow", "sp", [1, 7]], ["reorder_0", "re", [0, 1, 2, 3, 4, 5, 8, 6, 7]], ["reorder_1", "re", [0, 1, 2, 3, 4, 6, 5]], ["ann_reduce", "an", ["unroll", "unroll"]], ["ann_spatial", "an", ["none", "unroll", "none"]], ["data_pad_inline", "ot", 1], ["data_vec_inline", "ot", 1], ["conv_inline", "ot", 3]], "t": "direct"}], "r": [[8.570726388651514e-06], 0, 1.2734742164611816, 1541144170.814932], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_conv2d", [["TENSOR", [1, 512, 14, 14], "float32"], ["TENSOR", [512, 512, 1, 1], "float32"], [1, 1], [0, 0], "NCHW", "float32"], {}, ["conv2d", [1, 512, 14, 14, "float32"], [512, 512, 1, 1, "float32"], [1, 1], [0, 0], "NCHW", "float32"], {"i": 749, "c": null, "e": [["tile_ic", "sp", [1, 512]], ["tile_oc", "sp", [32, 16]], ["tile_ow", "sp", [1, 14]], ["tile_oh", "ot", 2]], "t": "direct"}], "r": [[8.500800439797528e-05], 0, 1.3582830429077148, 1541145096.951141], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_depthwise_conv2d_nchw", [["TENSOR", [1, 512, 14, 14], "float32"], ["TENSOR", [512, 1, 3, 3], "float32"], [1, 1], [1, 1], "float32"], {}, ["depthwise_conv2d_nchw", [1, 512, 14, 14, "float32"], [512, 1, 3, 3, "float32"], [1, 1], [1, 1], "float32"], {"i": 5514210, "c": null, "e": [["tile_co", "sp", [512, 1]], ["tile_oh", "sp", [7, 2]], ["tile_ow", "sp", [1, 14]], ["reorder_0", "re", [0, 1, 2, 3, 4, 5, 8, 6, 7]], ["reorder_1", "re", [0, 1, 2, 3, 4, 6, 5]], ["ann_reduce", "an", ["unroll", "unroll"]], ["ann_spatial", "an", ["unroll", "vec", "unroll"]], ["data_pad_inline", "ot", 1], ["data_vec_inline", "ot", 2], ["conv_inline", "ot", 3]], "t": "direct"}], "r": [[1.0471765691077334e-05], 0, 1.2541429996490479, 1541151082.108897], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_conv2d", [["TENSOR", [1, 256, 14, 14], "float32"], ["TENSOR", [512, 256, 1, 1], "float32"], [1, 1], [0, 0], "NCHW", "float32"], {}, ["conv2d", [1, 256, 14, 14, "float32"], [512, 256, 1, 1, "float32"], [1, 1], [0, 0], "NCHW", "float32"], {"i": 674, "c": null, "e": [["tile_ic", "sp", [1, 256]], ["tile_oc", "sp", [32, 16]], ["tile_ow", "sp", [1, 14]], ["tile_oh", "ot", 2]], "t": "direct"}], "r": [[5.0277709421939006e-05], 0, 1.4122250080108643, 1541152905.73859], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_depthwise_conv2d_nchw", [["TENSOR", [1, 256, 28, 28], "float32"], ["TENSOR", [256, 1, 3, 3], "float32"], [2, 2], [1, 1], "float32"], {}, ["depthwise_conv2d_nchw", [1, 256, 28, 28, "float32"], [256, 1, 3, 3, "float32"], [2, 2], [1, 1], "float32"], {"i": 2515428, "c": null, "e": [["tile_co", "sp", [256, 1]], ["tile_oh", "sp", [14, 1]], ["tile_ow", "sp", [7, 2]], ["reorder_0", "re", [0, 1, 2, 3, 4, 5, 6, 7, 8]], ["reorder_1", "re", [0, 1, 2, 3, 6, 4, 5]], ["ann_reduce", "an", ["unroll", "unroll"]], ["ann_spatial", "an", ["none", "vec", "unroll"]], ["data_pad_inline", "ot", 1], ["data_vec_inline", "ot", 3], ["conv_inline", "ot", 1]], "t": "direct"}], "r": [[1.2434137185505304e-05], 0, 1.284156084060669, 1541158135.486475], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_conv2d", [["TENSOR", [1, 256, 28, 28], "float32"], ["TENSOR", [256, 256, 1, 1], "float32"], [1, 1], [0, 0], "NCHW", "float32"], {}, ["conv2d", [1, 256, 28, 28, "float32"], [256, 256, 1, 1, "float32"], [1, 1], [0, 0], "NCHW", "float32"], {"i": 449, "c": null, "e": [["tile_ic", "sp", [1, 256]], ["tile_oc", "sp", [16, 16]], ["tile_ow", "sp", [1, 28]], ["tile_oh", "ot", 1]], "t": "direct"}], "r": [[0.00010307642396560988], 0, 1.507378101348877, 1541160055.125099], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_depthwise_conv2d_nchw", [["TENSOR", [1, 256, 28, 28], "float32"], ["TENSOR", [256, 1, 3, 3], "float32"], [1, 1], [1, 1], "float32"], {}, ["depthwise_conv2d_nchw", [1, 256, 28, 28, "float32"], [256, 1, 3, 3, "float32"], [1, 1], [1, 1], "float32"], {"i": 4930218, "c": null, "e": [["tile_co", "sp", [256, 1]], ["tile_oh", "sp", [7, 4]], ["tile_ow", "sp", [2, 14]], ["reorder_0", "re", [0, 1, 2, 3, 4, 5, 6, 7, 8]], ["reorder_1", "re", [0, 1, 2, 3, 4, 5, 6]], ["ann_reduce", "an", ["none", "none"]], ["ann_spatial", "an", ["unroll", "vec", "none"]], ["data_pad_inline", "ot", 1], ["data_vec_inline", "ot", 2], ["conv_inline", "ot", 1]], "t": "direct"}], "r": [[1.6605442621862134e-05], 0, 1.2241771221160889, 1541167564.825683], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_conv2d", [["TENSOR", [1, 128, 28, 28], "float32"], ["TENSOR", [256, 128, 1, 1], "float32"], [1, 1], [0, 0], "NCHW", "float32"], {}, ["conv2d", [1, 128, 28, 28, "float32"], [256, 128, 1, 1, "float32"], [1, 1], [0, 0], "NCHW", "float32"], {"i": 399, "c": null, "e": [["tile_ic", "sp", [1, 128]], ["tile_oc", "sp", [16, 16]], ["tile_ow", "sp", [1, 28]], ["tile_oh", "ot", 1]], "t": "direct"}], "r": [[6.103659873661082e-05], 0, 1.429612159729004, 1541167754.770049], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_depthwise_conv2d_nchw", [["TENSOR", [1, 128, 56, 56], "float32"], ["TENSOR", [128, 1, 3, 3], "float32"], [2, 2], [1, 1], "float32"], {}, ["depthwise_conv2d_nchw", [1, 128, 56, 56, "float32"], [128, 1, 3, 3, "float32"], [2, 2], [1, 1], "float32"], {"i": 4388080, "c": null, "e": [["tile_co", "sp", [128, 1]], ["tile_oh", "sp", [7, 4]], ["tile_ow", "sp", [7, 4]], ["reorder_0", "re", [0, 1, 2, 3, 4, 5, 6, 7, 8]], ["reorder_1", "re", [0, 1, 2, 3, 6, 4, 5]], ["ann_reduce", "an", ["unroll", "unroll"]], ["ann_spatial", "an", ["unroll", "vec", "none"]], ["data_pad_inline", "ot", 1], ["data_vec_inline", "ot", 2], ["conv_inline", "ot", 1]], "t": "direct"}], "r": [[2.4103942467535596e-05], 0, 1.2903680801391602, 1541171156.394026], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_conv2d", [["TENSOR", [1, 128, 56, 56], "float32"], ["TENSOR", [128, 128, 1, 1], "float32"], [1, 1], [0, 0], "NCHW", "float32"], {}, ["conv2d", [1, 128, 56, 56, "float32"], [128, 128, 1, 1, "float32"], [1, 1], [0, 0], "NCHW", "float32"], {"i": 242, "c": null, "e": [["tile_ic", "sp", [32, 4]], ["tile_oc", "sp", [2, 64]], ["tile_ow", "sp", [8, 7]], ["tile_oh", "ot", 1]], "t": "direct"}], "r": [[0.00010614913752676114], 0, 1.555973768234253, 1541172923.267865], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_depthwise_conv2d_nchw", [["TENSOR", [1, 128, 56, 56], "float32"], ["TENSOR", [128, 1, 3, 3], "float32"], [1, 1], [1, 1], "float32"], {}, ["depthwise_conv2d_nchw", [1, 128, 56, 56, "float32"], [128, 1, 3, 3, "float32"], [1, 1], [1, 1], "float32"], {"i": 7800656, "c": null, "e": [["tile_co", "sp", [128, 1]], ["tile_oh", "sp", [14, 4]], ["tile_ow", "sp", [4, 14]], ["reorder_0", "re", [0, 1, 2, 3, 4, 5, 8, 6, 7]], ["reorder_1", "re", [0, 1, 2, 3, 4, 5, 6]], ["ann_reduce", "an", ["unroll", "unroll"]], ["ann_spatial", "an", ["unroll", "vec", "none"]], ["data_pad_inline", "ot", 1], ["data_vec_inline", "ot", 2], ["conv_inline", "ot", 1]], "t": "direct"}], "r": [[3.2108080823277106e-05], 0, 1.2447669506072998, 1541179975.661915], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_conv2d", [["TENSOR", [1, 64, 56, 56], "float32"], ["TENSOR", [128, 64, 1, 1], "float32"], [1, 1], [0, 0], "NCHW", "float32"], {}, ["conv2d", [1, 64, 56, 56, "float32"], [128, 64, 1, 1, "float32"], [1, 1], [0, 0], "NCHW", "float32"], {"i": 155, "c": null, "e": [["tile_ic", "sp", [32, 2]], ["tile_oc", "sp", [2, 64]], ["tile_ow", "sp", [14, 4]], ["tile_oh", "ot", 1]], "t": "direct"}], "r": [[6.500861753958587e-05], 0, 1.5069780349731445, 1541180070.801788], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_depthwise_conv2d_nchw", [["TENSOR", [1, 64, 112, 112], "float32"], ["TENSOR", [64, 1, 3, 3], "float32"], [2, 2], [1, 1], "float32"], {}, ["depthwise_conv2d_nchw", [1, 64, 112, 112, "float32"], [64, 1, 3, 3, "float32"], [2, 2], [1, 1], "float32"], {"i": 5718510, "c": null, "e": [["tile_co", "sp", [64, 1]], ["tile_oh", "sp", [14, 4]], ["tile_ow", "sp", [7, 8]], ["reorder_0", "re", [0, 1, 2, 3, 4, 5, 6, 7, 8]], ["reorder_1", "re", [0, 1, 2, 3, 6, 4, 5]], ["ann_reduce", "an", ["unroll", "unroll"]], ["ann_spatial", "an", ["unroll", "unroll", "none"]], ["data_pad_inline", "ot", 1], ["data_vec_inline", "ot", 1], ["conv_inline", "ot", 1]], "t": "direct"}], "r": [[4.923698401770347e-05], 0, 1.6932947635650635, 1541183600.543316], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_conv2d", [["TENSOR", [1, 32, 112, 112], "float32"], ["TENSOR", [64, 32, 1, 1], "float32"], [1, 1], [0, 0], "NCHW", "float32"], {}, ["conv2d", [1, 32, 112, 112, "float32"], [64, 32, 1, 1, "float32"], [1, 1], [0, 0], "NCHW", "float32"], {"i": 160, "c": null, "e": [["tile_ic", "sp", [2, 16]], ["tile_oc", "sp", [2, 32]], ["tile_ow", "sp", [16, 7]], ["tile_oh", "ot", 1]], "t": "direct"}], "r": [[8.695871455888743e-05], 0, 1.4124460220336914, 1541185106.716176], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_depthwise_conv2d_nchw", [["TENSOR", [1, 32, 112, 112], "float32"], ["TENSOR", [32, 1, 3, 3], "float32"], [1, 1], [1, 1], "float32"], {}, ["depthwise_conv2d_nchw", [1, 32, 112, 112, "float32"], [32, 1, 3, 3, "float32"], [1, 1], [1, 1], "float32"], {"i": 10380012, "c": null, "e": [["tile_co", "sp", [32, 1]], ["tile_oh", "sp", [28, 4]], ["tile_ow", "sp", [112, 1]], ["reorder_0", "re", [0, 1, 2, 3, 4, 5, 6, 7, 8]], ["reorder_1", "re", [0, 1, 2, 3, 6, 4, 5]], ["ann_reduce", "an", ["unroll", "unroll"]], ["ann_spatial", "an", ["none", "none", "none"]], ["data_pad_inline", "ot", 1], ["data_vec_inline", "ot", 3], ["conv_inline", "ot", 1]], "t": "direct"}], "r": [[6.47391044012945e-05], 0, 1.2620232105255127, 1541189613.086462], "v": 0.1}
{"i": ["llvm -mcpu=skylake-avx512", "topi_nn_conv2d", [["TENSOR", [1, 3, 224, 224], "float32"], ["TENSOR", [32, 3, 3, 3], "float32"], [2, 2], [1, 1], "NCHW", "float32"], {}, ["conv2d", [1, 3, 224, 224, "float32"], [32, 3, 3, 3, "float32"], [2, 2], [1, 1], "NCHW", "float32"], {"i": 8, "c": null, "e": [["tile_ic", "sp", [3, 1]], ["tile_oc", "sp", [2, 16]], ["tile_ow", "sp", [112, 1]], ["unroll_kw", "ot", true]], "t": "direct"}], "r": [[5.2986724205301506e-05], 0, 1.347486972808838, 1541191372.385285], "v": 0.1}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment