Skip to content

Instantly share code, notes, and snippets.

@dovahcrow
Created September 22, 2020 08:13
Show Gist options
  • Save dovahcrow/2d854810f94ed875543c87771fb349a0 to your computer and use it in GitHub Desktop.
Save dovahcrow/2d854810f94ed875543c87771fb349a0 to your computer and use it in GitHub Desktop.
Vega-Lite spec from Tue Sep 22 2020
{
"config": {"view": {"continuousWidth": 400, "continuousHeight": 300}},
"data": {"name": "data-311d929e23a8671460fda2c7f27ad1a7"},
"facet": {
"type": "nominal",
"field": "dataset",
"header": {
"labelAlign": "left",
"labelAngle": 0,
"labelPadding": 0,
"titlePadding": 0
},
"sort": {"field": "order", "op": "min", "order": "ascending"},
"title": "Dataset"
},
"spec": {
"layer": [
{
"mark": "bar",
"encoding": {
"color": {"type": "nominal", "field": "name", "legend": null},
"tooltip": [
{"type": "nominal", "field": "name"},
{
"type": "quantitative",
"field": "elapsed",
"format": ".2f",
"title": "Elapsed (s)"
},
{"type": "nominal", "field": "MachineMem"},
{"type": "nominal", "field": "DatasetMemSize"}
],
"x": {
"type": "quantitative",
"field": "elapsed",
"title": "Elapsed (s)"
},
"y": {"type": "nominal", "field": "name", "title": ""}
},
"title": "create_report(df) Comparison",
"width": 240
},
{
"mark": {"type": "text", "color": "white", "dx": -15, "dy": 1},
"encoding": {
"text": {"type": "quantitative", "field": "elapsed", "format": ".1f"},
"x": {
"type": "quantitative",
"field": "elapsed",
"title": "Elapsed (s)"
},
"y": {"type": "nominal", "field": "name", "title": ""}
},
"title": "create_report(df) Comparison",
"width": 240
}
]
},
"columns": 2,
"resolve": {"scale": {"x": "independent"}},
"$schema": "https://vega.github.io/schema/vega-lite/v4.8.1.json",
"datasets": {
"data-311d929e23a8671460fda2c7f27ad1a7": [
{
"cpu": 8,
"dataset": "automobile",
"fname": "create_report_pp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 219745,
"name": "PandasProfilingReport",
"elapsed": 38.19445466995239,
"DVM": 0.000003197710611857474,
"MachineMem": "64G",
"DatasetMemSize": "0.2M",
"order": 2
},
{
"cpu": 8,
"dataset": "automobile",
"fname": "create_report_dp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 219745,
"name": "DataPrepReport",
"elapsed": 3.90642237663269,
"DVM": 0.000003197710611857474,
"MachineMem": "64G",
"DatasetMemSize": "0.2M",
"order": 2
},
{
"cpu": 8,
"dataset": "titanic",
"fname": "create_report_pp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 336844,
"name": "PandasProfilingReport",
"elapsed": 17.759124279022217,
"DVM": 0.000004901725333184004,
"MachineMem": "64G",
"DatasetMemSize": "0.3M",
"order": 3
},
{
"cpu": 8,
"dataset": "titanic",
"fname": "create_report_dp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 336844,
"name": "DataPrepReport",
"elapsed": 2.093762397766113,
"DVM": 0.000004901725333184004,
"MachineMem": "64G",
"DatasetMemSize": "0.3M",
"order": 3
},
{
"cpu": 8,
"dataset": "suicide",
"fname": "create_report_pp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 12979530,
"name": "PandasProfilingReport",
"elapsed": 20.60933256149292,
"DVM": 0.0001888770202640444,
"MachineMem": "64G",
"DatasetMemSize": "12.4M",
"order": 7
},
{
"cpu": 8,
"dataset": "suicide",
"fname": "create_report_dp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 12979530,
"name": "DataPrepReport",
"elapsed": 2.795340538024902,
"DVM": 0.0001888770202640444,
"MachineMem": "64G",
"DatasetMemSize": "12.4M",
"order": 7
},
{
"cpu": 8,
"dataset": "chess",
"fname": "create_report_pp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 18135117,
"name": "PandasProfilingReport",
"elapsed": 23.597283363342285,
"DVM": 0.0002639006852405146,
"MachineMem": "64G",
"DatasetMemSize": "17.3M",
"order": 9
},
{
"cpu": 8,
"dataset": "chess",
"fname": "create_report_dp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 18135117,
"name": "DataPrepReport",
"elapsed": 4.349036455154419,
"DVM": 0.0002639006852405146,
"MachineMem": "64G",
"DatasetMemSize": "17.3M",
"order": 9
},
{
"cpu": 8,
"dataset": "adult",
"fname": "create_report_pp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 32319408,
"name": "PandasProfilingReport",
"elapsed": 23.207568645477295,
"DVM": 0.00047030928544700146,
"MachineMem": "64G",
"DatasetMemSize": "30.8M",
"order": 10
},
{
"cpu": 8,
"dataset": "adult",
"fname": "create_report_dp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 32319408,
"name": "DataPrepReport",
"elapsed": 3.995121479034424,
"DVM": 0.00047030928544700146,
"MachineMem": "64G",
"DatasetMemSize": "30.8M",
"order": 10
},
{
"cpu": 8,
"dataset": "women",
"fname": "create_report_pp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 2982987,
"name": "PandasProfilingReport",
"elapsed": 19.846524477005005,
"DVM": 0.00004340817395132035,
"MachineMem": "64G",
"DatasetMemSize": "2.8M",
"order": 4
},
{
"cpu": 8,
"dataset": "women",
"fname": "create_report_dp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 2982987,
"name": "DataPrepReport",
"elapsed": 2.253621578216552,
"DVM": 0.00004340817395132035,
"MachineMem": "64G",
"DatasetMemSize": "2.8M",
"order": 4
},
{
"cpu": 8,
"dataset": "conflicts",
"fname": "create_report_pp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 42992820,
"name": "PandasProfilingReport",
"elapsed": 34.8504536151886,
"DVM": 0.000625627872068435,
"MachineMem": "64G",
"DatasetMemSize": "41.0M",
"order": 12
},
{
"cpu": 8,
"dataset": "conflicts",
"fname": "create_report_dp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 42992820,
"name": "DataPrepReport",
"elapsed": 8.63267731666565,
"DVM": 0.000625627872068435,
"MachineMem": "64G",
"DatasetMemSize": "41.0M",
"order": 12
},
{
"cpu": 8,
"dataset": "rain",
"fname": "create_report_pp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 81910261,
"name": "PandasProfilingReport",
"elapsed": 100.13724899291992,
"DVM": 0.0011919511744054034,
"MachineMem": "64G",
"DatasetMemSize": "78.1M",
"order": 14
},
{
"cpu": 8,
"dataset": "rain",
"fname": "create_report_dp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 81910261,
"name": "DataPrepReport",
"elapsed": 11.556110858917236,
"DVM": 0.0011919511744054034,
"MachineMem": "64G",
"DatasetMemSize": "78.1M",
"order": 14
},
{
"cpu": 8,
"dataset": "hotel",
"fname": "create_report_pp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 111833855,
"name": "PandasProfilingReport",
"elapsed": 83.23299789428711,
"DVM": 0.0016273967776214704,
"MachineMem": "64G",
"DatasetMemSize": "106.7M",
"order": 15
},
{
"cpu": 8,
"dataset": "hotel",
"fname": "create_report_dp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 111833855,
"name": "DataPrepReport",
"elapsed": 12.955996036529541,
"DVM": 0.0016273967776214704,
"MachineMem": "64G",
"DatasetMemSize": "106.7M",
"order": 15
},
{
"cpu": 8,
"dataset": "credit",
"fname": "create_report_pp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 6240128,
"name": "PandasProfilingReport",
"elapsed": 126.97673153877258,
"DVM": 0.00009080581367015839,
"MachineMem": "64G",
"DatasetMemSize": "6.0M",
"order": 5
},
{
"cpu": 8,
"dataset": "credit",
"fname": "create_report_dp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 6240128,
"name": "DataPrepReport",
"elapsed": 6.080683946609497,
"DVM": 0.00009080581367015839,
"MachineMem": "64G",
"DatasetMemSize": "6.0M",
"order": 5
},
{
"cpu": 8,
"dataset": "diamonds",
"fname": "create_report_pp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 13668592,
"name": "PandasProfilingReport",
"elapsed": 28.24142575263977,
"DVM": 0.00019890419207513332,
"MachineMem": "64G",
"DatasetMemSize": "13.0M",
"order": 8
},
{
"cpu": 8,
"dataset": "diamonds",
"fname": "create_report_dp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 13668592,
"name": "DataPrepReport",
"elapsed": 3.12566876411438,
"DVM": 0.00019890419207513332,
"MachineMem": "64G",
"DatasetMemSize": "13.0M",
"order": 8
},
{
"cpu": 8,
"dataset": "solar",
"fname": "create_report_pp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 11031487,
"name": "PandasProfilingReport",
"elapsed": 25.080874919891357,
"DVM": 0.00016052926366683096,
"MachineMem": "64G",
"DatasetMemSize": "10.5M",
"order": 6
},
{
"cpu": 8,
"dataset": "solar",
"fname": "create_report_dp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 11031487,
"name": "DataPrepReport",
"elapsed": 2.742274284362793,
"DVM": 0.00016052926366683096,
"MachineMem": "64G",
"DatasetMemSize": "10.5M",
"order": 6
},
{
"cpu": 8,
"dataset": "basketball",
"fname": "create_report_pp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 44191798,
"name": "PandasProfilingReport",
"elapsed": 126.23006176948547,
"DVM": 0.0006430752982851118,
"MachineMem": "64G",
"DatasetMemSize": "42.1M",
"order": 13
},
{
"cpu": 8,
"dataset": "basketball",
"fname": "create_report_dp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 44191798,
"name": "DataPrepReport",
"elapsed": 9.948905229568481,
"DVM": 0.0006430752982851118,
"MachineMem": "64G",
"DatasetMemSize": "42.1M",
"order": 13
},
{
"cpu": 8,
"dataset": "diabetes",
"fname": "create_report_pp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 61568,
"name": "PandasProfilingReport",
"elapsed": 28.29576539993286,
"DVM": 8.959323167800903e-7,
"MachineMem": "64G",
"DatasetMemSize": "0.1M",
"order": 1
},
{
"cpu": 8,
"dataset": "diabetes",
"fname": "create_report_dp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 61568,
"name": "DataPrepReport",
"elapsed": 1.577282905578613,
"DVM": 8.959323167800903e-7,
"MachineMem": "64G",
"DatasetMemSize": "0.1M",
"order": 1
},
{
"cpu": 8,
"dataset": "heart",
"fname": "create_report_pp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 36488,
"name": "PandasProfilingReport",
"elapsed": 17.657201051712036,
"DVM": 5.309702828526497e-7,
"MachineMem": "64G",
"DatasetMemSize": "0.0M",
"order": 0
},
{
"cpu": 8,
"dataset": "heart",
"fname": "create_report_dp.py",
"format": "csv",
"memory": 68719476736,
"ncol": 0,
"nrow": 0,
"partition": 0,
"reader": "pandas",
"mem_size": 36488,
"name": "DataPrepReport",
"elapsed": 1.9863638877868652,
"DVM": 5.309702828526497e-7,
"MachineMem": "64G",
"DatasetMemSize": "0.0M",
"order": 0
}
]
}
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment