Skip to content

Instantly share code, notes, and snippets.

@wchargin
Created November 13, 2017 16:09
Show Gist options
  • Star 14 You must be signed in to star a gist
  • Fork 3 You must be signed in to fork a gist
  • Save wchargin/31eee50b9aaebf387b380f70054575c5 to your computer and use it in GitHub Desktop.
Save wchargin/31eee50b9aaebf387b380f70054575c5 to your computer and use it in GitHub Desktop.
Extract scalars to CSV using the TensorBoard event multiplexer API
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function
import csv
import errno
import os
import re
import tensorflow as tf
from tensorboard.backend.event_processing import plugin_event_multiplexer as event_multiplexer # pylint: disable=line-too-long
# Control downsampling: how many scalar data do we keep for each run/tag
# combination?
SIZE_GUIDANCE = {'scalars': 1000}
def extract_scalars(multiplexer, run, tag):
"""Extract tabular data from the scalars at a given run and tag.
The result is a list of 3-tuples (wall_time, step, value).
"""
tensor_events = multiplexer.Tensors(run, tag)
return [
(event.wall_time, event.step, tf.make_ndarray(event.tensor_proto).item())
for event in tensor_events
]
def create_multiplexer(logdir):
multiplexer = event_multiplexer.EventMultiplexer(
tensor_size_guidance=SIZE_GUIDANCE)
multiplexer.AddRunsFromDirectory(logdir)
multiplexer.Reload()
return multiplexer
def export_scalars(multiplexer, run, tag, filepath, write_headers=True):
data = extract_scalars(multiplexer, run, tag)
with open(filepath, 'w') as outfile:
writer = csv.writer(outfile)
if write_headers:
writer.writerow(('wall_time', 'step', 'value'))
for row in data:
writer.writerow(row)
NON_ALPHABETIC = re.compile('[^A-Za-z0-9_]')
def munge_filename(name):
"""Remove characters that might not be safe in a filename."""
return NON_ALPHABETIC.sub('_', name)
def mkdir_p(directory):
try:
os.makedirs(directory)
except OSError as e:
if not (e.errno == errno.EEXIST and os.path.isdir(directory)):
raise
def main():
run_names = (
'scalars_demo/temperature:t0=270,tA=270,kH=%s' % x
for x in ('0.001', '0.005')
)
tag_names = ('temperature/current/scalar_summary', 'delta/scalar_summary')
logdir = '/tmp/data'
output_dir = '/tmp/csv_output'
mkdir_p(output_dir)
print("Loading data...")
multiplexer = create_multiplexer(logdir)
for run_name in run_names:
for tag_name in tag_names:
output_filename = '%s___%s' % (
munge_filename(run_name), munge_filename(tag_name))
output_filepath = os.path.join(output_dir, output_filename)
print(
"Exporting (run=%r, tag=%r) to %r..."
% (run_name, tag_name, output_filepath))
export_scalars(multiplexer, run_name, tag_name, output_filepath)
print("Done.")
if __name__ == '__main__':
main()
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment