wchargin/extract_scalars.py

## extract_scalars.py
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function


import csv
import errno
import os
import re

import tensorflow as tf
from tensorboard.backend.event_processing import plugin_event_multiplexer as event_multiplexer  # pylint: disable=line-too-long


# Control downsampling: how many scalar data do we keep for each run/tag
# combination?
SIZE_GUIDANCE = {'scalars': 1000}


def extract_scalars(multiplexer, run, tag):
  """Extract tabular data from the scalars at a given run and tag.

  The result is a list of 3-tuples (wall_time, step, value).
  """
  tensor_events = multiplexer.Tensors(run, tag)
  return [
      (event.wall_time, event.step, tf.make_ndarray(event.tensor_proto).item())
      for event in tensor_events
  ]


def create_multiplexer(logdir):
  multiplexer = event_multiplexer.EventMultiplexer(
      tensor_size_guidance=SIZE_GUIDANCE)
  multiplexer.AddRunsFromDirectory(logdir)
  multiplexer.Reload()
  return multiplexer


def export_scalars(multiplexer, run, tag, filepath, write_headers=True):
  data = extract_scalars(multiplexer, run, tag)
  with open(filepath, 'w') as outfile:
    writer = csv.writer(outfile)
    if write_headers:
      writer.writerow(('wall_time', 'step', 'value'))
    for row in data:
      writer.writerow(row)


NON_ALPHABETIC = re.compile('[^A-Za-z0-9_]')

def munge_filename(name):
  """Remove characters that might not be safe in a filename."""
  return NON_ALPHABETIC.sub('_', name)


def mkdir_p(directory):
  try:
    os.makedirs(directory)
  except OSError as e:
    if not (e.errno == errno.EEXIST and os.path.isdir(directory)):
      raise


def main():
  run_names = (
      'scalars_demo/temperature:t0=270,tA=270,kH=%s' % x
      for x in ('0.001', '0.005')
  )
  tag_names = ('temperature/current/scalar_summary', 'delta/scalar_summary')

  logdir = '/tmp/data'
  output_dir = '/tmp/csv_output'
  mkdir_p(output_dir)

  print("Loading data...")
  multiplexer = create_multiplexer(logdir)
  for run_name in run_names:
    for tag_name in tag_names:
      output_filename = '%s___%s' % (
          munge_filename(run_name), munge_filename(tag_name))
      output_filepath = os.path.join(output_dir, output_filename)
      print(
          "Exporting (run=%r, tag=%r) to %r..."
          % (run_name, tag_name, output_filepath))
      export_scalars(multiplexer, run_name, tag_name, output_filepath)
  print("Done.")


if __name__ == '__main__':
  main()
	from __future__ import absolute_import
	from __future__ import division
	from __future__ import print_function


	import csv
	import errno
	import os
	import re

	import tensorflow as tf
	from tensorboard.backend.event_processing import plugin_event_multiplexer as event_multiplexer # pylint: disable=line-too-long


	# Control downsampling: how many scalar data do we keep for each run/tag
	# combination?
	SIZE_GUIDANCE = {'scalars': 1000}


	def extract_scalars(multiplexer, run, tag):
	"""Extract tabular data from the scalars at a given run and tag.

	The result is a list of 3-tuples (wall_time, step, value).
	"""
	tensor_events = multiplexer.Tensors(run, tag)
	return [
	(event.wall_time, event.step, tf.make_ndarray(event.tensor_proto).item())
	for event in tensor_events
	]


	def create_multiplexer(logdir):
	multiplexer = event_multiplexer.EventMultiplexer(
	tensor_size_guidance=SIZE_GUIDANCE)
	multiplexer.AddRunsFromDirectory(logdir)
	multiplexer.Reload()
	return multiplexer


	def export_scalars(multiplexer, run, tag, filepath, write_headers=True):
	data = extract_scalars(multiplexer, run, tag)
	with open(filepath, 'w') as outfile:
	writer = csv.writer(outfile)
	if write_headers:
	writer.writerow(('wall_time', 'step', 'value'))
	for row in data:
	writer.writerow(row)


	NON_ALPHABETIC = re.compile('[^A-Za-z0-9_]')

	def munge_filename(name):
	"""Remove characters that might not be safe in a filename."""
	return NON_ALPHABETIC.sub('_', name)


	def mkdir_p(directory):
	try:
	os.makedirs(directory)
	except OSError as e:
	if not (e.errno == errno.EEXIST and os.path.isdir(directory)):
	raise


	def main():
	run_names = (
	'scalars_demo/temperature:t0=270,tA=270,kH=%s' % x
	for x in ('0.001', '0.005')
	)
	tag_names = ('temperature/current/scalar_summary', 'delta/scalar_summary')

	logdir = '/tmp/data'
	output_dir = '/tmp/csv_output'
	mkdir_p(output_dir)

	print("Loading data...")
	multiplexer = create_multiplexer(logdir)
	for run_name in run_names:
	for tag_name in tag_names:
	output_filename = '%s___%s' % (
	munge_filename(run_name), munge_filename(tag_name))
	output_filepath = os.path.join(output_dir, output_filename)
	print(
	"Exporting (run=%r, tag=%r) to %r..."
	% (run_name, tag_name, output_filepath))
	export_scalars(multiplexer, run_name, tag_name, output_filepath)
	print("Done.")


	if __name__ == '__main__':
	main()