Skip to content

Instantly share code, notes, and snippets.

@jeremymv2
Last active August 21, 2019 17:55
Show Gist options
  • Star 1 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save jeremymv2/80ba99cb059e658d4639bbd013eb178b to your computer and use it in GitHub Desktop.
Save jeremymv2/80ba99cb059e658d4639bbd013eb178b to your computer and use it in GitHub Desktop.
Parrallel (backgrounded) knife ec restores with 1 thread per org
#!/usr/bin/env ruby
# Use this script if you have 3 or more Chef Organizations
# and wish to speed up restores by using parallelism.
require 'fileutils'
require 'optparse'
CONCURRENCY = 1
BACKUP_LOG = "restore_#{Time.now.strftime('%m%d%Y%H%M')}.log".freeze
SCRIPT_OUTPUT = 'chef-restore-by-org.sh'.freeze
ARGV << '-h' if ARGV.length != 6
# rubocop:disable Style/GlobalVars
$options = {}
OptionParser.new do |opts|
opts.banner = "Usage: #{$PROGRAM_NAME} [options]"
opts.on('-d', '--backup-dir PATH', '/path/to/backup/directory') { |v| $options[:backup_dir] = v }
opts.on('-k', '--kniferb PATH', '/path/to/pivotal.rb') { |v| $options[:knife_rb] = v }
opts.on('-a', '--args PATH', '/path/to/extra-args.txt') { |v| $options[:args_file] = v }
opts.on_tail('-h', '--help', 'Show this message') do
puts opts
exit
end
end.parse!
EXTRA_ARGS_FILE = $options[:args_file]
KNIFE_RB = $options[:knife_rb]
def extra_args
File.readlines(EXTRA_ARGS_FILE).map(&:chomp).join(' ')
end
def org_path(org)
File.expand_path(File.join($options[:backup_dir], 'organizations', org))
end
def tree_size(org_path)
Dir[File.join(org_path, '**/*')].size
end
def organizations_path
File.expand_path(File.join($options[:backup_dir], 'organizations'))
end
def populate_org_hash
orgs = {}
Dir[File.join(organizations_path, '**')].each do |org_path|
org = File.basename(org_path)
orgs[org] = {}
orgs[org]['path'] = org_path
orgs[org]['size'] = tree_size(org_path)
end
orgs
end
def orgs_by_size(orgs)
Hash[orgs.sort_by { |_k, v| v['size'] }.reverse].keys
end
# rubocop:disable Metrics/MethodLength
def write_script(list)
last_org = list.pop
penultimate_org = list.pop
org_with_users = "knife ec restore #{$options[:backup_dir]} --yes --purge -c #{KNIFE_RB} \
--concurrency #{CONCURRENCY} --with-user-sql --skip-useracl --only-org #{last_org} #{extra_args} 2>&1 \
| while IFS= read -r line; do echo \"ORG:#{last_org} $(date) $line\"; done >> #{BACKUP_LOG}"
org_with_useracl = "knife ec restore #{$options[:backup_dir]} --yes --purge -c #{KNIFE_RB} \
--concurrency #{CONCURRENCY} --skip-users --only-org #{penultimate_org} #{extra_args} 2>&1 \
| while IFS= read -r line; do echo \"ORG:#{penultimate_org} $(date) $line\"; done >> #{BACKUP_LOG}"
script = <<-SCRIPT
#!/bin/bash
ORGS="#{list.join(' ')}"
export PATH=/opt/chefdk/bin:$PATH
echo "Saving logs to #{BACKUP_LOG}"
echo "Step 1. restoring smallest org and all users"
#{org_with_users} || true
echo "Step 2. backgrounding restore job for orgs"
for org in $ORGS; do
knife ec restore #{$options[:backup_dir]} --yes --purge --concurrency #{CONCURRENCY} -c #{KNIFE_RB} --only-org $org --skip-users --skip-useracl #{extra_args} 2>&1 | while IFS= read -r line; do echo \"ORG:$org $(date) $line\"; done >> #{BACKUP_LOG} &
done
while [[ -n $(jobs -r) ]]; do echo -n "."; sleep 60; done
echo
echo "Step 3. restoring user acls along with last org"
#{org_with_useracl} || true
echo "Step 4. gathering results"
ORGS="${ORGS} #{last_org} #{penultimate_org}"
for org in $ORGS; do
if grep -q "^ORG:$org .*Finished" #{BACKUP_LOG}; then
echo "$org succeeded"
else
echo "$org failed"
fi
done
SCRIPT
puts "Writing: #{SCRIPT_OUTPUT}"
File.open(SCRIPT_OUTPUT, 'w') do |f|
f.write(script)
end
FileUtils.chmod 'u=rwx', SCRIPT_OUTPUT.to_s
end
# rubocop:enable Metrics/MethodLength
# rubocop:enable Style/GlobalVars
write_script orgs_by_size populate_org_hash
@jeremymv2
Copy link
Author

jeremymv2 commented Sep 17, 2018

  1. Copy the above script to one of your FrontEnds or backup workstation.

  2. Create a file in the same directory that contains lines for the following extra knife ec restore arguments, customized for your setup.

--webui-key /path/to/webui_priv.pem
--sql-host 192.168.200.100
--sql-port 5432
--sql-user opscode-pgsql
--sql-password f106a7d1a005696a5aeb4e9b87f2541ccb9834b4dfefba03f597ee130e73dc2b2d595f59aaf7b31f3aa2ad42f746a6991309
  1. Generate your restore script
15:49 $ ./parallel-restorev2.rb -d /path/to/backups -k /path/to/pivotal.rb -a /path/to/extra-args.txt
Writing: chef-restore-by-org.sh
15:50 $
  1. Run the restore
15:43 $ ./chef-restore-by-org.sh
Saving logs to restore_091720181543.log
Step 1. restoring smallest org (acmeinc) and all users.
Step 2. backgrounding restore job for remainder of orgs. users and user-acls will be skipped.
brewinc..
.
Step 3. gathering results
acmeinc succeeded
brewinc succeeded
15:44 $
  1. Monitor the output of the following commands on the Frontend and on the backend running PostgreSQL DB
  • watch iostat -x
  • watch free -m

@jeremymv2
Copy link
Author

This is a version that works with Habitat pkgs:

#!/usr/bin/env ruby

# Use this script if you have 3 or more Chef Organizations
# and wish to speed up restores by using parallelism.

require 'fileutils'
require 'optparse'

CONCURRENCY = 1
BACKUP_LOG = "restore_#{Time.now.strftime('%m%d%Y%H%M')}.log".freeze
SCRIPT_OUTPUT = 'chef-restore-by-org.sh'.freeze
KNIFE_EC_CMD = 'hab pkg exec jeremymv2/knife-ec-backup knife ec'

ARGV << '-h' if ARGV.length != 6
# rubocop:disable Style/GlobalVars
$options = {}
OptionParser.new do |opts|
  opts.banner = "Usage: #{$PROGRAM_NAME} [options]"
  opts.on('-d', '--backup-dir PATH', '/path/to/backup/directory') { |v| $options[:backup_dir] = v }
  opts.on('-k', '--kniferb PATH', '/path/to/pivotal.rb') { |v| $options[:knife_rb] = v }
  opts.on('-a', '--args PATH', '/path/to/extra-args.txt') { |v| $options[:args_file] = v }
  opts.on_tail('-h', '--help', 'Show this message') do
    puts opts
    exit
  end
end.parse!

EXTRA_ARGS_FILE = $options[:args_file]
KNIFE_RB = $options[:knife_rb]

def extra_args
  File.readlines(EXTRA_ARGS_FILE).map(&:chomp).join(' ')
end

def org_path(org)
  File.expand_path(File.join($options[:backup_dir], 'organizations', org))
end

def tree_size(org_path)
  Dir[File.join(org_path, '**/*')].size
end

def organizations_path
  File.expand_path(File.join($options[:backup_dir], 'organizations'))
end

def populate_org_hash
  orgs = {}
  Dir[File.join(organizations_path, '**')].each do |org_path|
    org = File.basename(org_path)
    orgs[org] = {}
    orgs[org]['path'] = org_path
    orgs[org]['size'] = tree_size(org_path)
  end
  orgs
end

def orgs_by_size(orgs)
  Hash[orgs.sort_by { |_k, v| v['size'] }.reverse].keys
end

# rubocop:disable Metrics/MethodLength
def write_script(list)
  last_org = list.pop
  penultimate_org = list.pop
  org_with_users = "#{KNIFE_EC_CMD} restore #{$options[:backup_dir]} --yes --purge -c #{KNIFE_RB} \
  --concurrency #{CONCURRENCY} --with-user-sql --skip-useracl --only-org #{last_org} #{extra_args} 2>&1 \
  | while IFS= read -r line; do echo \"ORG:#{last_org} $(date) $line\"; done >> #{BACKUP_LOG}"
  org_with_useracl = "#{KNIFE_EC_CMD} restore #{$options[:backup_dir]} --yes --purge -c #{KNIFE_RB} \
  --concurrency #{CONCURRENCY} --skip-users --only-org #{penultimate_org} #{extra_args} 2>&1 \
  | while IFS= read -r line; do echo \"ORG:#{penultimate_org} $(date) $line\"; done >> #{BACKUP_LOG}"
  script = <<-SCRIPT
#!/bin/bash
PATH=\$(hab pkg path core/ruby)/bin:\$PATH
ORGS="#{list.join(' ')}"
export PATH=/opt/chefdk/bin:$PATH
echo "Saving logs to #{BACKUP_LOG}"
echo "Step 1. restoring smallest org and all users"
#{org_with_users} || true
echo "Step 2. backgrounding restore job for orgs"
for org in $ORGS; do
  #{KNIFE_EC_CMD} restore #{$options[:backup_dir]} --yes --purge --concurrency #{CONCURRENCY} -c #{KNIFE_RB} --only-org $org --skip-users --skip-useracl #{extra_args} 2>&1 | while IFS= read -r line; do echo \"ORG:$org $(date) $line\"; done >> #{BACKUP_LOG} &
done
while [[ -n $(jobs -r) ]]; do echo -n "."; sleep 60; done
echo
echo "Step 3. restoring user acls along with last org"
#{org_with_useracl} || true
echo "Step 4. gathering results"
ORGS="${ORGS} #{last_org} #{penultimate_org}"
for org in $ORGS; do
  if grep -q "^ORG:$org .*Finished" #{BACKUP_LOG}; then
    echo "$org succeeded"
  else
    echo "$org failed"
  fi
done
SCRIPT
  puts "Writing: #{SCRIPT_OUTPUT}"
  File.open(SCRIPT_OUTPUT, 'w') do |f|
    f.write(script)
  end
  FileUtils.chmod 'u=rwx', SCRIPT_OUTPUT.to_s
end
# rubocop:enable Metrics/MethodLength
# rubocop:enable Style/GlobalVars

write_script orgs_by_size populate_org_hash

Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment