Created
March 23, 2018 07:51
-
-
Save pasamio/405e0be4e812f2735ee7ca05274b500b to your computer and use it in GitHub Desktop.
Backup CouchDB instance to local JSON files.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#!/usr/bin/php -n -d error_reporting=-1 -d display_errors=1 -d memory_limit=1G | |
<?php | |
// Report every notice and warning: failures should be visible in the job output.
ini_set('error_reporting', -1);
ini_set('display_errors', 1);

// Run one incremental backup per .ini file in the "configs" directory next to this script.
$configFiles = glob(__DIR__ . '/configs/*.ini');
if ($configFiles === false) {
    // glob() returns false on error; treat that the same as "no configurations found".
    $configFiles = array();
}
foreach ($configFiles as $configFile) {
    $config = parse_ini_file($configFile);
    if ($config === false) {
        // An unparseable file must not be handed on as if it were a settings array.
        printf("Skipping unreadable config file: %s\n", $configFile);
        continue;
    }
    processUpdate($config);
}
// The function definitions below are still available: PHP hoists unconditional top-level functions.
die("All done\n");
/**
 * Recursively delete a directory and everything beneath it.
 *
 * Symbolic links found inside the tree are removed as links and are never
 * followed, so a link pointing elsewhere cannot cause files outside the tree
 * to be deleted.
 *
 * @param string $dir Path of the directory to remove.
 *
 * @return bool True when the directory itself was removed; false when it is
 *              missing, unreadable, or could not be removed.
 */
function delTree($dir) {
    $entries = is_dir($dir) ? scandir($dir) : false;
    if ($entries === false) {
        // Nothing can be listed, so there is nothing that can safely be deleted.
        return false;
    }
    foreach (array_diff($entries, array('.', '..')) as $entry) {
        $path = "$dir/$entry";
        // is_dir() follows symlinks, so rule links out before recursing.
        if (is_dir($path) && !is_link($path)) {
            delTree($path);
        } else {
            unlink($path);
        }
    }
    return rmdir($dir);
}
/**
 * Build the sharded directory path for a record.
 *
 * The record id is hashed with md5 and consecutive two-character slices of the
 * hex digest, starting at the beginning, become nested directory names under
 * the backup root.
 *
 * @param string $backupPath Root directory of the backup.
 * @param string $id         Record identifier to hash.
 * @param int    $depth      Number of directory levels to append; values above 15 are treated as 15.
 *
 * @return string The backup root followed by one "/xx" component per level.
 */
function getPathForRecord($backupPath, $id, $depth = 2)
{
    $digest = md5($id);
    $levels = ($depth > 15) ? 15 : $depth;

    // Collect the root plus one two-character digest slice per level, then join once.
    $segments = array($backupPath);
    for ($offset = 0; $offset < $levels * 2; $offset += 2) {
        $segments[] = substr($digest, $offset, 2);
    }

    return implode('/', $segments);
}
/**
 * Create a directory (including missing parents) unless it already exists.
 *
 * @param string $dir Directory path to create.
 *
 * @return bool True when the directory exists on return.
 */
function backupEnsureDirectory($dir)
{
    // Re-check after mkdir() so a directory created concurrently is not reported as a failure.
    return is_dir($dir) || mkdir($dir, 0777, true) || is_dir($dir);
}

/**
 * Tell whether a server-supplied name may be appended to a backup path.
 *
 * Names containing "/" are accepted (they map to nested directories), but an
 * empty name, a NUL byte, or any ".." path segment is rejected so that a
 * document id or attachment name can never address a location outside the
 * directory it is appended to.
 *
 * @param mixed $name Document id or attachment name.
 *
 * @return bool True when the name is safe to use as a relative path.
 */
function backupIsSafeRelativeName($name)
{
    $name = (string) $name;
    if ($name === '' || strpos($name, "\0") !== false) {
        return false;
    }
    foreach (explode('/', str_replace('\\', '/', $name)) as $segment) {
        if ($segment === '..') {
            return false;
        }
    }
    return true;
}

/**
 * Incrementally back up one CouchDB database to local JSON files.
 *
 * Reads the `_changes` feed in batches of 10 starting from the sequence stored
 * by the previous run, writes each changed document as `<id>.json` (or
 * `<id>.json.gz`) under a hashed directory, stores attachments in a directory
 * named after the document, removes the files of deleted documents, and
 * records the last processed sequence after every batch.
 *
 * @param array $config Settings, normally from parse_ini_file(). Required keys:
 *                      `backupPath`, `sequencePath`, `dbName`, `dbHost`.
 *                      Optional key: `compressBackup` (truthy to gzip documents).
 *
 * @return void
 *
 * @throws InvalidArgumentException When $config is not an array or a required key is missing.
 * @throws RuntimeException         When the backup directory cannot be created or the
 *                                  server response is not a valid changes document.
 */
function processUpdate($config)
{
    if (!is_array($config)) {
        throw new InvalidArgumentException('Backup configuration must be an array (did parse_ini_file() fail?).');
    }
    foreach (array('backupPath', 'sequencePath', 'dbName', 'dbHost') as $requiredKey) {
        if (!isset($config[$requiredKey]) || $config[$requiredKey] === '') {
            throw new InvalidArgumentException(sprintf('Missing required backup setting "%s".', $requiredKey));
        }
    }

    // Read the settings explicitly instead of extract(), so a config file cannot inject arbitrary locals.
    $backupPath = $config['backupPath'];
    $sequencePath = $config['sequencePath'];
    $dbName = $config['dbName'];
    $dbHost = $config['dbHost'];
    $compressBackup = !empty($config['compressBackup']);

    if (!backupEnsureDirectory($backupPath)) {
        throw new RuntimeException(sprintf('Unable to create backup directory %s', $backupPath));
    }
    // Without this directory the checkpoint could never be saved and every run would start from 0.
    backupEnsureDirectory($sequencePath);

    $sequenceFile = sprintf('%s/%s_to_backup_%s', $sequencePath, $dbName, md5($dbHost.$backupPath));
    $since = "0";
    if (file_exists($sequenceFile))
    {
        printf("Using sequence file: %s\n", $sequenceFile);
        // Trim so a trailing newline in the checkpoint file does not end up in the URL.
        $lastSince = trim((string) file_get_contents($sequenceFile));
        if ($lastSince !== '')
        {
            $since = $lastSince;
        }
    }

    do
    {
        $url = sprintf(
            '%s/%s/_changes?include_docs=true&limit=10&since=%s&attachments=true',
            $dbHost,
            $dbName,
            rawurlencode((string) $since)
        );
        printf("Using URL %s\n\n", $url);

        $data = file_get_contents($url);
        if ($data === false)
        {
            die("Unable to connect to CouchDB\n");
        }

        $response = json_decode($data);
        if (!is_object($response) || !isset($response->results) || !is_array($response->results) || !isset($response->last_seq))
        {
            // E.g. an error document instead of a changes batch: do not overwrite the checkpoint with garbage.
            throw new RuntimeException(sprintf('Unexpected response from %s', $url));
        }

        $changes = $response->results;
        $lastSeq = $response->last_seq;
        $since = $lastSeq;

        if (count($changes) === 0)
        {
            // An empty batch means there is nothing left to fetch.
            $pending = 0;
        }
        elseif (isset($response->pending))
        {
            $pending = (int) $response->pending;
        }
        else
        {
            // The response carries no `pending` counter: keep paging until a batch comes back empty.
            $pending = count($changes);
        }

        foreach ($changes as $change)
        {
            if (!backupIsSafeRelativeName($change->id))
            {
                trigger_error(sprintf('Skipping document with unsafe id "%s"', $change->id), E_USER_WARNING);
                continue;
            }

            $documentPath = getPathForRecord($backupPath, $change->id);
            backupEnsureDirectory($documentPath);

            if (isset($change->deleted))
            {
                printf("Change %s is deleted, deleting doc.\n", $change->id);
                $recPath = sprintf('%s/%s.json', $documentPath, $change->id);
                $recPathCompressed = sprintf('%s/%s.json.gz', $documentPath, $change->id);
                $attachments = sprintf('%s/%s', $documentPath, $change->id);

                foreach (array($recPath, $recPathCompressed) as $staleFile)
                {
                    if (file_exists($staleFile) && !unlink($staleFile))
                    {
                        trigger_error(sprintf('Unable to delete %s', $staleFile), E_USER_WARNING);
                    }
                }
                if (file_exists($attachments) && !delTree($attachments))
                {
                    trigger_error(sprintf('Unable to delete %s', $attachments), E_USER_WARNING);
                }
                continue;
            }

            printf("Found Record %s\n", $change->id);

            // Store attachments as separate files and strip their payload from the document JSON.
            if (isset($change->doc->_attachments))
            {
                $attachmentRoot = sprintf("%s/%s", $documentPath, $change->id);
                backupEnsureDirectory($attachmentRoot);
                foreach ($change->doc->_attachments as $filename => $attachment)
                {
                    if (!backupIsSafeRelativeName($filename))
                    {
                        trigger_error(sprintf('Skipping attachment with unsafe name "%s" on %s', $filename, $change->id), E_USER_WARNING);
                    }
                    elseif (isset($attachment->data))
                    {
                        $attachmentFile = $attachmentRoot . '/' . $filename;
                        // An attachment name containing "/" needs its intermediate directories.
                        backupEnsureDirectory(dirname($attachmentFile));
                        if (file_put_contents($attachmentFile, base64_decode($attachment->data)) === false)
                        {
                            trigger_error(sprintf('Unable to write attachment %s', $attachmentFile), E_USER_WARNING);
                        }
                    }
                    unset($attachment->data);
                }
            }

            $data_json = json_encode($change->doc);
            if ($data_json === false)
            {
                trigger_error(sprintf('Unable to encode document %s: %s', $change->id, json_last_error_msg()), E_USER_WARNING);
                continue;
            }

            $recordFile = sprintf('%s/%s.json', $documentPath, $change->id);
            if ($compressBackup)
            {
                $recordFile .= '.gz';
                $data_json = gzencode($data_json);
            }

            // A document id containing "/" places the file in a sub-directory that must exist first.
            backupEnsureDirectory(dirname($recordFile));
            if (file_put_contents($recordFile, $data_json) === false)
            {
                trigger_error(sprintf('Unable to write %s', $recordFile), E_USER_WARNING);
            }
        }

        printf("Pending: %d; Last Seq: %s\n", $pending, $lastSeq);
        if (file_put_contents($sequenceFile, $lastSeq) === false)
        {
            trigger_error(sprintf('Unable to save sequence file %s', $sequenceFile), E_USER_WARNING);
        }
    }
    while ($pending > 0);
}
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment