jamessouth/hashFilenames.js

## hashFilenames.js
const crypto = require('crypto');
const fs = require('fs');
const path = require('path');
const walk = require('walkdir');

//absolute file paths collected by getFileTree and appended in sepArray; generateNewName searches this list to turn a
//relative path found in a file back into a path on disk
let tree = [];

//hash and rename a file
//filepath: path of the file to hash; it is renamed in place to <name>.<md5 hex digest><ext>
//resolves with the new base name (not the full path); rejects if the file cannot be read or renamed
async function hashFile(filepath) {
  const { dir, name, ext } = path.parse(filepath);
  const hash = crypto.createHash('md5'); //the digest only ends up in the file name
  //async iteration consumes every chunk and turns a stream error into a rejection instead of an unhandled
  //'error' event
  for await (const chunk of fs.createReadStream(filepath)) {
    hash.update(chunk);
  }
  const newname = `${name}.${hash.digest('hex')}${ext}`;
  //rename only after the whole file has been read
  await fs.promises.rename(filepath, path.resolve(dir, newname));
  return newname;
}

//loop through paths found in a file, send each path to either be hashed or explore its paths
//arr: relative paths as they appear in a file's contents
//yields [base, newname]: the path's base name and whatever hashFile/makeNewFile resolved to for it
//throws if no entry in tree has the referenced base name
//NOTE(review): hashFile renames files on disk but tree is not updated here, so a file referenced from two different
//parents would be looked up under its old path the second time - confirm whether that can happen in practice
async function* generateNewName(arr) {
  const leafExts = ['.png', '.jpg', '.pdf']; //files that don't reference other files can be hashed
  for (const relPath of arr) {
    const { base, ext } = path.parse(relPath);
    //get absolute path from tree; compare whole base names, a substring test would let app.js pick up webapp.js
    const match = tree.find((e) => path.basename(e) === base);
    if (match === undefined) {
      throw new Error(`No file named "${base}" found in tree (referenced as "${relPath}")`);
    }
    const newname = leafExts.includes(ext)
      ? await hashFile(match)
      : await makeNewFile(match); //follow other paths to get their sub-paths and repeat
    yield [base, newname];
  }
}

//get paths from a file, exclude non-hashed files, replace old paths with new hashed names, return either new or original
//file contents
//data: the file's text
//resolves with the rewritten text, or with data untouched when no path is found in it
async function updateHashedPaths(data) {
  let file = data.replace(/src\//g, ''); //src used in dev, remove for prod
  const paths = file.match(/\.\.?\/(\w+\/)?[\w-]+\.(css|m?js|png|jpg|pdf)/g); //adjust as needed to capture paths
  if (!paths) {
    return data;
  }
  //exclude; each name needs its own includes() call because the second argument of String#includes is a start
  //position, not another needle
  const excluded = ['service-worker', 'manifest.webmanifest'];
  const uniquePaths = [...new Set(paths.filter((p) => !excluded.some((x) => p.includes(x))))];
  for await (const [oldName, newName] of generateNewName(uniquePaths)) {
    //escape regex metacharacters so the "." in main.css only matches a literal dot
    const literal = oldName.replace(/[.*+?^${}()|[\]\\]/g, '\\$&');
    //the lookbehind keeps main.css from matching inside a longer name such as admin-main.css
    const pattern = new RegExp(`(?<![\\w-])${literal}`, 'g');
    file = file.replace(pattern, () => newName); //update paths; function form inserts newName verbatim
  }
  return file;
}

//reads a file, rewrites the paths inside it, saves it back under the same name and then hashes it
//file: path of the file to process
//resolves with the resolved path when it ends with "html", otherwise with whatever hashFile resolves to
async function makeNewFile(file) {
  const target = path.resolve(file);
  const original = await fs.promises.readFile(target, 'utf8');
  const updated = await updateHashedPaths(original);
  await fs.promises.writeFile(target, updated, 'utf8');
  if (target.endsWith('html')) {
    return target; //html files keep their name
  }
  //a file that references other files is hashed only after its paths have been updated
  const hashedName = await hashFile(target);
  return hashedName;
}

//walk the directory containing the starter file to get absolute file paths for easier matching with relative paths
//./ and ../
//file: path of the starter file; only its directory name is used for the walk
//resolves with [file, paths] where paths is the walk result minus every path that was handed to the filter as a
//directory
async function getFileTree(file) {
  const visitedDirs = new Set();
  //exclude paths we don't want to hash
  const keepEntry = (entry) => !['icons', 'index.html', 'manifest.webmanifest'].includes(entry);
  const options = {
    filter(dir, files) {
      visitedDirs.add(dir); //remember each directory the filter is called with so it can be dropped below
      return files.filter((f) => keepEntry(f));
    },
  };
  const everything = await walk.async(path.dirname(file), options);
  const filesOnly = everything.filter((entry) => !visitedDirs.has(entry));
  return [file, filesOnly];
}

//takes the [file, paths] pair, appends the paths to the tree array and passes the starter file through
function sepArray(pair) {
  const [file, arr] = pair;
  tree = tree.concat(arr);
  return file;
}

//start with node hashFilenames.js ./dist/index.html
//collects the file tree, stores it, then processes the starter file; any failure is logged and reported through a
//non-zero exit code so a calling build script can stop
getFileTree(process.argv[2])
  .then(sepArray)
  .then(makeNewFile)
  .catch((e) => {
    console.error(e);
    process.exitCode = 1; //without this the process exits 0 even though hashing failed
  });
	const crypto = require('crypto');
	const fs = require('fs');
	const path = require('path');
	const walk = require('walkdir');

	//absolute file paths collected by getFileTree and appended in sepArray; generateNewName searches this list to turn a
	//relative path found in a file back into a path on disk
	let tree = [];

	//hash and rename a file
	//filepath: path of the file to hash; it is renamed in place to <name>.<md5 hex digest><ext>
	//resolves with the new base name (not the full path); rejects if the file cannot be read or renamed
	async function hashFile(filepath) {
	  const { dir, name, ext } = path.parse(filepath);
	  const hash = crypto.createHash('md5'); //the digest only ends up in the file name
	  //async iteration consumes every chunk and turns a stream error into a rejection instead of an unhandled
	  //'error' event
	  for await (const chunk of fs.createReadStream(filepath)) {
	    hash.update(chunk);
	  }
	  const newname = `${name}.${hash.digest('hex')}${ext}`;
	  //rename only after the whole file has been read
	  await fs.promises.rename(filepath, path.resolve(dir, newname));
	  return newname;
	}

	//loop through paths found in a file, send each path to either be hashed or explore its paths
	//arr: relative paths as they appear in a file's contents
	//yields [base, newname]: the path's base name and whatever hashFile/makeNewFile resolved to for it
	//throws if no entry in tree has the referenced base name
	//NOTE(review): hashFile renames files on disk but tree is not updated here, so a file referenced from two different
	//parents would be looked up under its old path the second time - confirm whether that can happen in practice
	async function* generateNewName(arr) {
	  const leafExts = ['.png', '.jpg', '.pdf']; //files that don't reference other files can be hashed
	  for (const relPath of arr) {
	    const { base, ext } = path.parse(relPath);
	    //get absolute path from tree; compare whole base names, a substring test would let app.js pick up webapp.js
	    const match = tree.find((e) => path.basename(e) === base);
	    if (match === undefined) {
	      throw new Error(`No file named "${base}" found in tree (referenced as "${relPath}")`);
	    }
	    const newname = leafExts.includes(ext)
	      ? await hashFile(match)
	      : await makeNewFile(match); //follow other paths to get their sub-paths and repeat
	    yield [base, newname];
	  }
	}

	//get paths from a file, exclude non-hashed files, replace old paths with new hashed names, return either new or original
	//file contents
	//data: the file's text
	//resolves with the rewritten text, or with data untouched when no path is found in it
	async function updateHashedPaths(data) {
	  let file = data.replace(/src\//g, ''); //src used in dev, remove for prod
	  //adjust as needed to capture paths; the extensions are separated by a plain | (an escaped \| would only match a
	  //literal pipe character, so no real path would ever be found)
	  const paths = file.match(/\.\.?\/(\w+\/)?[\w-]+\.(css|m?js|png|jpg|pdf)/g);
	  if (!paths) {
	    return data;
	  }
	  //exclude; each name needs its own includes() call because the second argument of String#includes is a start
	  //position, not another needle
	  const excluded = ['service-worker', 'manifest.webmanifest'];
	  const uniquePaths = [...new Set(paths.filter((p) => !excluded.some((x) => p.includes(x))))];
	  for await (const [oldName, newName] of generateNewName(uniquePaths)) {
	    //escape regex metacharacters so the "." in main.css only matches a literal dot
	    const literal = oldName.replace(/[.*+?^${}()|[\]\\]/g, '\\$&');
	    //the lookbehind keeps main.css from matching inside a longer name such as admin-main.css
	    const pattern = new RegExp(`(?<![\\w-])${literal}`, 'g');
	    file = file.replace(pattern, () => newName); //update paths; function form inserts newName verbatim
	  }
	  return file;
	}

	//reads a file, rewrites the paths inside it, saves it back under the same name and then hashes it
	//file: path of the file to process
	//resolves with the resolved path when it ends with "html", otherwise with whatever hashFile resolves to
	async function makeNewFile(file) {
	  const target = path.resolve(file);
	  const original = await fs.promises.readFile(target, 'utf8');
	  const updated = await updateHashedPaths(original);
	  await fs.promises.writeFile(target, updated, 'utf8');
	  if (target.endsWith('html')) {
	    return target; //html files keep their name
	  }
	  //a file that references other files is hashed only after its paths have been updated
	  const hashedName = await hashFile(target);
	  return hashedName;
	}

	//walk the directory containing the starter file to get absolute file paths for easier matching with relative paths
	//./ and ../
	//file: path of the starter file; only its directory name is used for the walk
	//resolves with [file, paths] where paths is the walk result minus every path that was handed to the filter as a
	//directory
	async function getFileTree(file) {
	  const visitedDirs = new Set();
	  //exclude paths we don't want to hash
	  const keepEntry = (entry) => !['icons', 'index.html', 'manifest.webmanifest'].includes(entry);
	  const options = {
	    filter(dir, files) {
	      visitedDirs.add(dir); //remember each directory the filter is called with so it can be dropped below
	      return files.filter((f) => keepEntry(f));
	    },
	  };
	  const everything = await walk.async(path.dirname(file), options);
	  const filesOnly = everything.filter((entry) => !visitedDirs.has(entry));
	  return [file, filesOnly];
	}

	//takes the [file, paths] pair, appends the paths to the tree array and passes the starter file through
	function sepArray(pair) {
	  const [file, arr] = pair;
	  tree = tree.concat(arr);
	  return file;
	}

	//start with node hashFilenames.js ./dist/index.html
	//collects the file tree, stores it, then processes the starter file; any failure is logged and reported through a
	//non-zero exit code so a calling build script can stop
	getFileTree(process.argv[2])
	  .then(sepArray)
	  .then(makeNewFile)
	  .catch((e) => {
	    console.error(e);
	    process.exitCode = 1; //without this the process exits 0 even though hashing failed
	  });