@isaacs
Last active March 22, 2017 17:56
$ for TEST in old.js ts.js np3.js np3-seek.js np3-ignore.js no-parse.js; do echo ""; echo $TEST; for i in {1..5}; do node $TEST test/fixtures.tar >/dev/null; done; done
old.js
24.48
25.71
25.696
26.064
24.163
ts.js
43.783
32.742
42.84
37.62
24.885
np3.js
22.333
21.877
22.392
22.277
26.681
np3-seek.js
13.655
14.247
17.884
15.737
13.07
np3-ignore.js
9.554
10.376
9.671
10.198
9.807
no-parse.js
5.873
5.649
6.187
5.776
5.678
// no-parse.js: raw header walk, seeking past entry bodies
var ReadStream = require('fs-readstream-seek')
const input = new ReadStream(process.argv[2])

const parse = chunk => {
  var path = chunk.slice(0, 100).toString().replace(/\u0000.*/, '')
  if (!path)
    return
  var size = parseNumeric(chunk.slice(124, 124 + 12))
  var blockSize = Math.ceil(size / 512) * 512
  console.log(path)
  input.seek(input.readPos + blockSize)
}

const parseNumeric = f => {
  if (f[0] & 0x80) return parse256(f)
  var str = f.toString().replace(/\u0000.*$/, '').trim()
  var res = parseInt(str, 8)
  return isNaN(res) ? null : res
}

const parse256 = buf => {
  // first byte MUST be either 80 or FF
  // 80 for positive, FF for 2's comp
  var positive
  if (buf[0] === 0x80) positive = true
  else if (buf[0] === 0xFF) positive = false
  else return null

  // build up a base-256 tuple from the least sig to the highest
  // zero starts true: low-order 0x00 bytes stay 0 until the first
  // nonzero byte absorbs the two's-complement +1 carry
  var zero = true
  var tuple = []
  for (var i = buf.length - 1; i > 0; i--) {
    var byte = buf[i]
    if (positive) tuple.push(byte)
    else if (zero && byte === 0) tuple.push(0)
    else if (zero) {
      zero = false
      tuple.push(0x100 - byte)
    } else tuple.push(0xFF - byte)
  }
  for (var sum = 0, i = 0, l = tuple.length; i < l; i++) {
    sum += tuple[i] * Math.pow(256, i)
  }
  return positive ? sum : -1 * sum
}

const read = _ => {
  let chunk
  while (chunk = input.read(512)) {
    parse(chunk)
  }
}
input.on('readable', read)

const start = process.hrtime()
process.on('exit', c => {
  const end = process.hrtime(start)
  console.error(end[0]*1e3 + end[1]/1e6)
})
// np3-ignore.js: filter() rejects every entry, so the parser skips bodies
const Parser = require('./lib/new3.js')
const p = new Parser({
  filter (entry) {
    console.log(entry.path)
    return false
  }
})

const fs = require('fs')
const data = fs.readFileSync(process.argv[2])
console.log('< %j', process.argv[2])

process.on('exit', c => {
  const end = process.hrtime(start)
  console.error(end[0]*1e3 + end[1]/1e6)
})

const start = process.hrtime()
p.write(data)
// np3-seek.js: use fs-readstream-seek to jump past entry bodies
const Parser = require('./lib/new3.js')
const p = new Parser()
const ReadStream = require('fs-readstream-seek')

p.on('entry', entry => {
  const entryBlockSize = entry.blockRemain
  const entryEnd = input.readPos + entryBlockSize
  entry.remain = 0
  entry.blockRemain = 0
  console.log(entry.path)
  if (entryBlockSize !== 0)
    input.seek(entryEnd)
})

console.log('< %j', process.argv[2])
const input = new ReadStream(process.argv[2])
input.once('end', _ => p.end())

const read = _ => {
  let chunk
  // this is just reading headers; bodies are skipped via seek above
  while (chunk = input.read(512)) {
    if (!p.write(chunk))
      return p.once('drain', read)
  }
}
input.on('readable', read)

const start = process.hrtime()
process.on('exit', c => {
  const end = process.hrtime(start)
  console.error(end[0]*1e3 + end[1]/1e6)
})
// np3.js: read the whole file, write it to the parser in one call
var Parser = require('./lib/new3.js')
var p = new Parser()
p.on('entry', entry => {
  entry.resume()
  console.log(entry.path)
})

const fs = require('fs')
const input = fs.readFileSync(process.argv[2])
const start = process.hrtime()
p.write(input)
const end = process.hrtime(start)
console.error(end[0]*1e3 + end[1]/1e6)
// old.js: the current node-tar Parse stream
const Parse = require('./').Parse
const p = Parse()
p.on('entry', entry => {
  console.log(entry.path)
})
p.resume()

const fs = require('fs')
const input = fs.readFileSync(process.argv[2])

process.on('exit', c => {
  const end = process.hrtime(start)
  console.error(end[0]*1e3 + end[1]/1e6)
})

const start = process.hrtime()
p.write(input)
p.end()
// ts.js: tar-stream's extract() parser
const ts = require('tar-stream')
const p = ts.extract()
p.on('entry', (entry, stream, callback) => {
  console.log(entry.name)
  stream.resume()
  callback()
})
p.on('data', _ => _)

const fs = require('fs')
const input = fs.readFileSync(process.argv[2])
const start = process.hrtime()
p.write(input)
p.end()

// const fs = require('fs')
// const input = fs.createReadStream(process.argv[2])
// input.pipe(p)

process.on('exit', c => {
  const end = process.hrtime(start)
  console.error(end[0]*1e3 + end[1]/1e6)
})
isaacs commented Mar 22, 2017

5 different approaches to doing tar tf <file> in Node. (All times in ms using process.hrtime.)
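Every script reports its elapsed time with the same expression, `end[0]*1e3 + end[1]/1e6`, converting process.hrtime's [seconds, nanoseconds] diff tuple to milliseconds. Pulled out as a standalone helper (hypothetical name), the conversion looks like:

```javascript
// Convert a process.hrtime() diff tuple [seconds, nanoseconds] to
// milliseconds; mirrors the expression used in each benchmark script.
const hrtimeToMs = ([sec, ns]) => sec * 1e3 + ns / 1e6

// e.g. 2 seconds + 500000 ns = 2000.5 ms
console.log(hrtimeToMs([2, 500000]))
```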

no-parse.js is the fastest. It does literally nothing, but could be faster if it was operating on a single big buffer instead of using fs-readstream-seek. It's also not correct, since it doesn't handle long pathnames, extended headers, etc. Just a baseline, really. "Doing almost nothing" is always the fastest program.

old.js is the slowest. It uses the current node-tar parser. That parser isn't terrible, but it does a lot more work than it needs to, rather inefficiently, with no way to skip over entry bodies or to consume chunks larger than 512 bytes.

ts.js uses tar-stream, which is a very nice tar parser for node. It's usually faster than old.js, but having run this benchmark many times, I've noticed it occasionally has one very slow run. Not sure what's going on there. old.js is consistently slow, but ts.js is inconsistently fast. /shrug

np3.js is the 3rd iteration of the new parser. It's the simplest approach: read the data in one big block, write it to the parser, done.

np3-seek.js uses fs-readstream-seek to jump past entry bodies. This is a good approach if the file is larger than you want to load into memory.
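The seek arithmetic that np3-seek.js and no-parse.js both rely on is just rounding the entry size up to whole 512-byte tar blocks. As a standalone helper (hypothetical name):

```javascript
// An entry's body always occupies its size rounded up to whole 512-byte
// blocks, so seeking readPos + blockSize(size) lands on the next header.
const blockSize = size => Math.ceil(size / 512) * 512
```

Seeking input.readPos + blockSize(size) from just past a header is exactly what no-parse.js does inline, and what np3-seek.js does via entry.blockRemain.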

np3-ignore.js uses a filter function to ignore all the files, just dumping their paths as they come in. In this test, it also writes the data in one big chunk, and the parser skips over the body entirely if it's ignored. This is the fastest correct implementation so far.
