Skip to content

Instantly share code, notes, and snippets.

@petermaloney
Forked from jimparis/punch.py
Last active May 19, 2017 08:23
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save petermaloney/c184d077d8cb2d43165761b2487f3da8 to your computer and use it in GitHub Desktop.
Save petermaloney/c184d077d8cb2d43165761b2487f3da8 to your computer and use it in GitHub Desktop.
Using FALLOC_FL_PUNCH_HOLE from Python to punch holes in files
#!/usr/bin/python
import ctypes
import ctypes.util
import os
c_off_t = ctypes.c_int64
def make_fallocate():
libc_name = ctypes.util.find_library('c')
libc = ctypes.CDLL(libc_name)
_fallocate = libc.fallocate
_fallocate.restype = ctypes.c_int
_fallocate.argtypes = [ctypes.c_int, ctypes.c_int, c_off_t, c_off_t]
del libc
del libc_name
def fallocate(fd, mode, offset, len_):
res = _fallocate(fd.fileno(), mode, offset, len_)
if res != 0:
raise IOError(res, 'fallocate')
return fallocate
fallocate = make_fallocate()
del make_fallocate
FALLOC_FL_KEEP_SIZE = 0x01
FALLOC_FL_PUNCH_HOLE = 0x02
def punch(filename, verbose, blocksize=None):
if verbose:
print "processing", filename
with open(filename, 'r+') as f:
if not blocksize:
blocksize = os.fstatvfs(f.fileno()).f_bsize
else:
blocksize = int(blocksize)
offset = 0
length = 0
while True:
buf = f.read(blocksize)
if not buf:
break
for c in buf:
if c != '\x00':
break
else:
if verbose:
print "punching hole at offset", offset, "length", len(buf)
fallocate(f, FALLOC_FL_KEEP_SIZE | FALLOC_FL_PUNCH_HOLE,
offset, len(buf))
offset = offset + blocksize
if __name__ == '__main__':
import sys
import argparse
parser = argparse.ArgumentParser(
description = "Punch out the empty areas in a file, making it sparse")
parser.add_argument('file', metavar='FILE',
help='file(s) to modify in-place', nargs='+')
parser.add_argument('-v', '--verbose', action="store_true", default=False,
help='be verbose')
parser.add_argument('-b', '--blocksize', metavar='BS', default=None,
help='override detected filesystem blocksize')
args = parser.parse_args()
for filename in args.file:
punch(filename, args.verbose, args.blocksize)
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment