Skip to content

Instantly share code, notes, and snippets.

@bear
Created October 15, 2014 06:07
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save bear/04a01662b88196fe138d to your computer and use it in GitHub Desktop.
Save bear/04a01662b88196fe138d to your computer and use it in GitHub Desktop.
sample indie-stats cruncher
#!/usr/bin/env python
# count_hcards.sh domain workdir datajson resultjson
import os, sys
import json
import argparse
def _count_hcards(document):
    """Return how many entries of ``document['mf2']['items']`` are h-cards.

    An entry counts when the string ``'h-card'`` is contained in its
    ``'type'`` value.  Documents without an ``'mf2'``/``'items'`` structure
    yield 0, and entries that lack a ``'type'`` key are skipped instead of
    raising ``KeyError``.

    NOTE(review): the input is presumably microformats2 parser output;
    only the ``mf2 -> items -> type`` path is relied upon here.
    """
    if not isinstance(document, dict):
        return 0
    mf2 = document.get('mf2')
    if not isinstance(mf2, dict):
        return 0
    total = 0
    for item in mf2.get('items') or []:
        if isinstance(item, dict) and 'h-card' in (item.get('type') or ()):
            total += 1
    return total


def main(argv=None):
    """Count h-cards per timestamp and write the tallies as JSON.

    Command line: ``domain workdir datajson resultjson``.

    * ``datajson`` is a JSON file holding a list of file names.
    * Each listed file is read from ``workdir`` and parsed as JSON.
    * The text before the first ``'_'`` of a file name is used as the
      timestamp key; files sharing a key have their h-card counts summed.
    * The result, ``{timestamp: {'h-card': n}}``, is printed and written to
      ``resultjson``.

    Args:
        argv: Argument list to parse; ``None`` means ``sys.argv[1:]``.

    Returns:
        The ``{timestamp: {'h-card': n}}`` dictionary that was written.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument('domain')
    parser.add_argument('workdir')
    parser.add_argument('datajson')
    parser.add_argument('resultjson')
    args = parser.parse_args(argv)

    # Single-argument print() calls behave identically on Python 2 and 3.
    print(' '.join([args.domain, args.workdir, args.datajson,
                    args.resultjson]))

    with open(args.datajson) as handle:
        data_files = json.load(handle)

    counts = {}
    for name in data_files:
        print('processing %s' % name)
        # partition() tolerates names with zero or several underscores,
        # where unpacking split('_') into two names would raise ValueError.
        timestamp = name.partition('_')[0]
        # setdefault keeps the running total when several files share a
        # timestamp, instead of resetting it to zero for each file.
        bucket = counts.setdefault(timestamp, {'h-card': 0})
        with open(os.path.join(args.workdir, name)) as handle:
            document = json.load(handle)
        bucket['h-card'] += _count_hcards(document)

    serialized = json.dumps(counts)
    print(serialized)
    with open(args.resultjson, 'w') as handle:
        handle.write(serialized)
    return counts


if __name__ == '__main__':
    main()
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment