Skip to content

Instantly share code, notes, and snippets.

from Bio import SeqIO
import sys
seq_number = 1
for rec in SeqIO.parse(open(sys.argv[1]), "fasta"):
cols = rec.name.split("_")
count = int(cols[3])
for n in xrange(count):
print ">%s_%s_%s read%s" % (cols[0], cols[1], seq_number, seq_number)
@nickloman
nickloman / get.py
Created June 3, 2011 09:55
Little Tweet ripper
## little tweet ripper, run python get.py ABPH11
import operator
import sys
import urllib
import json
url = "http://search.twitter.com/search.json"
u_hash = {}
@nickloman
nickloman / expandvcf.py
Created July 5, 2011 15:01
A little script to expand VCF to allow the key-value list to be easily sorted/filtered
import sys
from copy import copy
used_keys = ['DP', 'AF1', 'CI95', 'DP4', 'MQ', 'PV4', 'INDEL']
initial_dict = dict([(k, '') for k in used_keys])
for ln in sys.stdin:
d = copy(initial_dict)
cols = ln.rstrip().split("\t")
@nickloman
nickloman / filter.py
Created August 4, 2011 10:43
Remove filtered reads from CASAVA 1.8+ output.
# Usage python filter.py <read1.gz> <read2.gz>
from Bio import SeqIO
import itertools
import sys
import gzip
import os.path
f1 = gzip.open(sys.argv[1], "r")
f2 = gzip.open(sys.argv[2], "r")
@nickloman
nickloman / dodir_makeqiimefiles.py
Created November 18, 2011 14:24
dodir_makeqiimefiles.py
from Bio import SeqIO
import sys
import glob
def system(cmd):
print >>sys.stderr, cmd
os.system(cmd)
# dodir_pyro.py directory
@nickloman
nickloman / dodir_perseus.py
Created November 18, 2011 14:24
dodir_perseus.py
import os
import sys
import glob
def system(cmd):
print >>sys.stderr, cmd
os.system(cmd)
# dodir_pyro.py directory
@nickloman
nickloman / gist:1376578
Created November 18, 2011 14:25
dodir_pyrom.py
import os
import sys
import glob
def system(cmd):
print >>sys.stderr, cmd
os.system(cmd)
# dodir_pyro.py directory
@nickloman
nickloman / dodir_seqnoisem.py
Created November 18, 2011 14:26
dodir_seqnoisem.py
import os
import sys
import glob
TRUNCATE_LENGTH = int(sys.argv[2])
def system(cmd):
print >>sys.stderr, cmd
os.system(cmd)
@nickloman
nickloman / genbank_to_tbl.py
Created May 11, 2012 16:10
genbank_to_tbl.py
# requires biopython
# run like:
# genbank_to_tbl.py "my organism name" "my strain ID" "ncbi project id" < my_sequence.gbk
# writes seq.fsa, seq.tbl as output
import sys
from copy import copy
from Bio import SeqIO
def find_gene_entry(features, locus_tag):
--- lib/qiime/assign_taxonomy.py 2011-09-11 20:53:06.000000000 +0100
+++ ../16s/Qiime-1.2.1/build/lib/qiime/assign_taxonomy.py 2011-02-22 21:00:06.000000000 +0000
@@ -89,7 +89,7 @@
""" Initialize the object
"""
_params = {
- 'Min percent identity': 90,
+ 'Min percent identity': 0.90,
'Max E value': 1e-30,
'Application': 'blastn/megablast'