# premchalmeti/highlighter.py

## highlighter.py
def highlight_matches(text, words):
    """Return one highlighted copy of *text* per span containing all *words*.

    The text is split on single spaces and scanned left to right. A span
    opens at the first search word seen and closes on the token that
    completes the set of distinct search words; tracking then restarts, so
    spans never overlap. Each result is the full text with that one span
    wrapped in ``<b>...</b>``.

    Matching is exact and per token, so ``'dog.'`` does not match ``'dog'``.
    Returns an empty list when *words* is empty or no span is completed.
    """
    wanted = set(words)
    if not wanted:
        # Nothing to look for; without this guard every token would count
        # as a completed match.
        return []

    tokens = text.split(' ')
    results = []
    seen = set()
    start = 0
    for pos, token in enumerate(tokens):
        if token not in wanted or token in seen:
            continue
        if not seen:
            # First search word of a new span marks where the highlight begins.
            start = pos
        seen.add(token)
        if len(seen) == len(wanted):
            # Tag the boundary tokens in a copy so the surrounding text is
            # reproduced exactly, with no stray space when the span touches
            # either edge of the text.
            marked = list(tokens)
            marked[start] = "<b>" + marked[start]
            marked[pos] = marked[pos] + "</b>"
            results.append(" ".join(marked))
            seen = set()
    return results


doc = 'The quick brown fox jumps over the lazy dog. The quick brown fox over the lazy dog. The quick brown fox jumps over the lazy dog.'
search_words = ['quick', 'fox', 'over']

highlights = highlight_matches(doc, search_words)

# Parenthesised so the statement parses on both Python 2 and Python 3.
print(highlights)
	# NOTE(review): this tab-indented section repeats the script found earlier
	# in the file and had lost its nested indentation; the loop structure is
	# restored here. Confirm whether the duplicate should be kept at all.
	doc = 'The quick brown fox jumps over the lazy dog. The quick brown fox over the lazy dog. The quick brown fox jumps over the lazy dog.'
	search_words = ['quick', 'fox', 'over']

	splitted_words = doc.split(' ')
	highlights = []
	tracked_words = []
	start_pos = 0

	# Scan the space-separated tokens, collecting each distinct search word
	# once; a highlight is emitted whenever all of them have been seen.
	for cur_pos, word in enumerate(splitted_words):
		if word in search_words and word not in tracked_words:
			if not tracked_words:
				# First search word of a new span marks where the highlight begins.
				start_pos = cur_pos
			tracked_words.append(word)
		if len(tracked_words) == len(search_words):
			# Every search word has been seen: close the span on this token
			# and reset tracking so the next span starts fresh.
			end_pos = cur_pos + 1
			tracked_words = []
			cur_highlight = " ".join(splitted_words[start_pos:end_pos])
			pre_highlight = " ".join(splitted_words[:start_pos])
			post_highlight = " ".join(splitted_words[end_pos:])

			highlights.append("%s <b>%s</b> %s" %
				(pre_highlight, cur_highlight, post_highlight))

	# Parenthesised so the statement parses on both Python 2 and Python 3.
	print(highlights)