# mittenchops/tagger.py

## tagger.py
import re

# Sample tag vocabulary; passed to makecounts() and tagger() in the example below.
ARTS = ['dance','photography','art therapy']

def string_found(string1, string2):
    """Report whether ``string1`` occurs in ``string2`` as a standalone word or phrase.

    ``string1`` is matched literally (it is escaped before being placed in
    the pattern) and case-sensitively. An occurrence only counts when it is
    not directly preceded or followed by a word character.

    :param string1: word or phrase to look for.
    :param string2: text to search.
    :returns: ``1`` if at least one standalone occurrence exists, else ``0``.
        An empty ``string1`` is reported as not found.
    """
    # An empty needle cannot meaningfully be "found" as a word.
    if not string1:
        return 0
    # Lookarounds rather than \b: \b only marks a word/non-word transition,
    # so a needle that starts or ends with punctuation (e.g. "c++") could
    # never match when followed by a space or by the end of the text.
    pattern = r"(?<!\w)" + re.escape(string1) + r"(?!\w)"
    return 1 if re.search(pattern, string2) else 0

def string_count(string1, string2):
    """Count standalone, non-overlapping occurrences of ``string1`` in ``string2``.

    ``string1`` is matched literally (it is escaped before being placed in
    the pattern) and case-sensitively. An occurrence only counts when it is
    not directly preceded or followed by a word character.

    :param string1: word or phrase to count.
    :param string2: text to search.
    :returns: number of occurrences as an ``int``; ``0`` for an empty
        ``string1``.
    """
    # An empty needle produces zero-width matches; the previous manual scan
    # never advanced past such a match and looped forever.
    if not string1:
        return 0
    # Lookarounds rather than \b so needles that start or end with
    # punctuation (e.g. "c++") are still recognised as standalone.
    pattern = re.compile(r"(?<!\w)" + re.escape(string1) + r"(?!\w)")
    # finditer scans the text once, left to right, without re-slicing it.
    return sum(1 for _ in pattern.finditer(string2))

def makecounts(mystr, tags):
    """Map each tag in ``tags`` to the number of times it occurs in ``mystr``.

    Matching is case-insensitive: both the text and each tag are lower-cased
    before being handed to ``string_count``. The returned dict is keyed by
    the tags exactly as the caller supplied them.

    :param mystr: text to scan.
    :param tags: iterable of tag strings.
    :returns: dict of ``{tag: count}``.
    """
    # Lower-case the text once instead of once per tag.
    lowered = mystr.lower()
    # Tags are lower-cased for matching only; previously a tag containing a
    # capital letter could never match the lower-cased text.
    return {tag: string_count(tag.lower(), lowered) for tag in tags}
def gettags(mydict):
    """Return the tags in ``mydict`` whose count is greater than zero.

    :param mydict: mapping of tag to count.
    :returns: list of the truthy keys with a positive count, in the
        mapping's iteration order.
    """
    # Build the list directly: filter() yields a lazy iterator on Python 3,
    # not a list. Falsy keys (e.g. "") are still dropped, as
    # filter(None, ...) did.
    return [tag for tag, count in mydict.items() if count > 0 and tag]
def tagger(mystr, tags):
    """Tag ``mystr``: count each entry of ``tags`` and keep those that occur.

    Feeds the counts produced by ``makecounts(mystr, tags)`` to ``gettags``
    and returns whatever ``gettags`` returns.
    """
    counts = makecounts(mystr, tags)
    return gettags(counts)

# Example: tag a sample sentence with the ARTS vocabulary.
x = "A wonderful string about art therapy, photography, and architecture!"
# Per-tag counts. The call's result is discarded; the bare dict literal on the
# next line is a no-op expression, presumably the expected output pasted in.
makecounts(x,ARTS)
{'dance': 0, 'photography': 1, 'art therapy': 1}

# Tags with a non-zero count. The bare list literal below is likewise a no-op
# expression, presumably the expected output.
tagger(x, ARTS)
['photography', 'art therapy']
	import re

	# Sample tag vocabulary; passed to makecounts() and tagger() in the example below.
	ARTS = ['dance','photography','art therapy']

	def string_found(string1, string2):
		"""Report whether ``string1`` occurs in ``string2`` as a standalone word or phrase.

		``string1`` is matched literally (it is escaped before being placed in
		the pattern) and case-sensitively. An occurrence only counts when it
		is not directly preceded or followed by a word character.

		:param string1: word or phrase to look for.
		:param string2: text to search.
		:returns: ``1`` if at least one standalone occurrence exists, else
			``0``. An empty ``string1`` is reported as not found.
		"""
		# An empty needle cannot meaningfully be "found" as a word.
		if not string1:
			return 0
		# Lookarounds rather than \b: \b only marks a word/non-word
		# transition, so a needle that starts or ends with punctuation
		# (e.g. "c++") could never match when followed by a space or by the
		# end of the text.
		pattern = r"(?<!\w)" + re.escape(string1) + r"(?!\w)"
		return 1 if re.search(pattern, string2) else 0

	def string_count(string1, string2):
		"""Count standalone, non-overlapping occurrences of ``string1`` in ``string2``.

		``string1`` is matched literally (it is escaped before being placed in
		the pattern) and case-sensitively. An occurrence only counts when it
		is not directly preceded or followed by a word character.

		:param string1: word or phrase to count.
		:param string2: text to search.
		:returns: number of occurrences as an ``int``; ``0`` for an empty
			``string1``.
		"""
		# An empty needle produces zero-width matches; the previous manual
		# scan never advanced past such a match and looped forever.
		if not string1:
			return 0
		# Lookarounds rather than \b so needles that start or end with
		# punctuation (e.g. "c++") are still recognised as standalone.
		pattern = re.compile(r"(?<!\w)" + re.escape(string1) + r"(?!\w)")
		# finditer scans the text once, left to right, without re-slicing it.
		return sum(1 for _ in pattern.finditer(string2))

	def makecounts(mystr, tags):
		"""Map each tag in ``tags`` to the number of times it occurs in ``mystr``.

		Matching is case-insensitive: both the text and each tag are
		lower-cased before being handed to ``string_count``. The returned
		dict is keyed by the tags exactly as the caller supplied them.

		:param mystr: text to scan.
		:param tags: iterable of tag strings.
		:returns: dict of ``{tag: count}``.
		"""
		# Lower-case the text once instead of once per tag.
		lowered = mystr.lower()
		# Tags are lower-cased for matching only; previously a tag containing
		# a capital letter could never match the lower-cased text.
		return {tag: string_count(tag.lower(), lowered) for tag in tags}
	def gettags(mydict):
		"""Return the tags in ``mydict`` whose count is greater than zero.

		:param mydict: mapping of tag to count.
		:returns: list of the truthy keys with a positive count, in the
			mapping's iteration order.
		"""
		# Build the list directly: filter() yields a lazy iterator on
		# Python 3, not a list. Falsy keys (e.g. "") are still dropped, as
		# filter(None, ...) did.
		return [tag for tag, count in mydict.items() if count > 0 and tag]
	def tagger(mystr, tags):
		"""Tag ``mystr``: count each entry of ``tags`` and keep those that occur.

		Feeds the counts produced by ``makecounts(mystr, tags)`` to
		``gettags`` and returns whatever ``gettags`` returns.
		"""
		counts = makecounts(mystr, tags)
		return gettags(counts)

	# Example: tag a sample sentence with the ARTS vocabulary.
	x = "A wonderful string about art therapy, photography, and architecture!"
	# Per-tag counts. The call's result is discarded; the bare dict literal on
	# the next line is a no-op expression, presumably the expected output.
	makecounts(x,ARTS)
	{'dance': 0, 'photography': 1, 'art therapy': 1}

	# Tags with a non-zero count. The bare list literal below is likewise a
	# no-op expression, presumably the expected output.
	tagger(x, ARTS)
	['photography', 'art therapy']