# tonybaloney/awesome.py

## awesome.py
from os import listdir
from os.path import isfile, join

import re

import matplotlib.pyplot as plt
import numpy as np

# Directory scanned for transcript files, relative to the working directory.
# Presumably each file is named "<episode number>.txt" -- TODO confirm.
path = 'transcripts'


def _episode_order(filename):
    """Return a sort key that puts transcripts into episode order.

    Names whose stem is purely numeric compare as integers, so "2.txt"
    sorts before "10.txt"; every other name sorts after them, by stem.
    """
    stem = filename.replace('.txt', '')
    if stem.isdecimal():
        return (0, int(stem), stem)
    return (1, 0, stem)


# os.listdir() yields entries in arbitrary order; sorting makes the order of
# `episodes` (and therefore of the bars in the chart) deterministic.
transcripts = sorted(
    (f for f in listdir(path) if isfile(join(path, f))),
    key=_episode_order,
)

# One record per transcript: {'number': <file name without ".txt">,
#                             'contents': <full text of the file>}
episodes = []

for transcript in transcripts:
    with open(join(path, transcript), encoding='utf8') as handle:
        episodes.append({
            'number': transcript.replace('.txt', ''),
            'contents': handle.read(),
        })

# Extra points awarded when one of these words sits between "that's" and
# "awesome"; any other word (or no word at all) earns no bonus.
intensifier_bonus = {
    'pretty': 1,  # meh
    'very': 2,    # nice
    'really': 5,  # woah
}

for episode in episodes:
    # findall() returns one (word, space) tuple per match; `word` is the
    # empty string when nothing was captured before "awesome".
    hits = re.findall(r'that\'s (\w+)?( )?awesome', episode['contents'])
    # Sometimes Michael gets really excited..
    excitement = sum(intensifier_bonus.get(word, 0) for word, _ in hits)
    # Score = one point per match plus the intensifier bonuses.
    episode['awesome'] = len(hits) + excitement

# Awesomeness score of every episode, in the order of `episodes`.
scores = [ep['awesome'] for ep in episodes]

# One bar slot per episode. The count is taken from the data instead of a
# hard-coded 53, which made bar() fail with a shape mismatch whenever the
# number of transcripts differed.
ind = np.arange(len(episodes))

# align='center' pins the centre of each bar to its x position regardless of
# the matplotlib version's default, so the tick labels set below line up.
p1 = plt.bar(ind, scores, color='g', align='center')

plt.ylabel('Awesomeness')
plt.title('Episodes by awesomeness')
# Put each episode number directly under its own bar (the previous
# `ind + 2.` offset shifted every label two bars to the right).
plt.xticks(ind, [ep['number'] for ep in episodes])
# Draw a y tick at every score that actually occurs.
plt.yticks(sorted(set(scores)))
plt.show()
	from os import listdir
	from os.path import isfile, join

	import re

	import matplotlib.pyplot as plt
	import numpy as np

	# Directory scanned for transcript files, relative to the working directory.
	# Presumably each file is named "<episode number>.txt" -- TODO confirm.
	path = 'transcripts'


	def _episode_order(filename):
		"""Return a sort key that puts transcripts into episode order.

		Names whose stem is purely numeric compare as integers, so "2.txt"
		sorts before "10.txt"; every other name sorts after them, by stem.
		"""
		stem = filename.replace('.txt', '')
		if stem.isdecimal():
			return (0, int(stem), stem)
		return (1, 0, stem)


	# os.listdir() yields entries in arbitrary order; sorting makes the order
	# of `episodes` (and therefore of the bars in the chart) deterministic.
	transcripts = sorted(
		(f for f in listdir(path) if isfile(join(path, f))),
		key=_episode_order,
	)

	# One record per transcript: {'number': <file name without ".txt">,
	#                             'contents': <full text of the file>}
	episodes = []

	for transcript in transcripts:
		with open(join(path, transcript), encoding='utf8') as handle:
			episodes.append({
				'number': transcript.replace('.txt', ''),
				'contents': handle.read(),
			})

	# Extra points awarded when one of these words sits between "that's" and
	# "awesome"; any other word (or no word at all) earns no bonus.
	intensifier_bonus = {
		'pretty': 1,  # meh
		'very': 2,    # nice
		'really': 5,  # woah
	}

	for episode in episodes:
		# findall() returns one (word, space) tuple per match; `word` is the
		# empty string when nothing was captured before "awesome".
		hits = re.findall(r'that\'s (\w+)?( )?awesome', episode['contents'])
		# Sometimes Michael gets really excited..
		excitement = sum(intensifier_bonus.get(word, 0) for word, _ in hits)
		# Score = one point per match plus the intensifier bonuses.
		episode['awesome'] = len(hits) + excitement

	# Awesomeness score of every episode, in the order of `episodes`.
	scores = [ep['awesome'] for ep in episodes]

	# One bar slot per episode. The count is taken from the data instead of a
	# hard-coded 53, which made bar() fail with a shape mismatch whenever the
	# number of transcripts differed.
	ind = np.arange(len(episodes))

	# align='center' pins the centre of each bar to its x position regardless
	# of the matplotlib version's default, so the tick labels below line up.
	p1 = plt.bar(ind, scores, color='g', align='center')

	plt.ylabel('Awesomeness')
	plt.title('Episodes by awesomeness')
	# Put each episode number directly under its own bar (the previous
	# `ind + 2.` offset shifted every label two bars to the right).
	plt.xticks(ind, [ep['number'] for ep in episodes])
	# Draw a y tick at every score that actually occurs.
	plt.yticks(sorted(set(scores)))
	plt.show()