kaminomisosiru/frequency_analysis.py

## frequency_analysis.py
# -*- coding: utf-8 -*-
'''
英文ファイルを読み込んで頻度分析を行うサンプル
'''
from collections import OrderedDict

def frequency_analysis(text):
    '''
    Print the relative frequency of each lowercase ASCII letter in ``text``.

    Only the characters 'a' through 'z' are counted; every other character
    (uppercase letters, digits, whitespace, punctuation, non-ASCII text) is
    skipped. For each letter that occurs at least once, one line of the form
    ``<letter>:<percentage>`` is written to standard output, in alphabetical
    order. Percentages are relative to the number of counted letters, not to
    ``len(text)``. Nothing is printed when no lowercase letter is present.

    Args:
        text: The string to analyze.

    Returns:
        None. The result is written to standard output.
    '''
    occurrences = {}
    for chara in text:
        # Comparing single-character strings compares their code points,
        # so this keeps exactly the range 'a'..'z'.
        if 'a' <= chara <= 'z':
            occurrences[chara] = occurrences.get(chara, 0) + 1

    # Number of counted letters; the denominator for every percentage.
    total = sum(occurrences.values())

    # Iterating over the sorted keys yields the letters alphabetically.
    for letter in sorted(occurrences):
        print(letter + ':' + str(occurrences[letter] / total * 100))

if __name__ == '__main__':
    # Read the file to analyze. The with-block closes the file even if
    # read() raises.
    with open('freq_sample') as f:
        text = f.read()
    frequency_analysis(text)
	# -*- coding: utf-8 -*-
	'''
	英文ファイルを読み込んで頻度分析を行うサンプル
	'''
	from collections import OrderedDict

	def frequency_analysis(text):
		'''
		Print the relative frequency of each lowercase ASCII letter in ``text``.

		Only the characters 'a' through 'z' are counted; every other character
		(uppercase letters, digits, whitespace, punctuation, non-ASCII text) is
		skipped. For each letter that occurs at least once, one line of the form
		``<letter>:<percentage>`` is written to standard output, in alphabetical
		order. Percentages are relative to the number of counted letters, not to
		``len(text)``. Nothing is printed when no lowercase letter is present.

		Args:
			text: The string to analyze.

		Returns:
			None. The result is written to standard output.
		'''
		occurrences = {}
		for chara in text:
			# Comparing single-character strings compares their code points,
			# so this keeps exactly the range 'a'..'z'.
			if 'a' <= chara <= 'z':
				occurrences[chara] = occurrences.get(chara, 0) + 1

		# Number of counted letters; the denominator for every percentage.
		total = sum(occurrences.values())

		# Iterating over the sorted keys yields the letters alphabetically.
		for letter in sorted(occurrences):
			print(letter + ':' + str(occurrences[letter] / total * 100))

	if __name__ == '__main__':
		# Read the file to analyze. The with-block closes the file even if
		# read() raises.
		with open('freq_sample') as f:
			text = f.read()
		frequency_analysis(text)