1. Miki Tebeka
  2. pythonwise


pythonwise / ll-freq.py

#!/usr/bin/env python
'''Show last letter frequency in English words'''

from urllib import urlopen
from collections import Counter
from matplotlib import pyplot as plt
import numpy as np

def get_words():
    '''Get list of dictionary words.'''
    # The North American Scrabble Tournament Word List (178,690 words)
    fo = urlopen('http://norvig.com/ngrams/TWL06.txt')
    return (w.strip() for w in fo)

def plot(freq, filename):
    '''Bar chart of last letter frequency.'''
    width = 0.35  # Bar width (also used for xticks positioning)

    idx = np.arange(len(freq))
    xs = sorted(freq)  # Letters in alphabetic order
    ys = [freq[x] for x in xs]  # Frequency

    plt.bar(idx, ys, width=width)
    plt.xticks(idx + width/2., xs)  # Annotate X axis
    plt.title('Last Letter Frequency')

if __name__ == '__main__':
    freq = Counter(w[-1].upper() for w in get_words())
    plot(freq, 'll-freq.png')