import random

# Print five pseudo-random floats; random.random() returns values in [0.0, 1.0).
for _ in range(5):
    print(random.random())

0.4026686653499624
0.491781417388341
0.43643160454313823
0.6269806578535505
0.8487585900005747


# Print five pseudo-random integers; randint(1, 5) can return either endpoint.
for _ in range(5):
    print(random.randint(1,5))

4
1
5
4
2


# Pick one element of l at random, five separate times. Each pick is
# independent, so the same value may be printed more than once.
l = [1, 2, 3, 4, 5]
for _ in range(5):
    print(random.choice(l))

5
1
3
1
1


# Print a list of two elements of l chosen without replacement.
print(random.sample(l, 2))

[3, 4]


import string

def dictSubtract(d1, d2):
    '''Return a dict whose keys are the keys of d1 that are missing from d2.

    Only the keys carry information: every value in the result is None.
    Keys appear in the same order as they do in d1.
    '''
    missing = (key for key in d1 if key not in d2)
    return dict.fromkeys(missing)

def processSubractFile(filename):
    '''Build a word-count histogram from the text file at filename.

    Each line of the file is handed to processSubtractLine, which updates
    the histogram in place. Returns the resulting dict.
    '''
    counts = {}
    with open(filename) as source:
        for textLine in source:
            processSubtractLine(textLine, counts)
    return counts


def processSubtractLine(line, hist):
    '''Count the words of line into the histogram hist, in place.

    Hyphens are treated as word separators. Each whitespace-separated
    token has leading and trailing punctuation stripped and is lowercased
    before it is counted; punctuation inside a token (such as the
    apostrophe in "sister's") is kept.

    line: one line of text.
    hist: dict mapping word -> count; updated in place.
    Returns None.
    '''
    strippable = string.punctuation + string.whitespace

    for token in line.replace('-', ' ').split():
        word = token.strip(strippable).lower()
        # A token made only of punctuation (a lone quote, "!!", ...) strips
        # down to '', which is not a word, so it must not be counted.
        if not word:
            continue
        hist[word] = 1 + hist.get(word, 0)

# Find the words that appear in the book (emma.txt) but not in the word
# list (words.txt).
bookWords = processSubractFile('emma.txt')
listWords = processSubractFile('words.txt')
d = dictSubtract(bookWords, listWords)

# Copy the keys into a list so the first ten can be sliced off for display.
l = list(d)
print(f'Found {len(d)} words. Here is a sample:')
for word in l[:10]:
    print(word)

Found 587 words. Here is a sample:
emma
woodhouse
a
sister's
remembrance
taylor
mr
woodhouse's
taylor's
emma's


import string

def processSetFile(filename):
    '''Return the set of distinct words found in the text file at filename.

    Every line of the file is passed to processSetLine, which adds that
    line's words to the set in place.
    '''
    seen = set()
    with open(filename) as source:
        for textLine in source:
            processSetLine(textLine, seen)
    return seen


def processSetLine(line, wordSet):
    '''Add the words of line to wordSet, in place.

    Hyphens are treated as word separators. Each whitespace-separated
    token has leading and trailing punctuation stripped and is lowercased
    before it is added; punctuation inside a token is kept.

    line: one line of text.
    wordSet: set of words; updated in place.
    Returns None.
    '''
    strippable = string.punctuation + string.whitespace

    for token in line.replace('-', ' ').split():
        word = token.strip(strippable).lower()
        # A token made only of punctuation strips down to '', which is not
        # a word; skipping it keeps the empty string out of the set.
        if word:
            wordSet.add(word)

# Set difference: the words in the book (emma.txt) that are not in the word
# list (words.txt).
bookWords = processSetFile('emma.txt')
listWords = processSetFile('words.txt')
s = bookWords - listWords

print(f'Found {len(s)} words. Here is a sample:')
# Sets cannot be sliced, so copy into a list first; the sample order is arbitrary.
l = list(s)
for word in l[:10]:
    print(word)

Found 587 words. Here is a sample:

humourist
recollect
tuesday
complimenter
unseasonableness
hetty
november
improvidently
smallridge


import random

def chooseFromHistogram(h):
    '''Return a random key of h, chosen with probability proportional to its count.

    h: dict mapping value -> frequency. Entries whose frequency is zero or
       negative are never chosen.
    Returns one key of h.
    Raises IndexError if h is empty or has no entry with a positive frequency.

    The draw is weighted directly, so the cost depends on the number of
    distinct keys rather than on the sum of all frequencies.
    '''
    candidates = [word for word, frequency in h.items() if frequency > 0]
    if not candidates:
        raise IndexError('Cannot choose from an empty histogram')

    weights = [h[word] for word in candidates]
    # random.choices always returns a list; k=1 gives a single-element list.
    return random.choices(candidates, weights=weights, k=1)[0]

# Sanity check: draw 10000 times from a histogram in which 'a' is twice as
# frequent as 'b' and tally the results; the counts should be roughly 2:1.
d = {}
h = {'a': 2, 'b': 1}

for _ in range(10000):
    letter = chooseFromHistogram(h)
    d[letter] = 1 + d.get(letter, 0)
print(d)

{'b': 3333, 'a': 6667}

Data Structures

Random Numbers

.random()

.randint()

.choice()

.sample()

Ex 1 - Choose from histogram

Dictionary Subtraction

Ex 1 - Solution - Choose from histogram

Practice problems

p1 - Convert to lowercase

p2 - Word Count

p3 - 20 Most Frequent Words