import doctest

# Build the squares of 0 through 9 with an explicit loop and append
nums = []
for i in range(10):
    nums.append(i ** 2)
nums

[0, 1, 4, 9, 16, 25, 36, 49, 64, 81]

[i for i in range(10)]

[0, 1, 2, 3, 4, 5, 6, 7, 8, 9]

[i ** 2 for i in range(10)]

[0, 1, 4, 9, 16, 25, 36, 49, 64, 81]

[i ** 2 for i in range(10) if i % 2 == 0]

[0, 4, 16, 36, 64]

words

['I', 'saw', 'a', 'dog', 'today']

words = "I saw a dog today".split()
# First character of each word that is at least two characters long
[word[0] for word in words if len(word) >= 2]

['s', 'd', 't']

def fun_numbers(start, stop):
    """
    Returns an increasing list of all fun numbers between start (inclusive) and stop (exclusive).
    A fun number is defined as a number that is either divisible by 2 or divisible by 5.

    >>> fun_numbers(2, 16)
    [2, 4, 5, 6, 8, 10, 12, 14, 15]
    >>> fun_numbers(5, 5)
    []
    """
    # Making list comprehensions more complicated---trade-off with code quality
    return [i for i in range(start, stop) if i % 2 == 0 or i % 5 == 0]


doctest.run_docstring_examples(fun_numbers, globals())
# "globals" is part of the "Python environment" model

# This list comprehension (at this level of complexity) is still
# relatively self-documenting
[i for i in range(start, stop) if i % 2 == 0 or i % 5 == 0]

1, 2, 3

(1, 2, 3)

1,2,3

(1, 2, 3)

print(2, 3)

2 3

example = 2, 3
print(example)

(2, 3)

print((2, 3))

(2, 3)

def first_two_letters(word):
    """
    Returns a 2-tuple holding the items at index 0 and index 1 of word.

    Raises IndexError when word has fewer than two items.
    """
    first = word[0]
    second = word[1]
    return (first, second)


# Tuple unpacking
a, b = first_two_letters("goodbye")
a

'g'

b

'o'

example = first_two_letters("goodbye")
example

('g', 'o')

example[1] = "hello"

---------------------------------------------------------------------------
TypeError                                 Traceback (most recent call last)
Cell In[30], line 1
----> 1 example[1] = "hello"

TypeError: 'tuple' object does not support item assignment

# Extended unpacking: the first three items bind to names, and the starred
# name collects everything left over as a list (even though the source is a tuple)
first, second, third, *rest = tuple([0] * 10)
first, second, third

(0, 0, 0)

rest

[0, 0, 0, 0, 0, 0, 0]

example = 1,
example

(1,)

1

1

# A set stores each distinct value at most once
nums = set()
nums.add(1)
nums.add(2)
nums.add(3)
nums.add(2) # duplicate ignored
nums.add(-1)
nums

{-1, 1, 2, 3}

nums[0]

---------------------------------------------------------------------------
TypeError                                 Traceback (most recent call last)
Cell In[49], line 1
----> 1 nums[0]

TypeError: 'set' object is not subscriptable

def count_unique(path):
    """
    Returns the number of distinct whitespace-separated tokens in the file at path.

    Tokens are compared exactly as they appear in the file; no case folding or
    punctuation stripping is applied.
    """
    # A set (instead of a list guarded by a "not in" check) ignores duplicates
    # on insertion, so no explicit membership test is needed.
    unique = set()
    with open(path) as f:
        # Iterate the file object directly so lines are read one at a time
        # instead of materializing the whole list with readlines().
        for line in f:
            unique.update(line.split())
    return len(unique)


%time count_unique("moby-dick.txt")

CPU times: user 53.5 ms, sys: 2.96 ms, total: 56.4 ms
Wall time: 55.4 ms

32553

# Pythonic programs utilize the properties of your structures to great effect!
def count_unique(path):
    """
    Returns the number of distinct whitespace-separated tokens in the file at path.
    """
    with open(path) as f:
        # split() with no arguments splits on any run of whitespace, newlines
        # included, so the whole file can be tokenized in one call and handed
        # straight to set() without a per-line loop or an intermediate list.
        return len(set(f.read().split()))


%time count_unique("moby-dick.txt")

CPU times: user 23.7 ms, sys: 7.19 ms, total: 30.9 ms
Wall time: 30.6 ms

32553

def area_codes(phone_numbers):
    """
    Returns the number of unique area codes in the given sequence.

    The area code of a phone number is the text before its first "-".

    >>> area_codes([
    ...    '123-456-7890',
    ...    '206-123-4567',
    ...    '123-000-0000',
    ...    '425-999-9999'
    ... ])
    3
    >>> area_codes([])
    0
    """
    # pn.split("-") ==> ["123", "456", "7890"], so index 0 is the area code.
    # A set comprehension collapses repeated area codes without building a list first.
    return len({pn.split("-")[0] for pn in phone_numbers})


doctest.run_docstring_examples(area_codes, globals())

def count_tokens(path):
    """
    Returns a dictionary mapping each whitespace-separated token in the file at
    path to the number of times that token occurs.
    """
    counts = {}
    with open(path) as f:
        tokens = f.read().split()
    for token in tokens:
        # get() supplies 0 the first time a token is seen
        counts[token] = counts.get(token, 0) + 1
    return counts


%time count_tokens("moby-dick.txt")

def count_tokens(path):
    """
    Returns a collections.Counter mapping each whitespace-separated token in the
    file at path to the number of times that token occurs.
    """
    from collections import Counter

    with open(path) as f:
        tokens = f.read().split()
        return Counter(tokens)


%time count_tokens("moby-dick.txt")

def count_lengths(words):
    """
    Returns a dictionary mapping each first character to the number of words
    in the given sequence that begin with it.

    NOTE(review): despite the name, words are grouped by first character, not
    by length -- confirm which behavior is intended.

    Raises IndexError if any word is empty.
    """
    counts = {}
    for word in words:
        initial = word[0]
        counts[initial] = counts.get(initial, 0) + 1
    return counts


count_lengths(['cats', 'dogs', 'deers'])

{'c': 1, 'd': 2}

Data Structures

List comprehensions

Practice: Fun numbers

Tuples

Sets

Practice: Area codes

Dictionaries

Practice: Count lengths