import doctest

# split() with no arguments breaks the string on whitespace into a list of words
example = "I really like dogs".split()
example[1] # Lists are a bit like dictionaries: you look up a value by its integer index

'really'

# Square brackets look up a value by key; dictionary must already be defined with an "a" key
dictionary["a"] # This gets the value associated with "a"

1

dictionary = {"a": 1, "b": 2, "c": 3}
for key in dictionary:
    print(key, dictionary[key]) # dictionary[key] gets value associated with key

a 1
b 2
c 3

dictionary = {"a": 1, "b": 2, "c": 3}
# keys() spells out that we loop over the keys; "for key in dictionary" visits the same keys
for key in dictionary.keys():
    print(key, dictionary[key]) # dictionary[key] gets value associated with key

a 1
b 2
c 3

dictionary = {"a": 1, "b": 2, "c": 3}
for value in dictionary.values():
    # Dictionaries do not have an easy way to go from values back to keys!
    print(value)

1
2
3

dictionary = {"a": 1, "b": 2, "c": 3}
# items() yields (key, value) pairs, which the loop unpacks into two variables
for key, value in dictionary.items():
    # No need to write value = dictionary[key]; the value arrives together with the key
    print(key, value)

a 1
b 2
c 3

def most_frequent(counts):
    """
    Finds the token with the largest count in a dictionary of token counts.

    Returns None when the dictionary is empty. If several tokens share the
    largest count, the one encountered first while iterating is returned.

    >>> most_frequent({"green": 2, "eggs": 6, "and": 3, "yam": 2})
    'eggs'
    >>> most_frequent({}) # None is not displayed as output

    """
    leader = None
    for token, tally in counts.items():
        if leader is None:
            # Nothing has been chosen yet. This check has to come before any
            # lookup: counts[leader] with leader still None raises a KeyError.
            leader = token
        elif tally > counts[leader]:
            # Strictly greater, so an equal count never replaces the leader
            leader = token
    return leader


doctest.run_docstring_examples(most_frequent, globals())

def most_frequent(counts):
    """
    Returns the token in the given dictionary with the highest count, or None if empty.

    >>> most_frequent({"green": 2, "eggs": 6, "and": 3, "yam": 2})
    'eggs'
    >>> most_frequent({}) # None is not displayed as output

    """
    max_word = None
    for word in counts:
        # Deliberately broken variant: the two sides of the "or" are swapped.
        # Python evaluates the left condition first and only skips the right one
        # when the left is already True (look up "short circuiting").
        # On the first iteration max_word is still None, so counts[max_word]
        # raises KeyError: None before "max_word is None" is ever checked.
        # An empty dictionary never enters the loop, so that case still returns None.
        if counts[word] > counts[max_word] or max_word is None:
            max_word = word
    return max_word


doctest.run_docstring_examples(most_frequent, globals())

**********************************************************************
File "__main__", line 5, in NoName
Failed example:
    most_frequent({"green": 2, "eggs": 6, "and": 3, "yam": 2})
Exception raised:
    Traceback (most recent call last):
      File "/opt/conda/lib/python3.10/doctest.py", line 1350, in __run
        exec(compile(example.source, filename, "single",
      File "<doctest NoName[0]>", line 1, in <module>
        most_frequent({"green": 2, "eggs": 6, "and": 3, "yam": 2})
      File "/tmp/ipykernel_190/3519406350.py", line 13, in most_frequent
        if counts[word] > counts[max_word] or max_word is None:
    KeyError: None

most_frequent({})

dictionary = {"a": 1, "b": 2, "c": 3}
for key, value in dictionary.items():
    print(key, value)

with open("poem.txt") as f:
    # enumerate supplies the line number, replacing a line_num variable that
    # would otherwise have to be created and incremented manually.
    # Looping over f directly reads one line at a time; no readlines() list is needed.
    for i, line in enumerate(f, start=1):
        # rstrip("\n") removes only a trailing newline, so a final line that has
        # no newline keeps its last character (line[:-1] would chop it off)
        print(i, line.rstrip("\n"))

1 she sells
2 sea
3 shells by
4 the sea shore

arabic_nums = [  1,    2,     3,    4,   5]
alpha_nums  = ["a",  "b",   "c",  "d", "e"]
roman_nums  = ["i", "ii", "iii", "iv", "v"]

# Zip iterates through each list at the same time
for arabic, alpha, roman in zip(arabic_nums, alpha_nums, roman_nums):
    print(arabic, alpha, roman)

1 a i
2 b ii
3 c iii
4 d iv
5 e v

staff = [
    {"Name": "Anna", "Hours": 20},
    {"Name": "Iris", "Hours": 15},
    {"Name": "Abiy", "Hours": 10},
    {"Name": "Gege", "Hours": 12},
]
staff

[{'Name': 'Anna', 'Hours': 20},
 {'Name': 'Iris', 'Hours': 15},
 {'Name': 'Abiy', 'Hours': 10},
 {'Name': 'Gege', 'Hours': 12}]

# Add up the "Hours" value from every dictionary in the staff list
total_hours = 0
for ta in staff: # Loop over the list
    # Each ta is one dictionary, so ta["Hours"] is that person's hours
    total_hours += ta["Hours"]
total_hours

57

# staff is a list, so finding a person by name means checking each dictionary in turn
for ta in staff:
    if ta["Name"] == "Iris":
        print(ta["Hours"])

15

# Raises TypeError: staff is a list, so it is indexed by integer position, not by a name
staff["Iris"]["Hours"]

---------------------------------------------------------------------------
TypeError                                 Traceback (most recent call last)
Cell In[20], line 1
----> 1 staff["Iris"]["Hours"]

TypeError: list indices must be integers or slices, not str

staff[1]["Hours"]

15

def largest_earthquake_place(path):
    """
    Reads the earthquake CSV file at path and returns the name of the place whose
    earthquake has the largest magnitude, or None if the file has no data rows.

    If several rows share the largest magnitude, the first of them is returned.

    >>> largest_earthquake_place("earthquakes.csv")
    'Northern Mariana Islands'
    """
    import pandas as pd

    # One dictionary per CSV row, keyed by column name
    quakes = pd.read_csv(path).to_dict("records")

    top_place = None
    top_magnitude = None
    for quake in quakes:
        if top_magnitude is None:
            # First row: there is nothing to compare against yet
            is_new_record = True
        else:
            is_new_record = quake["magnitude"] > top_magnitude
        if is_new_record:
            top_place = quake["name"]
            top_magnitude = quake["magnitude"]
    return top_place


doctest.run_docstring_examples(largest_earthquake_place, globals())

id	year	month	day	latitude	longitude	name	magnitude
nc72666881	2016	7	27	37.672	-121.619	California	1.43
us20006i0y	2016	7	27	21.515	94.572	Burma	4.9
nc72666891	2016	7	27	37.577	-118.859	California	0.06
nc72666896	2016	7	27	37.596	-118.995	California	0.4
nn00553447	2016	7	27	39.378	-119.845	Nevada	0.3

CSV Data

Dictionary functions

None in Python

Loop unpacking

Comma-separated values

Practice: Largest earthquake place

Name	Hours
Anna	20
Iris	15
Abiy	10
Gege	12