import pandas as pd

# Load the dataset, using the "Time" column as the index and asking pandas to parse the
# index values as dates (this is what makes seattle_air.index.year available below).
seattle_air = pd.read_csv("seattle_air.csv", index_col="Time", parse_dates=True)
# Group the rows by the year of their timestamp and count the non-missing values per column.
seattle_air.groupby(seattle_air.index.year).count()

# Every value in Python is an object; read_csv produced a DataFrame object.
type(seattle_air)

pandas.core.frame.DataFrame

seattle_air

# groupby on its own returns a DataFrameGroupBy object rather than a result table; a
# follow-up method such as count() is what produces the aggregated values.
seattle_air.groupby(seattle_air.index.year)

<pandas.core.groupby.generic.DataFrameGroupBy object at 0x78bb42ff3c70>

# Without inplace=True, dropna returns a new DataFrame; seattle_air itself is not modified.
seattle_air_nanremoved = seattle_air.dropna()

type(seattle_air_nanremoved)

pandas.core.frame.DataFrame

# With inplace=True, dropna modifies seattle_air itself and returns None.
seattle_air.dropna(inplace=True)

seattle_air

seattle_air.groupby([...]) # in a method call, the object before the dot (seattle_air) is passed as self

class DataFrame:
    """Represents two-dimensional tabular data structured around an index and column names.

    This is a simplified teaching model, not the real pandas class: every method prints a
    trace message when it is called, and ``[...]`` (a list holding ``Ellipsis``) stands in
    for values that a real implementation would compute.
    """

    def __init__(self, index, columns, data):
        """Initializes a new DataFrame object from the given index, columns, and tabular data."""
        print("Initializing DataFrame")
        self.index = index
        self.columns = columns
        self.data = data

    def dropna(self, inplace=False):
        """
        Drops all rows containing NaN from this DataFrame. If inplace, returns None and modifies
        self. If not inplace, returns a new DataFrame without modifying self.
        """
        print("Calling dropna")
        if inplace:
            # Mutate this object's own fields; callers holding a reference to it see the change.
            self.columns = [...]
            self.index = [...]
            self.data = [...]
            return None
        # Build a separate object (this also triggers the __init__ trace message).
        return DataFrame([...], [...], [...])

    def __getitem__(self, column_or_indexer):
        """Given a column or indexer, returns the selection as a new Series or DataFrame object.

        Python calls this method for square-bracket syntax: ``df[key]`` is ``df.__getitem__(key)``.
        """
        print("Calling __getitem__")
        if column_or_indexer in self.columns:
            return "Series" # placeholder for a Series
        # Anything that is not a known column name is treated as an indexer over rows.
        return DataFrame([...], [...], [...])

# my_object = DataFrame(...)

# Square-bracket indexing such as my_list[0] is shorthand for my_list.__getitem__(0).

# A list-like class could implement it along these lines:
# def __getitem__(self, index):
#     return self.data.at(index)

# "PM2.5" is in the columns list, so __getitem__ returns the "Series" placeholder.
example = DataFrame([0, 1, 2], ["PM2.5"], [10, 20, 30])
example["PM2.5"]

Initializing DataFrame
Calling __getitem__

'Series'

"stri\'ng"

"stri'ng"

my_dict = {}
my_list = [0, 1, 2]
# Intentionally raises TypeError: a list is unhashable, so it cannot be used as a dict key.
my_dict[my_list] = 3
# Dictionary keys are looked up through their __hash__() method, which lists do not support.

---------------------------------------------------------------------------
TypeError                                 Traceback (most recent call last)
Cell In[16], line 3
      1 my_dict = {}
      2 my_list = [0, 1, 2]
----> 3 my_dict[my_list] = 3

TypeError: unhashable type: 'list'

# A small in-memory CSV used to build an example DataFrame.
# NOTE(review): the name `csv` would shadow the standard-library csv module if that were
# imported in this notebook — confirm this is acceptable.
csv = """
Name,Hours
Diana,10
Thrisha,15
Yuxiang,20
Sheamin,12
"""

import io
# StringIO wraps the text so read_csv can read it like a file; "Name" becomes the index.
staff = pd.read_csv(io.StringIO(csv), index_col=["Name"])
# Two separate indexing steps: select the "Hours" column, then the "Thrisha" label within it.
staff["Hours"]["Thrisha"]

15

# Intentionally incorrect: self is not a variable at the top level, so this raises NameError.
# Python supplies self automatically from the object before the dot (staff).
staff.__getitem__(self, "Hours", "Thrisha")
column_or_indexer = (self, "Hours", "Thrisha")

---------------------------------------------------------------------------
NameError                                 Traceback (most recent call last)
Cell In[20], line 1
----> 1 staff.__getitem__(self, "Hours", "Thrisha")

NameError: name 'self' is not defined

# The explicit method-call spelling of staff["Hours"]; it returns the whole "Hours" column.
staff.__getitem__("Hours")

Name
Diana      10
Thrisha    15
Yuxiang    20
Sheamin    12
Name: Hours, dtype: int64

# The explicit method-call spelling of staff["Hours"]["Thrisha"]: one __getitem__ per bracket.
staff.__getitem__("Hours").__getitem__("Thrisha")

15

class Student:
    """A student with a student number, a name, and a schedule of courses and credits."""

    def __init__(self, student_number, file_to_schedule):
        """
        Initializes a student with the student number and their schedule.

        The file_to_schedule is expected to be of format "<name>.txt". The student's name is
        the part of file_to_schedule before the first ".". Each non-blank line of the file
        holds a course name and its integer credit count separated by whitespace.

        Raises ValueError if a non-blank line does not have exactly two fields or if the
        credit count is not an integer.
        """
        self._number = student_number
        self._name = file_to_schedule.split(".")[0]
        self.schedule = {}
        with open(file_to_schedule) as f:
            for line in f:
                # split() with no argument also discards the trailing newline, which
                # split(' ') would have left attached to the credit value.
                fields = line.split()
                if not fields:
                    # Tolerate blank lines (e.g. a trailing empty line at the end of the file).
                    continue
                course_name, course_credit = fields
                self.schedule[course_name] = int(course_credit)

    def get_name(self):
        """Returns this student's name."""
        return self._name

    def get_courses(self):
        """Returns a new list of the course names in this student's schedule, in file order."""
        return list(self.schedule)

    def __getitem__(self, course_name):
        """Returns the credits for course_name, enabling student[course_name].

        Raises KeyError if the course is not in the schedule.
        """
        return self.schedule[course_name]

# Builds a Student whose schedule is read from nicole.txt in the working directory.
nicole = Student(1234567, "nicole.txt")
# Relies on Student providing get_courses() and square-bracket indexing (__getitem__).
for course in nicole.get_courses():
    print(course, nicole[course])

nicole.get_name()

# Notebook-only setup (IPython shell and magic commands, not plain Python): install and
# load the nb_mypy extension.
!pip install -q nb_mypy
%reload_ext nb_mypy
# presumably turns on mypy's --strict checking for later cells — confirm against nb_mypy docs
%nb_mypy mypy-options --strict

class University:
    """A university with a name and a list of enrolled students.

    The interface is the one exercised by the calls in this notebook: a constructor taking
    a name and an optional list of students, enroll(student), and enrollments().
    """

    def __init__(self, name, students=None):
        """
        Initializes a university with the given name and, optionally, its initial students.

        The default for students is None rather than []: a default list would be created
        once and then shared by every University constructed without an explicit list.
        """
        self._name = name
        # Copy so that this university never shares a list object with the caller.
        self._students = [] if students is None else list(students)

    def enroll(self, student):
        """Adds the given student to this university's enrollments. Returns None."""
        self._students.append(student)

    def enrollments(self):
        """Returns a new list of the students enrolled in this university."""
        return list(self._students)


# A university created with an explicit list of students.
uw = University("Udub", [nicole])
uw.enrollments()

# Two universities created without passing a student list.
wsu = University("Wazzu")
wsu.enrollments()

sea_u = University("SeaU")
sea_u.enrollments()

sea_u.enroll(nicole)
sea_u.enrollments()

# Check wsu again after enrolling at sea_u: if nicole shows up here, the two objects are
# sharing one list — presumably the mutable-default-parameter pitfall; confirm.
wsu.enrollments()

	PM2.5
Time
2017	6283
2018	8540
2019	8597
2020	8683
2021	8664
2022	2292

	PM2.5
Time
2017-04-06 00:00:00	6.8
2017-04-06 01:00:00	5.3
2017-04-06 02:00:00	5.3
2017-04-06 03:00:00	5.6
2017-04-06 04:00:00	5.9
...	...
2022-04-06 19:00:00	5.1
2022-04-06 20:00:00	5.0
2022-04-06 21:00:00	5.3
2022-04-06 22:00:00	5.2
2022-04-06 23:00:00	5.2

	PM2.5
Time
2017-04-06 00:00:00	6.8
2017-04-06 01:00:00	5.3
2017-04-06 02:00:00	5.3
2017-04-06 03:00:00	5.6
2017-04-06 04:00:00	5.9
...	...
2022-04-06 19:00:00	5.1
2022-04-06 20:00:00	5.0
2022-04-06 21:00:00	5.3
2022-04-06 22:00:00	5.2
2022-04-06 23:00:00	5.2

Objects

Reference semantics

Defining classes

Practice: `Student` class

Type annotations

Practice: `University` class

Mutable default parameters

Objects

Reference semantics

Defining classes

Practice: Student class

Type annotations

Practice: University class

Mutable default parameters

Practice: `Student` class

Practice: `University` class