import pandas as pd

# Load the CSV, using its "Time" column as the index and parsing it as dates.
seattle_air = pd.read_csv("seattle_air.csv", index_col="Time", parse_dates=True)
# Group rows by the year of the index and count the non-null values per column.
seattle_air.groupby(seattle_air.index.year).count()

# Display the DataFrame (notebook cell output).
seattle_air

# dropna() is called without inplace=True and its result is not assigned,
# so the returned DataFrame is only displayed and seattle_air is unchanged.
seattle_air.dropna()

# Display again to confirm the original object was not modified.
seattle_air

class DataFrame:
    """Represents two-dimensional tabular data structured around an index and column names.

    This is a simplified sketch used to illustrate how methods and reference
    semantics work; results are ``[...]`` placeholders rather than real data.
    Every method prints a trace message so the call order is visible.
    """

    def __init__(self, index, columns, data):
        """Initializes a new DataFrame object from the given index, columns, and tabular data."""
        print("Initializing DataFrame")
        self.index = index
        self.columns = columns
        self.data = data

    def dropna(self, inplace=False):
        """
        Drops all rows containing NaN from this DataFrame. If inplace, returns None and modifies
        self. If not inplace, returns a new DataFrame without modifying self.
        """
        print("Calling dropna")
        if not inplace:
            # Build a brand-new object; self keeps its current index/columns/data.
            return DataFrame([...], [...], [...])
        else:
            # Rebind this object's own fields, so every reference to it sees the change.
            self.columns = [...]
            self.index = [...]
            self.data = [...]
            return None

    def __getitem__(self, column_or_indexer):
        """Given a column or indexer, returns the selection as a new Series or DataFrame object.

        Called for square-bracket access such as ``df["PM2.5"]``. A value found
        in ``self.columns`` is treated as a column name; anything else is
        treated as an indexer.
        """
        print("Calling __getitem__")
        if column_or_indexer in self.columns:
            return "Series" # placeholder for a Series
        else:
            return DataFrame([...], [...], [...])

# Construct a small DataFrame; __init__ prints "Initializing DataFrame".
example = DataFrame([0, 1, 2], ["PM2.5"], [10, 20, 30])
# Square-bracket access is dispatched to DataFrame.__getitem__.
example["PM2.5"]

# Display the object (notebook cell output).
example

!pip install -q nb_mypy
%reload_ext nb_mypy
%nb_mypy mypy-options --strict

Version 1.0.5

class Student:
    """Represents a UW student with a name, number, and courses dictionary."""
    # Type annotations are ways to tell other programmers what the type of
    # each parameter and each return value will be! Documentation also does
    # a lot of this, but the advantage of using type annotations is that
    # Python (or, rather, mypy) is able to systematically double check your
    # work.

    def __init__(self, number: int, filename: str):
        """Initializes a new Student instance with the given number and filename."""
        # filename[:-4] gets the string "nicole" from "nicole.txt"
        self._name = filename[:-4]
        self._number = number
        self._courses = {}
        self._load_file()

    def _load_file(self, filename: str):
        # Load in the courses from the path
        with open(filename) as f:
            for line in f.readlines():
                course, credits = line.split()
                self.courses[course] = int(credits)

    # To fix incompatible return types for None, we need to specify None
    # can be returned by this function!
    def __getitem__(self, course: str) -> int | None:
        """Returns the number of credits the student is taking the given course."""
        if course not in self._courses:
            return None
        return self._courses[course]

    # For "generic type list" errors, we need to specify the type of
    # elements stored in the list using square brackets notation
    def get_courses(self) -> list[str]:
        """Return the list of courses the student is taking."""
        return list(self._courses)

    def get_name(self) -> str:
        return self._name

    def get_number(self) -> int:
        return self._number

    def __repr__(self) -> str:
        return f"Student({self._number}, '{self._name}.txt')"


# Build a Student from "nicole.txt" in the current working directory.
nicole = Student(1234567, "nicole.txt")
# nicole[course] goes through Student.__getitem__ to look up the credits.
for course in nicole.get_courses():
    print(course, nicole[course])

CSE163 4
PHIL100 4
CSE390HA 1

class University:
    """Represents a university with a name, its enrolled students, and per-course rosters.

    Attributes:
        name: The university's name.
        students: The enrolled students, in enrollment order.
        courses: Precomputed mapping from course name to the students taking it.
    """

    # Fix mutable default parameters: default to None and then reassign later.
    def __init__(self, name: str, students: list[Student] | None = None) -> None:
        """Initializes a new University with the given name and optional initial students."""
        self.name = name
        # Always build a fresh list: a shared default or the caller's own list
        # must not be mutated by later enroll() calls.
        self.students: list[Student] = [] if students is None else list(students)

        self.courses: dict[str, list[Student]] = {}
        for student in self.students:
            self._add_to_rosters(student)

    def _add_to_rosters(self, student: Student) -> None:
        """Records the student under every course they are taking."""
        for course in student.get_courses():
            # setdefault stores the new list in the dict before appending;
            # .get(course, []) would append to a throwaway list instead.
            self.courses.setdefault(course, []).append(student)

    def enrollments(self) -> list[Student]:
        """Returns a new list of the enrolled students sorted alphabetically by name."""
        # Student keeps its name private, so sort through the public accessor.
        return sorted(self.students, key=lambda student: student.get_name())

    def enroll(self, student: Student) -> None:
        """Enrolls the student and adds them to the roster of each of their courses."""
        self.students.append(student)
        # Keep the precomputed rosters in sync with self.students.
        self._add_to_rosters(student)

    def roster(self, course: str) -> list[Student]:
        """
        Return the students enrolled in the course.

        Returns an empty list for an unknown course. The result is a copy, so
        callers can modify it without corrupting the precomputed rosters.
        """
        return list(self.courses.get(course, []))


# Create a university whose initial student list contains only nicole.
uw = University("Udub", [nicole])
# uw.enrollments()
# A course that is not in uw.courses yields an empty roster.
print(uw.roster("CSE000"))
# Rosters are looked up in the mapping built in __init__, so repeated calls
# do not re-scan the student list.
print(uw.roster("CSE163"))
print(uw.roster("CSE163"))

[]
[Student(1234567, 'nicole.txt')]

# Four students that all load the same "nicole.txt" but have different numbers.
student_list = [nicole, Student(1234568, 'nicole.txt'), Student(0, 'nicole.txt'), Student(-100000, 'nicole.txt')]

# Sort ascending by student number, using a lambda as the key function.
sorted(student_list, key=lambda student: student.get_number())

[Student(-100000, 'nicole.txt'),
 Student(0, 'nicole.txt'),
 Student(1234567, 'nicole.txt'),
 Student(1234568, 'nicole.txt')]

def get_number(student: Student) -> int:
    """Returns the given student's number; intended as a named key function for sorted()."""
    # Student stores its number privately, so read it through the public accessor.
    return student.get_number()

# Same sort with a named key function instead of a lambda, in descending order.
sorted(student_list, key=get_number, reverse=True)

[Student(1234568, 'nicole.txt'),
 Student(1234567, 'nicole.txt'),
 Student(0, 'nicole.txt'),
 Student(-100000, 'nicole.txt')]

# No students argument is given, so __init__ receives students=None.
wsu = University("Wazzu")
wsu.enrollments()

[]

# A second university, also created without an initial student list.
seattle_u = University("SeattleU")
seattle_u.enrollments()

[]

# Enroll nicole at SeattleU only, then list SeattleU's students.
seattle_u.enroll(nicole)
seattle_u.enrollments()

[Student(1234567, 'nicole.txt')]

# Not expected: enrolling a student in SeattleU also enrolls them in WSU.
# This happens when __init__ uses a mutable default (students=[]): every
# instance created without an argument shares that one list. Defaulting to
# None and creating a new list inside __init__ gives each university its own.
wsu.enrollments()

[Student(1234567, 'nicole.txt')]

Objects¶

Reference semantics¶

Defining classes¶

Type annotations¶

Practice: `Student` class¶

Practice: `University` class¶

Mutable default parameters¶

Objects¶

Reference semantics¶

Defining classes¶

Type annotations¶

Practice: Student class¶

Practice: University class¶

Mutable default parameters¶

Practice: `Student` class¶

Practice: `University` class¶