import doctest

# Read the whole file into one string and echo it. The with-block closes the
# file automatically once the indented body finishes.
with open("poem.txt") as f:
    content = f.read()
    # print adds its own newline after the file's contents.
    print(content)

she sells
sea
shells by
the sea shore

# Read the file as a list of lines and print them one at a time.
with open("poem.txt") as f:
    lines = f.readlines()
    # lines = ["she sells\n", "sea\n", "shells by\n", "the sea shore\n"]
    line_num = 1  # advanced once per line; this cell never prints it
    for line in lines:
        # Each line still carries its trailing "\n" (see the list above), and
        # nothing is sliced off here.
        print(line, end="") # end="" stops print from adding a second newline
        line_num += 1

she sells
sea
shells by
the sea shore

# end="" replaces print's default trailing newline with nothing, so the next
# print continues on the same output line with no separator in between.
print("Hello, my name is Kevin", end="")
print("My favorite course is CSE 163")

Hello, my name is KevinMy favorite course is CSE 163

# Called with no arguments, split() breaks the string on runs of whitespace and
# returns the pieces (tokens) as a list of strings.
"I really like dogs".split()

['I', 'really', 'like', 'dogs']

# For every line, print its number and token list, then the length of each token.
with open("poem.txt") as f:
    lines = f.readlines()
    # lines = ["she sells\n", "sea\n", "shells by\n", "the sea shore\n"]
    line_num = 1  # 1-based line counter, advanced at the end of each iteration
    for line in lines:
        # split() with no arguments separates on whitespace, so the trailing
        # "\n" never ends up inside a token.
        tokens = line.split()
        # line1: ["she", "sells"]
        print(line_num, tokens)
        for token in tokens:
            print(token, "has", len(token), "characters")
        line_num += 1

1 ['she', 'sells']
she has 3 characters
sells has 5 characters
2 ['sea']
sea has 3 characters
3 ['shells', 'by']
shells has 6 characters
by has 2 characters
4 ['the', 'sea', 'shore']
the has 3 characters
sea has 3 characters
shore has 5 characters

def count_odd(path):
    """
    Prints one row per line of the file at path: the 1-based line number, then
    the count of whitespace-separated tokens on that line whose length is odd.

    >>> count_odd("poem.txt")
    1 2
    2 1
    3 0
    4 3
    """
    with open(path) as f:
        for line_num, line in enumerate(f.readlines(), start=1):
            # len(token) % 2 is 1 for an odd-length token and 0 otherwise, so
            # summing it counts the odd-length tokens. The tally is computed
            # afresh for each line, so nothing carries over between lines.
            num_odd = sum(len(token) % 2 for token in line.split())
            # Exactly one print per line of the file.
            print(line_num, num_odd)


# Run the examples embedded in count_odd's docstring. Only failing examples are
# reported, so no output means every example passed.
doctest.run_docstring_examples(count_odd, globals())

def first_tokens(path):
    """
    Returns the first token in each line in the specified text file as a list of strings.

    Lines that contain no tokens (empty or whitespace-only lines) have no first
    token and are skipped.

    >>> first_tokens("poem.txt")
    ['she', 'sea', 'shells', 'the']
    """
    result = []
    with open(path) as f:
        for line in f:
            # split() with no arguments separates on whitespace, so the
            # trailing newline never ends up inside a token.
            tokens = line.split()
            if not tokens:
                # Indexing tokens[0] on an empty list would raise IndexError.
                continue
            # append adds the whole token as a single element. Writing
            # `result += tokens[0]` would instead extend the list with every
            # character of the string, one element per character.
            result.append(tokens[0])
    return result


# Run the examples embedded in first_tokens's docstring. A mismatch between the
# expected and actual value is printed as a "Failed example" report.
doctest.run_docstring_examples(first_tokens, globals())

**********************************************************************
File "__main__", line 5, in NoName
Failed example:
    first_tokens("poem.txt")
Expected:
    ['she', 'sea', 'shells', 'the']
Got:
    ['s', 'h', 'e', 's', 'e', 'a', 's', 'h', 'e', 'l', 'l', 's', 't', 'h', 'e']

result = []
# Same effect as: result += "she"
# extend iterates over its argument, and iterating over a string yields its
# characters, so each character becomes a separate list element.
result.extend("she")
result

['s', 'h', 'e']

result = []
# Same effect as: result.append("she")
# Wrapping the string in a one-element list makes += add the whole string as a
# single element instead of splitting it into characters.
result += ["she"]
result

['she']

File Processing

Opening files in Python

Line processing

Token processing

Practice: Count odd-length tokens

Debugging tips

Practice: Debugging first tokens