# There will always be an import cell at the start of each lecture notebook.
# If you're coding alongside me in lecture, run it!
from lec_utils import *
def test_pt_example():
    """Show the embedded Python Tutor page for the list/string item-assignment example.

    The embedded program assigns into index 1 of a list and then into
    index 1 of a string. The frame is rendered 800 wide and 500 tall.
    """
    frame = IFrame(
        "https://pythontutor.com/iframe-embed.html#code=test_list%20%3D%20%5B8,%200,%202,%204%5D%0Atest_string%20%3D%20'zebra'%0Atest_list%5B1%5D%20%3D%2099%0Atest_string%5B1%5D%20%3D%20'f'&codeDivHeight=400&codeDivWidth=350&cumulative=false&curInstr=-1&heapPrimitives=nevernest&origin=opt-frontend.js&py=311&rawInputLstJSON=%5B%5D&textReferences=false",
        800,
        500,
    )
    display(frame)
def swap_pt():
    """Show the embedded Python Tutor page for the aliasing example.

    The embedded program rebinds an integer variable after copying it, then
    mutates a list through one of two names bound to it. The frame is
    rendered 800 wide and 500 tall.
    """
    frame = IFrame(
        "https://pythontutor.com/iframe-embed.html#code=x%20%3D%2042%0Ay%20%3D%20x%0Ax%20%3D%2012%0A%0Aa%20%3D%20%5B5,%2010%5D%0Ab%20%3D%20a%0Aa%5B0%5D%20%3D%20-1&codeDivHeight=400&codeDivWidth=350&cumulative=false&curInstr=-1&heapPrimitives=nevernest&origin=opt-frontend.js&py=311&rawInputLstJSON=%5B%5D&textReferences=false",
        800,
        500,
    )
    display(frame)
def mystery_pt():
    """Show the embedded Python Tutor page for the `mystery` function example.

    The embedded program defines `mystery(vals)` and calls it three times on
    the same list. The frame is rendered 800 wide and 500 tall.
    """
    frame = IFrame(
        "https://pythontutor.com/iframe-embed.html#code=def%20mystery%28vals%29%3A%0A%20%20%20%20vals%5B-1%5D%20%3D%2015%0A%20%20%20%20return%20vals.append%28'BBB'%29%0A%20%20%20%20%0Acreature%20%3D%20%5B1,%202,%203%5D%0A%0Amystery%28creature%29%0Amystery%28creature%29%0Amystery%28creature%29&codeDivHeight=400&codeDivWidth=350&cumulative=false&curInstr=-1&heapPrimitives=nevernest&origin=opt-frontend.js&py=311&rawInputLstJSON=%5B%5D&textReferences=false",
        800,
        500,
    )
    display(frame)

// Compiler error!
            int count = 7 + 9;
            count = "data science";

# Works just fine.
count = 7 + 9
count = "data science"
count

'data science'

type(count) # The type function returns the type of an object.

str

# This function takes in a single argument and returns that argument + 1 / 0.
# Python doesn't stop us from defining the function.
def f(x):
    return x + 1 / 0  # 1 / 0 is only evaluated when f is called; that call raises ZeroDivisionError.

f(15)

---------------------------------------------------------------------------
ZeroDivisionError                         Traceback (most recent call last)
Cell In[5], line 1
----> 1 f(15)

Cell In[4], line 4, in f(x)
      3 def f(x):
----> 4     return x + 1 / 0

ZeroDivisionError: division by zero

name: str = 'Junior'
name = 3.14

# We defined this a while ago, but it still remembers.
# This is a common pattern: writing the name of a variable in a cell of its own
# to check its value.
count

'data science'

# To illustrate the issue, run this cell and then delete it.
age = 23

# If the above cell has been run, this cell will run just fine, even if you 
# delete the cell above. However, once your notebook "forgets" all of 
# the variables it knows about, this cell will error, 
# since `age` won't be defined anywhere!
age + 15

38

# If you run the cell below first, then this cell will run just fine.
# However, once your notebook "forgets" all of the variables
# it knows about, and you run all of its cells in order,
# this will cause an error, because you are trying to use
# `weather` before it's defined!
weather - 4

---------------------------------------------------------------------------
NameError                                 Traceback (most recent call last)
Cell In[10], line 6
      1 # If you run the cell below first, then this cell will run just fine.
      2 # However, once your notebook "forgets" all of the variables
      3 # it knows about, and you run all of its cells in order,
      4 # this will cause an error, because you are trying to use
      5 # `weather` before it's defined!
----> 6 weather - 4

NameError: name 'weather' is not defined

# To illustrate the issue, run this cell FIRST, then the cell above.
weather = 72

min(2, 3)

2

min = 17

min(2, 3)

---------------------------------------------------------------------------
TypeError                                 Traceback (most recent call last)
Cell In[14], line 1
----> 1 min(2, 3)

TypeError: 'int' object is not callable

!ls imgs

annotations.png    humans-cpp.png     restart-kernel.png

mixed_list = [-2, 2.5, 'michigan', [1, 3], max] # Different types!
mixed_list

[-2, 2.5, 'michigan', [1, 3], <function max>]

max(['hey', 'hi', 'hello'])

'hi'

groceries = ['eggs', 'milk']
groceries

['eggs', 'milk']

groceries.append('bread')

groceries

['eggs', 'milk', 'bread']

groceries + ['yogurt'] # This is a new list, not a modification of groceries!

['eggs', 'milk', 'bread', 'yogurt']

nums = [3, 1, 'dog', -9.5, 'michigan']

nums[0]

3

nums[3]

-9.5

nums[-1] # Counts from the end.

'michigan'

nums[5]

---------------------------------------------------------------------------
IndexError                                Traceback (most recent call last)
Cell In[26], line 1
----> 1 nums[5]

IndexError: list index out of range

nums

[3, 1, 'dog', -9.5, 'michigan']

nums[1:3]

[1, 'dog']

nums

[3, 1, 'dog', -9.5, 'michigan']

nums[0:4]

[3, 1, 'dog', -9.5]

# If you don't include 'start', the slice starts at the beginning of the list.
nums[:4]

[3, 1, 'dog', -9.5]

# If you don't include 'stop', the slice goes until the end of the list.
nums[-2:]

[-9.5, 'michigan']

# Interesting...
nums[::-1]

['michigan', -9.5, 'dog', 1, 3]

university = 'university of michigan'

university[1]

'n'

university[11:13]

'of'

university[-8:]

'michigan'

university.title()

'University Of Michigan'

university.replace('i', 'I').split()

['unIversIty', 'of', 'mIchIgan']

test_list = [8, 0, 2, 4]
test_string = 'zebra'

id(test_list) # Memory address of test_list.

6069529792

id(test_string)

6069908784

test_list[1] = 99
test_list

[8, 99, 2, 4]

id(test_list) # Same memory address!

6069529792

test_string[1] = 'f'

---------------------------------------------------------------------------
TypeError                                 Traceback (most recent call last)
Cell In[45], line 1
----> 1 test_string[1] = 'f'

TypeError: 'str' object does not support item assignment

# Since we can't "change" test_string, we need to make a "new" string 
# containing the parts of it that we wanted.
# We can re-use the variable name test_string, though!
test_string = test_string[:1] + 'f' + test_string[2:]
test_string

'zfbra'

test_pt_example()

var_name = <some expression>

x = 42
y = x
x = 12
y

42

a = [5, 10]
b = a
a[0] = -1
b

[-1, 10]

swap_pt()

// Computes present_value * (1 + r)^months, where r = APR / 12 / 100.
double future_value(double present_value, double APR, int months) {
                double r = APR / 12.0 / 100.0;
                return present_value * pow(1 + r, months);
            }

def future_value(present_value, APR, months):
    """Return present_value multiplied by (1 + APR / 12 / 100) ** months."""
    monthly_rate = APR / 12 / 100
    growth_factor = (1 + monthly_rate) ** months
    return present_value * growth_factor

future_value(100, 7, 36)

123.29255874769281

# Module-level value read (not modified) inside square_and_cube.
total = 3


def square_and_cube(a, b):
    """Return a squared plus the global `total` raised to the power b."""
    squared = a ** 2
    powered = total ** b
    return squared + powered

def mystery(vals):
    """Overwrite the last element of vals with 15, then append 'BBB' in place.

    Returns whatever `vals.append` returns, which for a list is None.
    """
    vals[-1] = 15
    outcome = vals.append('BBB')
    return outcome

the
university
of
michigan
at
ann
arbor

0 the
1 university
2 of
3 michigan
4 at
5 ann
6 arbor

[4, 1, 81, 16, 9, 64]

[4, 16, 64]

[4, 0, 10, 16, 4, 64]

[4, 0, 10, 16, 4, 64]

{'name': 'Junior', 'age': 15, 4: ['kibble', 'treat']}

'Junior'

---------------------------------------------------------------------------
KeyError                                  Traceback (most recent call last)
Cell In[63], line 1
----> 1 dog['height']

KeyError: 'height'

{'name': 'Junior',
 'age': 15,
 4: ['kibble', 'treat'],
 'color': 'beige',
 'tricks': {'easy': ['roll over', 'paw'], 'medium': ['jump']}}

mystery_pt()

for value in "this is a string":

            for element in lst:                  # Assume lst is a list.

            for i in range(len(lst)):

sentence = ['the', 'university', 'of', 'michigan', 'at', 'ann', 'arbor']
# word is 'the', then 'university', then 'of', ...
for word in sentence:
    print(word)

the
university
of
michigan
at
ann
arbor

# i is 0, then 1, then 2, ...
# Depending on the problem, you may need to use the first pattern or this second pattern.
for i in range(len(sentence)):
    print(i, sentence[i])

0 the
1 university
2 of
3 michigan
4 at
5 ann
6 arbor

def double(vals):
    """Return a new list containing each element of vals multiplied by 2.

    vals itself is not modified.
    """
    new_vals = []
    for val in vals:
        # Double the current element (val), not the whole input list (vals).
        new_vals.append(val * 2)
    return new_vals

vals = [2, -1, 9, 4, 3, 8]

[val ** 2 for val in vals]

[4, 1, 81, 16, 9, 64]

[val ** 2 for val in vals if val % 2 == 0]

[4, 16, 64]

[val ** 2 if val % 2 == 0 else val + 1 for val in vals]

[4, 0, 10, 16, 4, 64]

new_vals = []
for val in vals:
    if val % 2 == 0:
        new_vals.append(val ** 2)
    else:
        new_vals.append(val + 1)
new_vals

[4, 0, 10, 16, 4, 64]

dog = {'name': 'Junior', 
       'age': 15, 
       4: ['kibble', 'treat']}
dog

{'name': 'Junior', 'age': 15, 4: ['kibble', 'treat']}

dog['name']

'Junior'

dog['height']

---------------------------------------------------------------------------
KeyError                                  Traceback (most recent call last)
Cell In[63], line 1
----> 1 dog['height']

KeyError: 'height'

dog['color'] = 'beige'
dog['tricks'] = {
    'easy': ['roll over', 'paw'],
    'medium': ['jump']
}

dog

{'name': 'Junior',
 'age': 15,
 4: ['kibble', 'treat'],
 'color': 'beige',
 'tricks': {'easy': ['roll over', 'paw'], 'medium': ['jump']}}

# Here, we're trying to add a value with a key of [1, 2].
# Since [1, 2] is mutable, it can't be used as a key.
dog[[1, 2]] = 'does this work?'

---------------------------------------------------------------------------
TypeError                                 Traceback (most recent call last)
Cell In[66], line 3
      1 # Here, we're trying to add a value with a key of [1, 2].
      2 # Since [1, 2] is mutable, it can't be used as a key.
----> 3 dog[[1, 2]] = 'does this work?'

TypeError: unhashable type: 'list'

# Build a lookup from integer area code to state name.
# Each line of the file is split on ' — ' (an em dash surrounded by spaces)
# into the code and the state.
codes_dict = {}
# Use a context manager so the file handle is closed once it has been read.
with open('data/areacodes.txt', 'r') as f:
    s = f.read()
# [:-1] drops the final piece of the split
# (presumably the empty string after a trailing newline — confirm against the data file).
for line in s.split('\n')[:-1]:
    code, state = line.split(' — ')
    codes_dict[int(code)] = state

codes_dict = {...
208: 'Idaho',
209: 'California',
210: 'Texas',
212: 'New York',
213: 'California',
...}

states_dict = {}
...

YouTubeVideo('IaEuWJCcwjk')

	Python	C++
Do I need to define the type of a variable beforehand?	No. Python is dynamically typed.	Yes. C++ is statically typed.
Do I compile my code before running it?	No. Python is interpreted; Python code is converted to bytecode line-by-line at runtime. In fact, the standard implementation of Python is written in C (called CPython).	Yes. The entirety of a C++ program needs to be compiled to machine code before it's run. This is part of why C++ is much faster than Python.

Lecture 2¶

Python Basics¶

EECS 398: Practical Data Science, Spring 2025¶

Agenda 📆¶

Following along¶

Notebooks, variables, lists, and strings¶

Variable types and code compilation¶

Variable types and compilers¶

Jupyter memory model¶

Restarting the kernel¶

Aside: Terminal commands in Jupyter Notebooks¶

Data structures¶

Lists¶

Appending¶

Indexing¶

Slicing¶

Strings and slicing¶

Immutability¶

Aside: Python Tutor¶

The swap¶

Functions and loops¶

Indentation and control flow¶

Activity

Activity

Aside: Workflow¶

`for`-loops in Python¶

Warning ⚠️¶

List comprehension¶

Dictionaries¶

Pre-activity setup¶

Activity

Walkthrough video of area codes example¶

What's next?¶

Lecture 2¶

Python Basics¶

EECS 398: Practical Data Science, Spring 2025¶

Agenda 📆¶

Following along¶

Notebooks, variables, lists, and strings¶

Variable types and code compilation¶

Variable types and compilers¶

Jupyter memory model¶

Restarting the kernel¶

Aside: Terminal commands in Jupyter Notebooks¶

Data structures¶

Lists¶

Appending¶

Indexing¶

Slicing¶

Strings and slicing¶

Immutability¶

Aside: Python Tutor¶

The swap¶

Functions and loops¶

Indentation and control flow¶

Activity

Activity

Aside: Workflow¶

for-loops in Python¶

Warning ⚠️¶

List comprehension¶

Dictionaries¶

Pre-activity setup¶

Activity

Walkthrough video of area codes example¶

What's next?¶

`for`-loops in Python¶