# Set up packages for lecture. Don't worry about understanding this code, but
# make sure to run it if you're following along.
import numpy as np
import babypandas as bpd
import pandas as pd
from matplotlib_inline.backend_inline import set_matplotlib_formats
import matplotlib.pyplot as plt
%reload_ext pandas_tutor
%set_pandas_tutor_options {'projectorMode': True}
set_matplotlib_formats("svg")
plt.style.use('fivethirtyeight')

# Keep printed output compact.
# NumPy: summarize arrays with more than 20 elements using "...", print floats
# with 2 digits after the decimal point, and suppress scientific notation for
# small values.
np.set_printoptions(threshold=20, precision=2, suppress=True)
# pandas: display at most 7 rows and 8 columns before truncating, and show
# floats with 2 decimal places.
pd.set_option("display.max_rows", 7)
pd.set_option("display.max_columns", 8)
pd.set_option("display.precision", 2)


# Simulate a fair coin flip
np.random.choice(['Heads', 'Tails'])

'Heads'


# Simulate a roll of a die
np.random.choice(np.arange(1, 7))

5


# Simulate 10 fair coin flips
np.random.choice(['Heads', 'Tails'], 10)

array(['Tails', 'Heads', 'Tails', 'Tails', 'Heads', 'Tails', 'Heads',
       'Heads', 'Heads', 'Tails'], dtype='<U5')


# Choose three colleges to win free HDH swag
colleges = ['Revelle', 'John Muir', 'Thurgood Marshall', 
            'Earl Warren', 'Eleanor Roosevelt', 'Sixth', 'Seventh']

# replace=False samples without replacement, so the same college
# cannot be selected more than once.
np.random.choice(colleges, 3, replace=False)

array(['Earl Warren', 'Eleanor Roosevelt', 'Seventh'], dtype='<U17')


coins = np.random.choice(['Heads', 'Tails'], 100)
coins

array(['Tails', 'Tails', 'Heads', ..., 'Heads', 'Heads', 'Tails'],
      dtype='<U5')


(coins == 'Heads').sum()

49


np.count_nonzero(coins == 'Heads') # counts the number of Trues in sequence

49


def coin_experiment():
    """Flip 100 fair coins once and return the number that came up 'Heads'."""
    flips = np.random.choice(['Heads', 'Tails'], 100)
    # Boolean mask: True wherever a flip landed on heads.
    landed_heads = flips == 'Heads'
    return np.count_nonzero(landed_heads)


coin_experiment()

59


head_counts = np.array([])
head_counts

array([], dtype=float64)


# np.append returns a new array rather than modifying head_counts in place,
# so the result has to be assigned back to the name.
head_counts = np.append(head_counts, 15)
head_counts

array([15.])


head_counts = np.append(head_counts, 25)
head_counts

array([15., 25.])


# Specify the number of repetitions
repetitions = 10000

# Create an empty array to store the results
# (np.array([]) has dtype float64, so the appended counts are stored as floats)
head_counts = np.array([])

for i in np.arange(repetitions):
    # For each repetition, run the experiment and add the result to head_counts
    head_count = coin_experiment()
    # np.append returns a new array, so reassign to keep the accumulated results
    head_counts = np.append(head_counts, head_count)


len(head_counts)

10000


head_counts

array([46., 59., 51., ..., 44., 49., 45.])


# In how many experiments was the number of heads >= 60?
at_least_60 = np.count_nonzero(head_counts >= 60)
at_least_60

289


# What is this as a proportion?
at_least_60 / repetitions

0.0289


# Can also use np.mean()! Why?
np.mean(head_counts >= 60)

0.0289


# The theoretical answer – don't worry about how or why this code works
# Each specific sequence of 100 fair flips has probability (1/2)**100, and
# math.comb(100, i) of those sequences contain exactly i heads. Summing over
# i = 60, 61, ..., 100 gives the probability of at least 60 heads.
import math
sum([math.comb(100, i) * (1 / 2) ** 100 for i in np.arange(60, 101)])

0.028443966820490392


# Density histogram of the simulated head counts, with bin edges
# 30, 31, ..., 69 (bins of width 1).
bpd.DataFrame().assign(
    Number_of_Heads=head_counts
).plot(kind='hist', bins=np.arange(30, 70), density=True, ec='w', figsize=(10, 5));
# Mark 60 heads, the cutoff used in the ">= 60" question.
plt.axvline(60, color='C1');


behind_picked_door = np.random.choice(['Car', 'Goat #1', 'Goat #2'])
behind_picked_door

'Goat #2'


# Decide which strategy ('Stay' or 'Switch') wins, given behind_picked_door.
#
# - Car behind the picked door: staying keeps the car.
# - Goat behind the picked door: Monty will reveal the other goat, so
#   switching wins.
winning_strategy = 'Stay' if behind_picked_door == 'Car' else 'Switch'


def simulate_monty_hall():
    """Simulate one Monty Hall game and return the strategy that wins it.

    The contestant's initial pick is drawn uniformly from the three doors.
    Returns 'Stay' if the car was behind the picked door, otherwise 'Switch'.
    """
    first_pick = np.random.choice(['Car', 'Goat #1', 'Goat #2'])

    # Staying only wins when the initial pick was already the car.
    if first_pick == 'Car':
        return 'Stay'

    # A goat was picked, so switching is the winning move.
    return 'Switch'


simulate_monty_hall()

'Switch'


# Number of simulated games
repetitions = 10000

# Start from an empty array; one winning strategy is appended per game
winning_strategies = np.array([])

for i in np.arange(repetitions):
    winning_strategy = simulate_monty_hall()
    # np.append returns a new array, so reassign to keep the accumulated results
    winning_strategies = np.append(winning_strategies, winning_strategy)


winning_strategies

array(['Stay', 'Stay', 'Stay', ..., 'Stay', 'Switch', 'Stay'],
      dtype='<U32')


winning_strategies

array(['Stay', 'Stay', 'Stay', ..., 'Stay', 'Switch', 'Stay'],
      dtype='<U32')


np.count_nonzero(winning_strategies == 'Switch')

6696


np.count_nonzero(winning_strategies == 'Switch') / repetitions

0.6696


np.count_nonzero(winning_strategies == 'Stay') / repetitions

0.3304


# Keep a running tally of 'Switch' wins instead of storing every game's result
switch_count = 0


for i in np.arange(repetitions):
    winning_strategy = simulate_monty_hall()
    # Only games in which switching wins increase the tally
    if winning_strategy == 'Switch':
        switch_count = switch_count + 1


switch_count / repetitions

0.6717


# Each game is won by exactly one of the two strategies, so the 'Stay'
# proportion is the complement of the 'Switch' proportion. Floating-point
# rounding in the subtraction can leave trailing digits in the displayed value.
1 - switch_count / repetitions

0.32830000000000004

Lecture 13 – Simulation¶

DSC 10, Fall 2022¶

Announcements¶

Midterm Exam details¶

Agenda¶

Simulation¶

Simulation¶

Making a random choice¶

Making multiple random choices¶

With replacement vs. without replacement¶

Example: What's the probability of getting 60 or more heads if we flip 100 coins?¶

Flipping coins¶

Step 1: Figure out how to do one experiment¶

Aside: Putting the experiment in a function¶

Step 2: Repeat the experiment¶

Step 2: Repeat the experiment¶

Step 3: Find the proportion of experiments in which the number of heads was 60 or more¶

Visualizing the distribution¶

Example: The "Monty Hall" Problem¶

The "Monty Hall" Problem¶

Concept Check ✅ – Answer at cc.dsc10.com¶

Let's see 🤔¶

Time to simulate!¶

Step 1: Simulate a single game¶

Step 1: Simulate a single game¶

Step 1: Simulate a single game¶

Step 1: Simulate a single game¶

Step 2: Play the game many times¶

Step 3: Count the proportion of wins for each strategy (stay or switch)¶

Alternate implementation¶

Marilyn vos Savant's column¶

Summary, next time¶

Simulation finds probabilities¶

The simulation "recipe"¶

What's next?¶

Lecture 13 – Simulation¶

DSC 10, Fall 2022¶

Announcements¶

Midterm Exam details¶

Agenda¶

Simulation¶

Simulation¶

Making a random choice¶

Making multiple random choices¶

With replacement vs. without replacement¶

Example: What's the probability of getting 60 or more heads if we flip 100 coins?¶

Flipping coins¶

Step 1: Figure out how to do one experiment¶

Aside: Putting the experiment in a function¶

Step 2: Repeat the experiment¶

Step 2: Repeat the experiment¶

Step 3: Find the proportion of experiments in which the number of heads was 60 or more¶

Visualizing the distribution¶

Example: The "Monty Hall" Problem¶

The "Monty Hall" Problem¶

Concept Check ✅ – Answer at cc.dsc10.com¶

Let's see 🤔¶

Time to simulate!¶

Step 1: Simulate a single game¶

Step 1: Simulate a single game¶

Step 1: Simulate a single game¶

Step 1: Simulate a single game¶

Step 2: Play the game many times¶

Step 3: Count the proportion of wins for each strategy (stay or switch)¶

Alternate implementation¶

Marilyn vos Savant's column¶

Summary, next time¶

Simulation finds probabilities¶

The simulation "recipe"¶

What's next?¶

Concept Check ✅ – Answer at cc.dsc10.com¶