# ignore

# If this is the first time you are opening a notebook, please read this.
#
# Interaction basics
# ------------------
#
# * The notebook is composed of _code cells_ (like this one) and
#   _text cells_ (like the one above).
# 
# * To interact with the notebook, click into a cell (or type `Return`) 
#   and start editing. Type `Shift+Return` to execute the code, or 
#   `Esc` to leave without executing it.
# 
# * Since code cells depend on earlier cells, you will have to execute
#   those first - beginning from the top of the notebook.
# 
# * You can change code (and text) at your leisure to try out alternatives.
#   In Jupyter, use `b` to add a new cell below, and `Return` to enter it.
#   Type `x` to delete (cut) a cell, and `z` to undo this.
# 
# * There's a `Help` menu at the top of Jupyter Notebook. Enjoy!
#
#
# `# ignore` markers
# ------------------
#
# * In the notebook, there are some extra code cells starting with `# ignore`
#   (like this one, actually). These are code blocks used to create diagrams,
#   run tests, create or tear down special environments or more - code blocks
#   that are not necessary for reading (but for creation).
#
#
# `# type: ignore` markers
# ------------------------
#
# * In the notebook, some lines come with a comment `# type: ignore`. This tells
#   static code checkers to ignore any typing errors in that line. Most frequently,
#   this is used to mark untyped Python code (as in our examples) such that the
#   static code checker does not mark it as erroneous.

This is <em>emphasized</em>.

Here's some <strong>strong argument</strong>.

def remove_html_markup(s):  # type: ignore
    """Return `s` with everything between `<` and `>` left out.

    A two-state scanner: `<` switches into markup, `>` switches out of
    it, and only characters seen outside markup are kept. Quotes get no
    special treatment in this version.
    """
    tag = False
    kept = []

    for c in s:
        if c == '<':
            tag = True      # start of markup
            continue
        if c == '>':
            tag = False     # end of markup
            continue
        if not tag:
            kept.append(c)

    return "".join(kept)

Here's some <strong>strong argument</strong>.

remove_html_markup("Here's some <strong>strong argument</strong>.")

"Here's some strong argument."

assert remove_html_markup("Here's some <strong>strong argument</strong>.") == \
    "Here's some strong argument."

<input type="text" value="<your name>">

remove_html_markup('<input type="text" value="<your name>">')

'"'

with ExpectError():
    assert remove_html_markup('<input type="text" value="<your name>">') == ""

Traceback (most recent call last):
  File "/var/folders/n2/xd9445p97rb3xh7m1dfx8_4h0006ts/T/ipykernel_92822/145241764.py", line 2, in <module>
    assert remove_html_markup('<input type="text" value="<your name>">') == ""
           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
AssertionError (expected)

# ignore
# Marks appended to diagram labels for passing / failing elements.
PASS = "✔"
FAIL = "✘"

# Colors used for passing / failing nodes and labels in the diagrams.
PASS_COLOR = 'darkgreen'  # '#006400' # darkgreen
FAIL_COLOR = 'red4'  # '#8B0000' # darkred

# Default node fill color and font shared by all diagrams (see graph()).
STEP_COLOR = 'peachpuff'
FONT_NAME = 'Raleway'

# ignore
def graph(comment: str = "default") -> Digraph:
    """Create an empty, unnamed `Digraph` with the notebook's shared styling.

    The graph is laid out left to right; nodes are filled with
    `STEP_COLOR`, and both nodes and edges use `FONT_NAME`.

    :param comment: passed through as the graph's `comment`.
    :return: the freshly created `Digraph`.
    """
    layout = {'rankdir': 'LR'}
    node_style = {
        'style': 'filled',
        'fillcolor': STEP_COLOR,
        'fontname': FONT_NAME,
    }
    edge_style = {'fontname': FONT_NAME}

    return Digraph(name='', comment=comment, graph_attr=layout,
                   node_attr=node_style, edge_attr=edge_style)

# ignore
# State diagram of the first remove_html_markup(): a 'Start' entry node and
# the two states '¬ tag' (outside markup) and 'tag' (inside markup).
state_machine = graph()
state_machine.node('Start', )
state_machine.edge('Start', '¬ tag')
# Outside markup: any character other than '<' is added to the output ...
state_machine.edge('¬ tag', '¬ tag', label=" ¬ '<'\\nadd character")
# ... and a '>' also stays in '¬ tag'.
# NOTE(review): the ':s' suffix presumably selects the south port of '¬ tag'
# so that this second self-loop is drawn separately - confirm against the
# graphviz port syntax.
state_machine.edge('¬ tag:s', '¬ tag', label="'>'")
# '<' enters markup; '>' leaves it; anything else stays inside.
state_machine.edge('¬ tag', 'tag', label="'<'")
state_machine.edge('tag', '¬ tag', label="'>'")
state_machine.edge('tag', 'tag', label="¬ '>'")

# ignore
display(state_machine)

<input type="text" value="<your name>">

# ignore
# State diagram extended by a `quote` flag. Each state name combines both
# flags: '¬ quote / ¬ tag', '¬ quote / tag', and 'quote / tag'.
state_machine = graph()
state_machine.node('Start')
state_machine.edge('Start', '¬ quote\\n¬ tag')
# Outside markup: everything except '<' is added to the output.
state_machine.edge('¬ quote\\n¬ tag', '¬ quote\\n¬ tag',
                   label="¬ '<'\\nadd character")
# '<' enters markup (still unquoted).
state_machine.edge('¬ quote\\n¬ tag', '¬ quote\\ntag', label="'<'")
# Inside markup, a double quote opens a quoted section; other characters
# except '>' keep the state.
state_machine.edge('¬ quote\\ntag', 'quote\\ntag', label="'\"'")
state_machine.edge('¬ quote\\ntag', '¬ quote\\ntag', label="¬ '\"' ∧ ¬ '>'")
# Inside a quoted section, only another double quote leaves it.
state_machine.edge('quote\\ntag', 'quote\\ntag', label="¬ '\"'")
state_machine.edge('quote\\ntag', '¬ quote\\ntag', label="'\"'")
# An unquoted '>' leaves markup.
state_machine.edge('¬ quote\\ntag', '¬ quote\\n¬ tag', label="'>'")

# ignore
display(state_machine)

def remove_html_markup(s):  # type: ignore
    """Return `s` without markup, tracking a `quote` flag next to `tag`.

    While `quote` is set, `<` and `>` are not treated as markup
    delimiters. Characters are kept only while `tag` is not set and none
    of the earlier branches applies. The quote-toggling condition is kept
    exactly in the form quoted elsewhere in this notebook.
    """
    tag = quote = False
    kept = []

    for c in s:
        if c == '<' and not quote:
            tag = True
        elif c == '>' and not quote:
            tag = False
        elif c == '"' or c == "'" and tag:
            quote = not quote
        elif not tag:
            kept.append(c)

    return "".join(kept)

remove_html_markup('<input type="text" value="<your name>">')

''

assert remove_html_markup("Here's some <strong>strong argument</strong>.") == \
    "Here's some strong argument."

assert remove_html_markup('<input type="text" value="<your name>">') == ""

<b>foo</b>
<b>"foo"</b>
"<b>foo</b>"
<"b">foo</"b">

with ExpectError():
    assert remove_html_markup('<b>foo</b>') == 'foo'

with ExpectError():
    assert remove_html_markup('<b>"foo"</b>') == '"foo"'

Traceback (most recent call last):
  File "/var/folders/n2/xd9445p97rb3xh7m1dfx8_4h0006ts/T/ipykernel_92822/4031927246.py", line 2, in <module>
    assert remove_html_markup('<b>"foo"</b>') == '"foo"'
           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
AssertionError (expected)

with ExpectError():
    assert remove_html_markup('"<b>foo</b>"') == '"foo"'

Traceback (most recent call last):
  File "/var/folders/n2/xd9445p97rb3xh7m1dfx8_4h0006ts/T/ipykernel_92822/242211734.py", line 2, in <module>
    assert remove_html_markup('"<b>foo</b>"') == '"foo"'
           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
AssertionError (expected)

with ExpectError():
    assert remove_html_markup('<"b">foo</"b">') == 'foo'

def remove_html_markup_with_print(s):  # type: ignore
    """Same scanner as `remove_html_markup()`, tracing every iteration.

    Before each character is processed, one line is printed showing the
    character (`c`) and the current values of `tag` and `quote`.
    Returns the stripped string.
    """
    tag = quote = False
    kept = []

    for c in s:
        # State *before* this character takes effect
        print("c =", repr(c), "tag =", tag, "quote =", quote)

        if c == '<' and not quote:
            tag = True
        elif c == '>' and not quote:
            tag = False
        elif c == '"' or c == "'" and tag:
            quote = not quote
        elif not tag:
            kept.append(c)

    return "".join(kept)

remove_html_markup_with_print('<b>"foo"</b>')

c = '<' tag = False quote = False
c = 'b' tag = True quote = False
c = '>' tag = True quote = False
c = '"' tag = False quote = False
c = 'f' tag = False quote = True
c = 'o' tag = False quote = True
c = 'o' tag = False quote = True
c = '"' tag = False quote = True
c = '<' tag = False quote = False
c = '/' tag = True quote = False
c = 'b' tag = True quote = False
c = '>' tag = True quote = False

'foo'

def remove_html_markup_without_quotes(s):  # type: ignore
    """Variant of `remove_html_markup()` with the quote checks disabled.

    `<` and `>` always switch `tag` on and off here; the `quote` flag is
    still toggled but no longer consulted (the checks are commented out).
    """
    tag = quote = False
    kept = []

    for c in s:
        if c == '<':  # and not quote:
            tag = True
        elif c == '>':  # and not quote:
            tag = False
        elif c == '"' or c == "'" and tag:
            quote = not quote
        elif not tag:
            kept.append(c)

    return "".join(kept)

assert remove_html_markup_without_quotes('<b id="bar">foo</b>') == 'foo'

with ExpectError():
    assert remove_html_markup_without_quotes('<b>"foo"</b>') == '"foo"'

Traceback (most recent call last):
  File "/var/folders/n2/xd9445p97rb3xh7m1dfx8_4h0006ts/T/ipykernel_92822/3864559921.py", line 2, in <module>
    assert remove_html_markup_without_quotes('<b>"foo"</b>') == '"foo"'
           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
AssertionError (expected)

def remove_html_markup_fixed(s):  # type: ignore
    """Special-case one known input instead of changing the scanner logic.

    Returns `'"foo"'` when `s` is exactly `'<b>"foo"</b>'`. The `...`
    stands in for the rest of the body, which is not spelled out here;
    as written, every other input yields `None`.
    """
    if s == '<b>"foo"</b>':
        return '"foo"'
    ...

# ignore
from typing import List, Optional

# ignore
def execution_diagram(show_steps: bool = True,
                      variables: Optional[List[str]] = None,
                      steps: int = 3, error_step: int = 666,
                      until: int = 666,
                      fault_path: Optional[List[str]] = None) -> None:
    """Display an execution as a chain Input -> State 1 -> ... -> Output.

    The diagram is built with `graph()` and shown via `display()`;
    nothing is returned.

    :param show_steps: if set, label each edge with "Step N" (the edge of
        `error_step` is additionally marked as failing).
    :param variables: names of the variables making up each state. If
        empty or `None`, each state is a single box; otherwise each state
        is a record node with one field per variable.
    :param steps: number of steps (and hence states) in the execution.
    :param error_step: states from this step onwards are marked as
        failing; the output is marked as failing unless
        `error_step > steps`. The default is simply larger than any step
        count used, i.e. "no error".
    :param until: draw only the states of steps below `until`; the output
        node is drawn only if `until > steps + 1`. The default is larger
        than any step count used, i.e. "draw everything".
    :param fault_path: entries of the form `'s<step>:<variable>'`. A
        listed variable is marked with a cross in its state, and edges
        attach to these fields rather than to the state as a whole.
    """
    # `None` stands for "empty"; this avoids mutable default arguments.
    if variables is None:
        variables = []
    if fault_path is None:
        fault_path = []

    dot = graph()

    dot.node('input', shape='none', fillcolor='white', label=f"Input {PASS}",
             fontcolor=PASS_COLOR)
    last_outgoing_states = ['input']

    for step in range(1, min(steps + 1, until)):

        # Only the edge of the erroneous step itself is highlighted
        step_color: Optional[str]
        if step == error_step:
            step_label = f'Step {step} {FAIL}'
            step_color = FAIL_COLOR
        else:
            step_label = f'Step {step}'
            step_color = None

        # Every state from the erroneous step onwards is marked as failing
        if step >= error_step:
            state_label = f'State {step} {FAIL}'
            state_color = FAIL_COLOR
        else:
            state_label = f'State {step} {PASS}'
            state_color = PASS_COLOR

        state_name = f's{step}'
        outgoing_states = []
        incoming_states = []

        if not variables:
            dot.node(name=state_name, shape='box',
                     label=state_label, color=state_color,
                     fontcolor=state_color)
        else:
            var_labels = []
            for v in variables:
                vpath = f's{step}:{v}'
                if vpath in fault_path:
                    # Faulty variable: edges go to and from this field
                    var_label = f'<{v}>{v} ✘'
                    outgoing_states.append(vpath)
                    incoming_states.append(vpath)
                else:
                    var_label = f'<{v}>{v}'
                var_labels.append(var_label)
            record_string = " | ".join(var_labels)
            dot.node(name=state_name, shape='record',
                     label=nohtml(record_string), color=state_color,
                     fontcolor=state_color)

        # Without faulty variables, connect the state as a whole
        if not outgoing_states:
            outgoing_states = [state_name]
        if not incoming_states:
            incoming_states = [state_name]

        for outgoing_state in last_outgoing_states:
            for incoming_state in incoming_states:
                if show_steps:
                    dot.edge(outgoing_state, incoming_state,
                             label=step_label, fontcolor=step_color)
                else:
                    dot.edge(outgoing_state, incoming_state)

        last_outgoing_states = outgoing_states

    if until > steps + 1:
        # Show output
        if error_step > steps:
            dot.node('output', shape='none', fillcolor='white',
                     label=f"Output {PASS}", fontcolor=PASS_COLOR)
        else:
            dot.node('output', shape='none', fillcolor='white',
                     label=f"Output {FAIL}", fontcolor=FAIL_COLOR)

        for outgoing_state in last_outgoing_states:
            # With no intermediate states, the single edge is the execution
            label = "Execution" if steps == 0 else None
            dot.edge(outgoing_state, 'output', label=label)

    display(dot)

# ignore
# With `steps=0`, the whole run is one "Execution" edge from the input to
# the output; `error_step=0` marks the output as failing.
execution_diagram(show_steps=False, steps=0, error_step=0)

# ignore
# Build up the diagram piece by piece (`until` = 1..5), without step labels;
# states from step 2 onwards are marked as failing.
for until in range(1, 6):
    execution_diagram(show_steps=False, until=until, error_step=2)

# ignore
# Same sequence, now with the edges labeled "Step N".
for until in range(1, 6):
    execution_diagram(show_steps=True, until=until, error_step=2)

# ignore
# Same sequence with three variables per state; `var2` is marked as faulty
# in states 2 and 3.
for until in range(1, 6):
    execution_diagram(show_steps=True, variables=['var1', 'var2', 'var3'],
                      error_step=2,
                      until=until, fault_path=['s2:var2', 's3:var2'])

# ignore
# Diagram of the hypothesis / prediction / experiment / observation cycle.
dot = graph()

dot.node('Hypothesis')
dot.node('Observation')
dot.node('Prediction')
dot.node('Experiment')

# NOTE(review): the label is wrapped in '<...>' and uses <BR/> and <I>,
# presumably graphviz HTML-like label syntax; `dir='back'` presumably draws
# the arrowhead at the 'Hypothesis' end - confirm against the graphviz docs.
dot.edge('Hypothesis', 'Observation',
         label="<Hypothesis<BR/>is <I>supported:</I><BR/>Refine it>",
         dir='back')
dot.edge('Hypothesis', 'Prediction')

# Inputs feeding into the hypothesis, drawn without a node outline.
dot.node('Problem Report', shape='none', fillcolor='white')
dot.edge('Problem Report', 'Hypothesis')

dot.node('Code', shape='none', fillcolor='white')
dot.edge('Code', 'Hypothesis')

dot.node('Runs', shape='none', fillcolor='white')
dot.edge('Runs', 'Hypothesis')

dot.node('More Runs', shape='none', fillcolor='white')
dot.edge('More Runs', 'Hypothesis')

# The remaining edges of the cycle.
dot.edge('Prediction', 'Experiment')
dot.edge('Experiment', 'Observation')
dot.edge('Observation', 'Hypothesis',
         label="<Hypothesis<BR/>is <I>rejected:</I><BR/>Seek alternative>")

# ignore
display(dot)

# Run the current remove_html_markup() on four sample inputs and print one
# row per input: 1-based index, the input, and the result.
for i, html in enumerate(['<b>foo</b>',
                          '<b>"foo"</b>',
                          '"<b>foo</b>"',
                          '<b id="bar">foo</b>']):
    result = remove_html_markup(html)
    # Index and input are left-justified in 2- and 15-character columns
    print("%-2d %-15s %s" % (i + 1, html, result))

1  <b>foo</b>      foo
2  <b>"foo"</b>    foo
3  "<b>foo</b>"    <b>foo</b>
4  <b id="bar">foo</b> foo

quiz("From the difference between success and failure,"
     " we can already devise some observations about "
     " what is wrong with the output."
     " Which of these can we turn into general hypotheses?",
    [
        "Double quotes (`\"`) are stripped from the tagged input.",
        "Tags in double quotes are not stripped.",
        "The tag `<>` is always stripped from the input.",
        "Four-letter words are stripped."
    ], '[298 % 33, 1234 % 616]')

"foo"

remove_html_markup('"foo"')

'foo'

elif c == '"' or c == "'" and tag:
    quote = not quote

assert cond

def remove_html_markup_with_tag_assert(s):  # type: ignore
    """Scanner variant that asserts `tag` is unset before each character.

    Used as an experiment: the assertion fails as soon as a character is
    processed while `tag` is set. Returns the stripped string otherwise.
    """
    tag = quote = False
    kept = []

    for c in s:
        assert not tag  # <=== Just added

        if c == '<' and not quote:
            tag = True
        elif c == '>' and not quote:
            tag = False
        elif c == '"' or c == "'" and tag:
            quote = not quote
        elif not tag:
            kept.append(c)

    return "".join(kept)

# remove_html_markup_with_tag_assert('"foo"')

quiz("What happens after inserting the above assertion?",
    [
        "The program raises an exception. (i.e., `tag` is set)",
        "The output is as before, i.e., `foo` without quotes."
        " (which means that `tag` is not set)"
    ], 2)

with ExpectError():
    result = remove_html_markup_with_tag_assert('"foo"')
result

'foo'

elif c == '"' or c == "'" and tag:
    quote = not quote

def remove_html_markup_with_quote_assert(s):  # type: ignore
    """Scanner variant that fails as soon as the quote branch is taken.

    Used as an experiment: an `AssertionError` shows that the quote
    condition held for some character of `s`. Returns the stripped
    string if the branch is never reached.
    """
    tag = quote = False
    kept = []

    for c in s:
        if c == '<' and not quote:
            tag = True
        elif c == '>' and not quote:
            tag = False
        elif c == '"' or c == "'" and tag:
            assert False  # <=== Just added
            quote = not quote
        elif not tag:
            kept.append(c)

    return "".join(kept)

# remove_html_markup_with_quote_assert('"foo"')

quiz("What happens after inserting the 'assert' tag?",
    [
        "The program raises an exception (i.e., the quote condition holds)",
        "The output is still foo (i.e., the quote condition does not hold)"
    ], 29 % 7)

with ExpectError():
    result = remove_html_markup_with_quote_assert('"foo"')

Traceback (most recent call last):
  File "/var/folders/n2/xd9445p97rb3xh7m1dfx8_4h0006ts/T/ipykernel_92822/904218512.py", line 2, in <module>
    result = remove_html_markup_with_quote_assert('"foo"')
             ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/var/folders/n2/xd9445p97rb3xh7m1dfx8_4h0006ts/T/ipykernel_92822/2877654332.py", line 12, in remove_html_markup_with_quote_assert
    assert False  # <=== Just added
           ^^^^^
AssertionError (expected)

elif c == '"' or c == "'" and tag:
    quote = not quote

remove_html_markup("'foo'")

"'foo'"

c == "" or c == '' and tag        # Choice 1
c == '"' or c == "'" and not tag  # Choice 2
(c == '"' or c == "'") and tag    # Choice 3
...                               # Something else

quiz("How should the condition read?",
     [
         '''`c == "" or c == '' and tag` (Choice 1)''',
         '''`c == '"' or c == "'" and not tag` (Choice 2)''',
         '''`(c == '"' or c == "'") and tag` (Choice 3)''',
         "Something else"
     ],
     '399 % 4')

(c == '"' or c == "'") and tag

def remove_html_markup(s):  # type: ignore
    """Return `s` without markup; quotes only count inside tags.

    `<` and `>` delimit markup unless `quote` is set. A single or double
    quote toggles `quote` only while `tag` is set; outside tags, quotes
    are kept like any other character.
    """
    tag = quote = False
    kept = []

    for c in s:
        if c == '<' and not quote:
            tag = True
        elif c == '>' and not quote:
            tag = False
        elif (c == '"' or c == "'") and tag:  # <-- FIX
            quote = not quote
        elif not tag:
            kept.append(c)

    return "".join(kept)

assert remove_html_markup("Here's some <strong>strong argument</strong>.") == \
    "Here's some strong argument."
assert remove_html_markup(
    '<input type="text" value="<your name>">') == ""
assert remove_html_markup('<b>foo</b>') == 'foo'
assert remove_html_markup('<b>"foo"</b>') == '"foo"'
assert remove_html_markup('"<b>foo</b>"') == '"foo"'
assert remove_html_markup('<b id="bar">foo</b>') == 'foo'

quiz("Which assertion would have caught the problem?",
     [
        "`assert quote and not tag`",
        "`assert quote or not tag`",
        "`assert tag or not quote`",
        "`assert tag and not quote`"
     ], '3270 - 3267')

assert tag or not quote

# ignore
display(state_machine)

def remove_html_markup(s):  # type: ignore
    """Return `s` without markup, checking the tag/quote invariant.

    Same scanner as the fixed version; in addition, each iteration
    starts by asserting that `quote` is only ever set while `tag` is set.
    """
    tag = quote = False
    kept = []

    for c in s:
        # Invariant: a quoted section can only exist inside a tag
        assert tag or not quote

        if c == '<' and not quote:
            tag = True
        elif c == '>' and not quote:
            tag = False
        elif (c == '"' or c == "'") and tag:
            quote = not quote
        elif not tag:
            kept.append(c)

    return "".join(kept)

# ignore
import hashlib

# ignore
bughash = hashlib.md5(b"debug").hexdigest()

quiz('Where has the name "bug" been used to denote disruptive events?',
     [
        'In the early days of Morse telegraphy, referring to a special key '
          'that would send a string of dots',
        'Among radio technicians to describe a device that '
          'converts electromagnetic field variations into acoustic signals',
        "In Shakespeare's " '"Henry VI", referring to a walking spectre',
        'In Middle English, where the word "bugge" is the basis for terms '
          'like "bugbear" and "bugaboo"'
     ], [bughash.index(i) for i in "d42f"])

assert(...)

Input	Expectation	Output	Outcome
`<b>foo</b>`	`foo`	`foo`	✔
`<b>"foo"</b>`	`"foo"`	`foo`	✘
`"<b>foo</b>"`	`"foo"`	`<b>foo</b>`	✘
`<b id="bar">foo</b>`	`foo`	`foo`	✔

Input	Expectation	Output	Outcome
`<b>foo</b>`	`foo`	`foo`	✔
`<b>"foo"</b>`	`"foo"`	`foo`	✘
`"<b>foo</b>"`	`"foo"`	`<b>foo</b>`	✘
`<b id="bar">foo</b>`	`foo`	`foo`	✔
`"foo"`	`"foo"`	`foo`	✘

Input	Expectation	Output	Outcome
`<b>foo</b>`	`foo`	`foo`	✔
`<b>"foo"</b>`	`"foo"`	`foo`	✘
`"<b>foo</b>"`	`"foo"`	`<b>foo</b>`	✘
`<b id="bar">foo</b>`	`foo`	`foo`	✔
`"foo"`	`"foo"`	`foo`	✘
`'foo'`	`'foo'`	`'foo'`	✔

Introduction to Debugging¶

A Simple Function¶

Your Task: Remove HTML Markup¶

Understanding Python Programs¶

Running a Function¶

Interacting with Notebooks¶

Testing a Function¶

Oops! A Bug!¶

Visualizing Code¶

A First Fix¶

The Devil's Guide to Debugging¶

Printf Debugging¶

Debugging into Existence¶

Use the Most Obvious Fix¶

Things to do Instead¶

From Defect to Failure¶

From Failure to Defect¶

The Scientific Method¶

Finding a Hypothesis¶

Quiz

Testing a Hypothesis¶

Refining a Hypothesis¶

Quiz

Refuting a Hypothesis¶

Quiz

Quiz

Fixing the Bug¶

Checking Diagnoses¶

Fixing the Code¶

Alternate Paths¶

Homework after the Fix¶

Check for further Defect Occurrences¶

Check your Tests¶

Add Assertions¶

Quiz

Commit the Fix¶

Close the Bug Report¶

Become a Better Debugger¶

Follow the Process¶

Keep a Log¶

Rubberducking¶

The Cost of Debugging¶

Debugging Aftermath¶

History of Debugging¶

Quiz

Synopsis¶

Lessons Learned¶

Next Steps¶

Background¶

Exercises¶

Exercise 1: Get Acquainted with Notebooks and Python¶

Beginner Level: Run Notebooks in Your Browser¶

Advanced Level: Run Python Code on Your Machine¶

Pro Level: Run Notebooks on Your Machine¶

Boss Level: Contribute!¶

Exercise 2: More Bugs!¶

Part 1: Find the Problem¶

Part 2: Identify Extent and Cause¶

Part 3: Fix the Problem¶