Skip to content

Commit

Permalink
WIP: creating file to help debug an error
Browse files Browse the repository at this point in the history
Proof of concept.

TODOs:
 - python dependency logging
 - creating a notebook version of this
 - tests
 - possible extension: serialize the inputs more effectively
  • Loading branch information
skrawcz committed Mar 16, 2024
1 parent 65be67c commit 8362e90
Show file tree
Hide file tree
Showing 4 changed files with 127 additions and 1 deletion.
11 changes: 11 additions & 0 deletions examples/notebook_debug/example_error.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,11 @@
def input_function() -> int:
    """Return the constant ``2``.

    Takes no arguments; its result is consumed by the other functions in this
    example module through their ``input_function`` parameter.
    """
    return 2


def output_function(input_function: int) -> int:
    """Return ``input_function`` incremented by one.

    :param input_function: the integer to increment.
    :return: ``input_function + 1``.
    """
    return input_function + 1


def error_function(input_function: int, output_function: int, input: int) -> int:
    """Deliberately fail so the error-debugging tooling has something to capture.

    :param input_function: first integer operand.
    :param output_function: second integer operand.
    :param input: third integer operand (name shadows the builtin; kept because
        callers pass it by keyword).
    :return: never returns as written.
    :raises ValueError: always, with the message ``"This is an error"``.
    """
    raise ValueError("This is an error")
    # Intentionally unreachable: this is the computation the function performs
    # once the ``raise`` above is removed while debugging.
    return input_function + output_function + input
94 changes: 94 additions & 0 deletions examples/notebook_debug/notebook_debugger_plugin.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,94 @@
from typing import Any, Callable, Dict, Optional

from hamilton import lifecycle

try:
import cloudpickle as pickle
except ImportError:
import pickle

import inspect

# Source text of the standalone debug script written when a node fails.
# Filled in with ``str.format``; the placeholders are:
#   {module_name}       - module imported so that its imports are available
#   {node_name}         - prefix of the ``<node_name>_inputs.pkl`` file to load
#   {function_to_debug} - source code of the function that errored
#   {func_name}         - name of that function, called with the loaded inputs
# The bodies of ``try``/``except``/``with`` must stay indented, otherwise the
# generated script is not valid Python.
template = """
try:
    import cloudpickle as pickle
except ImportError:
    import pickle
import {module_name} # we load this for imports
# let's load the inputs
with open('{node_name}_inputs.pkl', 'rb') as f:
    inputs = pickle.load(f)
# the function that errored
{function_to_debug}
# run the function
{func_name}(**inputs)
"""


class NotebookErrorDebugger(lifecycle.NodeExecutionHook):
    """Node execution hook that saves what is needed to reproduce a failed node.

    When a node fails, the hook pickles the node's inputs and writes a small
    script (built from the module-level ``template``) that reloads those inputs
    and calls the failing function again.
    """

    def run_before_node_execution(
        self,
        *,
        node_name: str,
        node_tags: Dict[str, Any],
        node_kwargs: Dict[str, Any],
        node_return_type: type,
        task_id: Optional[str],
        run_id: str,
        node_input_types: Dict[str, Any],
        **future_kwargs: Any,
    ):
        """Do nothing; this hook only acts after a node has executed."""
        pass

    def run_after_node_execution(
        self,
        *,
        node_name: str,
        node_tags: Dict[str, Any],
        node_kwargs: Dict[str, Any],
        node_return_type: type,
        result: Any,
        error: Optional[Exception],
        success: bool,
        task_id: Optional[str],
        run_id: str,
        originating_function: Callable,
        **future_kwargs: Any,
    ):
        """Write debugging artifacts to the current directory if the node failed.

        On failure this will:

        1. Pickle the inputs of the node to ``<node_name>_inputs.pkl``.
        2. Create ``<node_name>_debug.py`` which:
            a. imports the module the function is from -- to cover any imports
               that need to exist;
            b. loads the pickled inputs;
            c. contains the code of the function that errored so you can debug it;
            d. calls that function with the loaded inputs.
        3. Print out where this data has been saved for the user to then debug.

        Listing the python version, hamilton version, and other relevant package
        versions is not implemented yet (see the TODO at the end).

        :param node_name: name of the node; used as the prefix of both files.
        :param node_tags: tags of the node; the ``"module"`` tag, when present,
            names the module the debug script imports.
        :param node_kwargs: keyword arguments the node was called with; these
            are what gets pickled.
        :param success: whether the node executed successfully; nothing is
            written when this is true.
        :param originating_function: function whose source is copied into the
            debug script.
        """
        if success:
            return

        # Local import: only needed on the failure path.
        import textwrap

        # pickle the inputs
        with open(f"{node_name}_inputs.pkl", "wb") as f:
            pickle.dump(node_kwargs, f)

        # A missing "module" tag would otherwise render as ``import None``;
        # fall back to the module recorded on the function itself.
        module_name = node_tags.get("module") or getattr(
            originating_function, "__module__", None
        )
        # Dedent so a function defined in an indented scope still lands at
        # column 0 in the generated script.
        function_source = textwrap.dedent(inspect.getsource(originating_function))

        # create a file with the function and the inputs
        with open(f"{node_name}_debug.py", "w", encoding="utf-8") as f:
            f.write(
                template.format(
                    module_name=module_name,
                    node_name=node_name,
                    function_to_debug=function_source,
                    func_name=originating_function.__name__,
                )
            )

        # print out where the data has been saved
        print(f"Inputs to {node_name} have been saved to {node_name}_inputs.pkl")
        print(f"The function that errored has been saved to {node_name}_debug.py")
        print(f"Please run the function in {node_name}_debug.py to debug the error.")
        # TODO: create file with python requirements for pickle to work...
8 changes: 8 additions & 0 deletions examples/notebook_debug/run.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,8 @@
if __name__ == "__main__":
    # Imports live under the guard, so importing this file has no side effects.
    import example_error
    from notebook_debugger_plugin import NotebookErrorDebugger

    from hamilton import driver

    # Build a driver over the example module with the debugging hook attached.
    dr = driver.Builder().with_modules(example_error).with_adapters(NotebookErrorDebugger()).build()
    # ``error_function`` always raises, so this request exercises the failure
    # path that the hook reacts to.
    dr.execute(["error_function"], inputs={"input": 4})
15 changes: 14 additions & 1 deletion hamilton/lifecycle/api.py
Original file line number Diff line number Diff line change
@@ -1,7 +1,18 @@
import abc
from abc import ABC
from types import ModuleType
from typing import TYPE_CHECKING, Any, Collection, Dict, List, Optional, Tuple, Type, final
from typing import (
TYPE_CHECKING,
Any,
Callable,
Collection,
Dict,
List,
Optional,
Tuple,
Type,
final,
)

from hamilton import graph_types, node

Expand Down Expand Up @@ -224,6 +235,7 @@ def run_after_node_execution(
success: bool,
task_id: Optional[str],
run_id: str,
originating_function: Callable,
**future_kwargs: Any,
):
"""Hook that is executed post node execution.
Expand Down Expand Up @@ -265,6 +277,7 @@ def post_node_execute(
task_id=task_id,
success=success,
run_id=run_id,
originating_function=node_.originating_functions[0],
)


Expand Down

0 comments on commit 8362e90

Please sign in to comment.