diff --git a/monarch_hyperactor/src/v1/actor_mesh.rs b/monarch_hyperactor/src/v1/actor_mesh.rs index 01fa7484b..fd773f11e 100644 --- a/monarch_hyperactor/src/v1/actor_mesh.rs +++ b/monarch_hyperactor/src/v1/actor_mesh.rs @@ -266,6 +266,11 @@ impl PythonActorMeshImpl { .extract::() .unwrap(); tracing::error!( + name = "ActorMeshStatus", + status = "SupervisionError::UnhandledFaultHook", + actor_name = failure.mesh_name, + event = %failure.event, + rank = failure.rank, "unhandled event reached unhandled_fault_hook: {}, which is exiting the process with code {}", failure, code @@ -275,6 +280,11 @@ impl PythonActorMeshImpl { // The callback raised some other exception, and there's // no way to handle it. Just exit the process anyways tracing::error!( + name = "ActorMeshStatus", + status = "SupervisionError::UnhandledFaultHook", + actor_name = failure.mesh_name, + event = %failure.event, + rank = failure.rank, "unhandled event reached unhandled_fault_hook: {}, which raised an exception: {:?}. \ Exiting the process with code 1", failure, @@ -284,6 +294,11 @@ impl PythonActorMeshImpl { } } else { tracing::warn!( + name = "ActorMeshStatus", + status = "SupervisionError::UnhandledFaultHook", + actor_name = failure.mesh_name, + event = %failure.event, + rank = failure.rank, "unhandled event reached unhandled_fault_hook: {}, but that function produced no exception or crash. Ignoring the error", failure );