Skip to content

Commit

Permalink
Log error in read inputs/outputs (#282)
Browse files Browse the repository at this point in the history
## Overview
* Log the error and the execution ID when reading inputs/outputs fails

## Test Plan
* NA

## Rollout Plan (if applicable)
*TODO: Describe any deployment or compatibility considerations for rolling out this change.*

## Upstream Changes
Should this change be upstreamed to OSS (flyteorg/flyte)? If so, please check this box for auditing. Note, this is the responsibility of each developer. See [this guide](https://unionai.atlassian.net/wiki/spaces/ENG/pages/447610883/Flyte+-+Union+Cloud+Development+Runbook/#When-are-versions-updated%3F).
- [ ] To be upstreamed

## Issue
fixes CLD-917
*TODO: Link Linear issue(s) using [magic words](https://linear.app/docs/github#magic-words). `fixes` will move to merged status, while `ref` will only link the PR.*

## Checklist
* [ ] Added tests
* [ ] Ran a deploy dry run and shared the terraform plan
* [ ] Added logging and metrics
* [ ] Updated [dashboards](https://unionai.grafana.net/dashboards) and [alerts](https://unionai.grafana.net/alerting/list)
* [ ] Updated documentation
  • Loading branch information
iaroslav-ciupin authored May 17, 2024
1 parent c5331a7 commit 975fe4d
Show file tree
Hide file tree
Showing 4 changed files with 31 additions and 7 deletions.
12 changes: 10 additions & 2 deletions flyteadmin/pkg/manager/impl/execution_manager.go
Original file line number Diff line number Diff line change
Expand Up @@ -1770,7 +1770,11 @@ func (m *ExecutionManager) GetExecutionData(
id.Project,
id.Domain,
executionModel.InputsURI.String(),
objectStore)
objectStore,
)
if err != nil {
logger.Errorf(ctx, "failed to read inputs during execution [%v]: %v", id, err)
}
return err
})

Expand All @@ -1786,7 +1790,11 @@ func (m *ExecutionManager) GetExecutionData(
cluster,
id.Project,
id.Domain,
objectStore)
objectStore,
)
if err != nil {
logger.Errorf(ctx, "failed to read outputs during execution [%v]: %v", id, err)
}
return err
})

Expand Down
12 changes: 10 additions & 2 deletions flyteadmin/pkg/manager/impl/node_execution_manager.go
Original file line number Diff line number Diff line change
Expand Up @@ -575,7 +575,11 @@ func (m *NodeExecutionManager) GetNodeExecutionData(
id.Project,
id.Domain,
nodeExecution.InputUri,
objectStore)
objectStore,
)
if err != nil {
logger.Errorf(ctx, "failed to read inputs during execution [%v]: %v", id, err)
}
return err
})

Expand All @@ -591,7 +595,11 @@ func (m *NodeExecutionManager) GetNodeExecutionData(
cluster,
id.Project,
id.Domain,
objectStore)
objectStore,
)
if err != nil {
logger.Errorf(ctx, "failed to read outputs during execution [%v]: %v", id, err)
}
return err
})

Expand Down
13 changes: 11 additions & 2 deletions flyteadmin/pkg/manager/impl/task_execution_manager.go
Original file line number Diff line number Diff line change
Expand Up @@ -303,6 +303,7 @@ func (m *TaskExecutionManager) GetTaskExecutionData(ctx context.Context,
if err := validation.ValidateTaskExecutionIdentifier(request.Id); err != nil {
logger.Debugf(ctx, "Invalid identifier [%+v]: %v", request.Id, err)
}

ctx = getTaskExecutionContext(ctx, request.Id)
group, groupCtx := errgroup.WithContext(ctx)
var taskExecution *admin.TaskExecution
Expand Down Expand Up @@ -351,7 +352,11 @@ func (m *TaskExecutionManager) GetTaskExecutionData(ctx context.Context,
id.Project,
id.Domain,
taskExecution.InputUri,
objectStore)
objectStore,
)
if err != nil {
logger.Errorf(ctx, "failed to read inputs during execution [%v]: %v", id, err)
}
return err
})

Expand All @@ -367,7 +372,11 @@ func (m *TaskExecutionManager) GetTaskExecutionData(ctx context.Context,
cluster,
id.Project,
id.Domain,
objectStore)
objectStore,
)
if err != nil {
logger.Errorf(ctx, "failed to read outputs during execution [%v]: %v", id, err)
}
return err
})

Expand Down
1 change: 0 additions & 1 deletion flyteadmin/pkg/manager/impl/util/data.go
Original file line number Diff line number Diff line change
Expand Up @@ -150,7 +150,6 @@ func GetOutputs(ctx context.Context,
err = readFromDataPlane(ctx, objectStore, cluster, project, domain, closure.GetOutputUri(), fullOutputs)
}
}

return fullOutputs, &outputsURLBlob, err
}

Expand Down

0 comments on commit 975fe4d

Please sign in to comment.