Haytham Abuelfutuh
flyte-admin-task.execution.manager-task.executions.terminated.counter
Prafulla Mahindrakar
04/14/2022, 8:14 AM
flyte:admin:admin:execution_manager:acceptance_delay_count 0
flyte:admin:admin:execution_manager:acceptance_delay_sum 0
flyte:admin:admin:execution_manager:acceptance_delay{quantile="0.5"} NaN
flyte:admin:admin:execution_manager:acceptance_delay{quantile="0.9"} NaN
flyte:admin:admin:execution_manager:acceptance_delay{quantile="0.99"} NaN
flyte:admin:admin:execution_manager:active_executions 0
flyte:admin:admin:execution_manager:closure_size_bytes_count 0
flyte:admin:admin:execution_manager:closure_size_bytes_sum 0
flyte:admin:admin:execution_manager:closure_size_bytes{quantile="0.5"} NaN
flyte:admin:admin:execution_manager:closure_size_bytes{quantile="0.9"} NaN
flyte:admin:admin:execution_manager:closure_size_bytes{quantile="0.99"} NaN
flyte:admin:admin:execution_manager:execution_events_created 0
flyte:admin:admin:execution_manager:execution_termination_failure 0
flyte:admin:admin:execution_manager:executions_created 0
flyte:admin:admin:execution_manager:propeller_failures 0
flyte:admin:admin:execution_manager:publish_error 0
flyte:admin:admin:execution_manager:publish_event_error 0
flyte:admin:admin:execution_manager:spec_size_bytes_count 0
flyte:admin:admin:execution_manager:spec_size_bytes_sum 0
flyte:admin:admin:execution_manager:spec_size_bytes{quantile="0.5"} NaN
flyte:admin:admin:execution_manager:spec_size_bytes{quantile="0.9"} NaN
flyte:admin:admin:execution_manager:spec_size_bytes{quantile="0.99"} NaN
flyte:admin:admin:execution_manager:transformer_error 0
flyte:admin:admin:execution_manager:unexpected_data_error 0
Will send out the fix.
# TYPE flyte:admin:admin:execution_manager:executions_terminated counter
flyte:admin:admin:execution_manager:executions_terminated{app_name="",domain="development",exec_id="fe533aa1e880546b59db",node="",project="flytesnacks",runtime_type="",runtime_version="",task="",tasktype="",wf=""} 1
flyte:admin:admin:execution_manager:executions_terminated{app_name="",domain="development",exec_id="ffd9b80a79ca34186889",node="",project="flytesnacks",runtime_type="",runtime_version="",task="",tasktype="",wf=""} 1
Haytham Abuelfutuh
Prafulla Mahindrakar
04/14/2022, 11:38 AM
# HELP flyte:admin:admin:task_execution_manager:task_executions_terminated overall count of terminated workflow executions
# TYPE flyte:admin:admin:task_execution_manager:task_executions_terminated counter
flyte:admin:admin:task_execution_manager:task_executions_terminated{app_name="",domain="development",exec_id="fe533aa1e880546b59db",node="n0",project="flytesnacks",runtime_type="",runtime_version="",task="core.control_flow.map_task.mapper_a_mappable_task_0-0",tasktype="",wf=""} 1
flyte:admin:admin:task_execution_manager:task_executions_terminated{app_name="",domain="development",exec_id="fe533aa1e880546b59db",node="n1",project="flytesnacks",runtime_type="",runtime_version="",task="core.control_flow.map_task.coalesce-0",tasktype="",wf=""} 1
flyte:admin:admin:task_execution_manager:task_executions_terminated{app_name="",domain="development",exec_id="ffd9b80a79ca34186889",node="n0",project="flytesnacks",runtime_type="",runtime_version="",task="core.control_flow.map_task.mapper_a_mappable_task_0-0",tasktype="",wf=""} 1
flyte:admin:admin:task_execution_manager:task_executions_terminated{app_name="",domain="development",exec_id="ffd9b80a79ca34186889",node="n1",project="flytesnacks",runtime_type="",runtime_version="",task="core.control_flow.map_task.coalesce-0",tasktype="",wf=""} 1
Node execution metrics
flyte:admin:admin:node_execution_manager:node_executions_terminated{app_name="",domain="development",exec_id="fe533aa1e880546b59db",node="end-node",project="flytesnacks",runtime_type="",runtime_version="",task="",tasktype="",wf=""} 1
flyte:admin:admin:node_execution_manager:node_executions_terminated{app_name="",domain="development",exec_id="fe533aa1e880546b59db",node="n0",project="flytesnacks",runtime_type="",runtime_version="",task="",tasktype="",wf=""} 1
flyte:admin:admin:node_execution_manager:node_executions_terminated{app_name="",domain="development",exec_id="fe533aa1e880546b59db",node="n1",project="flytesnacks",runtime_type="",runtime_version="",task="",tasktype="",wf=""} 1
flyte:admin:admin:node_execution_manager:node_executions_terminated{app_name="",domain="development",exec_id="fe533aa1e880546b59db",node="start-node",project="flytesnacks",runtime_type="",runtime_version="",task="",tasktype="",wf=""} 1
flyte:admin:admin:node_execution_manager:node_executions_terminated{app_name="",domain="development",exec_id="ffd9b80a79ca34186889",node="end-node",project="flytesnacks",runtime_type="",runtime_version="",task="",tasktype="",wf=""} 1
flyte:admin:admin:node_execution_manager:node_executions_terminated{app_name="",domain="development",exec_id="ffd9b80a79ca34186889",node="n0",project="flytesnacks",runtime_type="",runtime_version="",task="",tasktype="",wf=""} 1
flyte:admin:admin:node_execution_manager:node_executions_terminated{app_name="",domain="development",exec_id="ffd9b80a79ca34186889",node="n1",project="flytesnacks",runtime_type="",runtime_version="",task="",tasktype="",wf=""} 1
flyte:admin:admin:node_execution_manager:node_executions_terminated{app_name="",domain="development",exec_id="ffd9b80a79ca34186889",node="start-node",project="flytesnacks",runtime_type="",runtime_version="",task="",tasktype="",wf=""}
I will check why the phase is not being emitted.
Haytham Abuelfutuh
Prafulla Mahindrakar
04/14/2022, 11:48 AM
flyte:admin:admin:node_execution_manager:node_executions_terminated{app_name="",domain="development",exec_id="f2282f588a3b940cd99d",node="end-node",phase="SUCCEEDED",project="flytesnacks",runtime_type="",runtime_version="",task="",tasktype="",wf=""} 1
flyte:admin:admin:node_execution_manager:node_executions_terminated{app_name="",domain="development",exec_id="f2282f588a3b940cd99d",node="n0",phase="SUCCEEDED",project="flytesnacks",runtime_type="",runtime_version="",task="",tasktype="",wf=""} 1
flyte:admin:admin:node_execution_manager:node_executions_terminated{app_name="",domain="development",exec_id="f2282f588a3b940cd99d",node="n1",phase="SUCCEEDED",project="flytesnacks",runtime_type="",runtime_version="",task="",tasktype="",wf=""} 1
flyte:admin:admin:node_execution_manager:node_executions_terminated{app_name="",domain="development",exec_id="f2282f588a3b940cd99d",node="start-node",phase="SUCCEEDED",project="flytesnacks",runtime_type="",runtime_version="",task="",tasktype="",wf=""} 1
Task executions
flyte:admin:admin:task_execution_manager:task_executions_terminated{app_name="",domain="development",exec_id="f2282f588a3b940cd99d",node="n0",phase="SUCCEEDED",project="flytesnacks",runtime_type="",runtime_version="",task="core.control_flow.map_task.mapper_a_mappable_task_0-0",tasktype="",wf=""} 1
flyte:admin:admin:task_execution_manager:task_executions_terminated{app_name="",domain="development",exec_id="f2282f588a3b940cd99d",node="n1",phase="SUCCEEDED",project="flytesnacks",runtime_type="",runtime_version="",task="core.control_flow.map_task.coalesce-0",tasktype="",wf=""} 1
Executions
flyte:admin:admin:execution_manager:executions_terminated{app_name="",domain="development",exec_id="f2282f588a3b940cd99d",node="",phase="SUCCEEDED",project="flytesnacks",runtime_type="",runtime_version="",task="",tasktype="",wf=""} 1
Alex Pozimenko
04/14/2022, 8:00 PM
flyte-admin-task.execution.manager-task.executions.terminated.counter
at allHaytham Abuelfutuh
Prafulla Mahindrakar
04/15/2022, 12:31 PM
flyte:admin:admin:execution_manager:executions_terminated{app_name="",domain="development",exec_id="f2282f588a3b940cd99d",node="",phase="SUCCEEDED",project="flytesnacks",runtime_type="",runtime_version="",task="",tasktype="",wf=""} 1
Ketan (kumare3)
Alex Pozimenko
04/15/2022, 5:17 PM
Where do you see that error? Does the execution start and then the task fail with it? When it fails, can you check the pod that was created to see which service account was set on it? How do you launch the workflow? Is it through flytectl, passing a k8s service account?
1. I launch from the console. 2. The task starts; the error comes from the container when it tries to access other AWS resources. 3. I'll check the service account (need to upgrade my environment again 🙂) (@Haytham Abuelfutuh @Prafulla Mahindrakar)
Are you setting the auth role?
I'm not sure what you mean by that. I only changed the version of the admin; there were no other changes to our deployment. We use OIDC auth and a K8s service account, if that helps.
katrina
Alex Pozimenko
04/15/2022, 6:29 PMkatrina
Alex Pozimenko
04/15/2022, 6:30 PMkatrina
Alex Pozimenko
04/15/2022, 6:38 PMkatrina
Is there a matrix that maps release versions to containers?
We should publish an image per release: https://github.com/flyteorg/flyteadmin/pkgs/container/flyteadmin/19159524?tag=v0.6.147
Alex Pozimenko
04/15/2022, 6:40 PMkatrina
Alex Pozimenko
04/15/2022, 6:45 PMPrafulla Mahindrakar
04/15/2022, 6:49 PMkatrina
Alex Pozimenko
04/15/2022, 6:50 PM
flyte-admin-task.execution.manager-task.executions.terminated
to
flyte-admin-admin-execution.manager-executions.terminated
Prafulla Mahindrakar
04/15/2022, 6:56 PMAlex Pozimenko
04/15/2022, 6:58 PMPrafulla Mahindrakar
04/15/2022, 7:00 PM
Node execution phases
const (
NodeExecution_UNDEFINED NodeExecution_Phase = 0
NodeExecution_QUEUED NodeExecution_Phase = 1
NodeExecution_RUNNING NodeExecution_Phase = 2
NodeExecution_SUCCEEDED NodeExecution_Phase = 3
NodeExecution_FAILING NodeExecution_Phase = 4
NodeExecution_FAILED NodeExecution_Phase = 5
NodeExecution_ABORTED NodeExecution_Phase = 6
NodeExecution_SKIPPED NodeExecution_Phase = 7
NodeExecution_TIMED_OUT NodeExecution_Phase = 8
NodeExecution_DYNAMIC_RUNNING NodeExecution_Phase = 9
NodeExecution_RECOVERED NodeExecution_Phase = 10
)
Task execution phases
const (
TaskExecution_UNDEFINED TaskExecution_Phase = 0
TaskExecution_QUEUED TaskExecution_Phase = 1
TaskExecution_RUNNING TaskExecution_Phase = 2
TaskExecution_SUCCEEDED TaskExecution_Phase = 3
TaskExecution_ABORTED TaskExecution_Phase = 4
TaskExecution_FAILED TaskExecution_Phase = 5
// To indicate cases where task is initializing, like: ErrImagePull, ContainerCreating, PodInitializing
TaskExecution_INITIALIZING TaskExecution_Phase = 6
// To address cases, where underlying resource is not available: Backoff error, Resource quota exceeded
TaskExecution_WAITING_FOR_RESOURCES TaskExecution_Phase = 7
)
Workflow execution phases
const (
WorkflowExecution_UNDEFINED WorkflowExecution_Phase = 0
WorkflowExecution_QUEUED WorkflowExecution_Phase = 1
WorkflowExecution_RUNNING WorkflowExecution_Phase = 2
WorkflowExecution_SUCCEEDING WorkflowExecution_Phase = 3
WorkflowExecution_SUCCEEDED WorkflowExecution_Phase = 4
WorkflowExecution_FAILING WorkflowExecution_Phase = 5
WorkflowExecution_FAILED WorkflowExecution_Phase = 6
WorkflowExecution_ABORTED WorkflowExecution_Phase = 7
WorkflowExecution_TIMED_OUT WorkflowExecution_Phase = 8
WorkflowExecution_ABORTING WorkflowExecution_Phase = 9
)
Terminal Phases for all
var terminalExecutionPhases = map[core.WorkflowExecution_Phase]bool{
core.WorkflowExecution_SUCCEEDED: true,
core.WorkflowExecution_FAILED: true,
core.WorkflowExecution_TIMED_OUT: true,
core.WorkflowExecution_ABORTED: true,
}
var terminalNodeExecutionPhases = map[core.NodeExecution_Phase]bool{
core.NodeExecution_SUCCEEDED: true,
core.NodeExecution_FAILED: true,
core.NodeExecution_TIMED_OUT: true,
core.NodeExecution_ABORTED: true,
core.NodeExecution_SKIPPED: true,
core.NodeExecution_RECOVERED: true,
}
var terminalTaskExecutionPhases = map[core.TaskExecution_Phase]bool{
core.TaskExecution_SUCCEEDED: true,
core.TaskExecution_FAILED: true,
core.TaskExecution_ABORTED: true,
}
Alex Pozimenko
04/15/2022, 7:29 PMkatrina
Alex Pozimenko
04/15/2022, 9:17 PMkatrina
Alex Pozimenko
04/15/2022, 9:55 PMkatrina
Alex Pozimenko
04/15/2022, 10:03 PM