abundant-hamburger-66584
03/14/2023, 10:01 PM The Databricks Flyte tasks launch successfully, but hang indefinitely after the DB job finishes successfully. So far I have tried looking at flytepropeller, but I haven't found any logs relating to the execution ID in question. Any tips on ways to debug are much appreciated 🙏
thankful-minister-83577
thankful-minister-83577
glamorous-carpet-83516
03/14/2023, 10:05 PMabundant-hamburger-66584
03/14/2023, 10:11 PMglamorous-carpet-83516
03/14/2023, 10:16 PM
kubectl get flyteworkflow -n flytesnacks-development # list cr
kubectl get flyteworkflow atvx5kdcbgfzq862djj4 -n flytesnacks-development -o yaml
abundant-hamburger-66584
03/14/2023, 10:27 PMabundant-hamburger-66584
03/15/2023, 2:42 PM
kubectl get flyteworkflow ff3263f587ca646a2a33 -n flytesnacks-development -o yaml
abundant-hamburger-66584
03/15/2023, 2:44 PMabundant-hamburger-66584
03/15/2023, 2:46 PMabundant-hamburger-66584
03/15/2023, 5:36 PMglamorous-carpet-83516
03/15/2023, 9:10 PM
curl --netrc --request GET --header "Authorization: Bearer $DATABRICKS_TOKEN" \
'https://dbc-a53b7a3c-614c.cloud.databricks.com/api/2.0/jobs/runs/get?run_id=70446'
glamorous-carpet-83516
03/15/2023, 9:12 PMthankful-minister-83577
thankful-minister-83577
glamorous-carpet-83516
03/15/2023, 9:15 PMabundant-hamburger-66584
03/15/2023, 9:54 PMabundant-hamburger-66584
03/16/2023, 3:26 PM
curl --netrc --request GET --header "Authorization: Bearer $DATABRICKS_TOKEN" \
'https://wbd-dcp-cd-dev.cloud.databricks.com/api/2.0/jobs/runs/get?run_id=1077214'
life_cycle_state result_state
{
  "job_id": 1060228574312365,
  "run_id": 1077214,
  "creator_user_name": "evan.sadler@warnermedia.com",
  "number_in_job": 1077214,
  "state": {
    "life_cycle_state": "TERMINATED",
    "result_state": "SUCCESS",
    "state_message": "",
    "user_cancelled_or_timedout": false
  },
  "task": {
    "spark_python_task": {
      "python_file": "dbfs:///FileStore/tables/entrypoint.py",
      "parameters": [
        "pyflyte-fast-execute",
        "--additional-distribution",
        "s3://p13n-flyte-artifacts/flytesnacks/development/MV7ISU63ZHQQZ7ZYKJRF3VXRWI======/scriptmode.tar.gz",
        "--dest-dir",
        ".",
        "--",
        "pyflyte-execute",
        "--inputs",
        "s3://p13n-flyte-artifacts/metadata/propeller/flytesnacks-development-alvq9nr4z86dx92nshfk/n0/data/inputs.pb",
        "--output-prefix",
        "s3://p13n-flyte-artifacts/metadata/propeller/flytesnacks-development-alvq9nr4z86dx92nshfk/n0/data/0",
        "--raw-output-data-prefix",
        "s3://p13n-flyte-artifacts/c7/alvq9nr4z86dx92nshfk-n0-0",
        "--checkpoint-path",
        "s3://p13n-flyte-artifacts/c7/alvq9nr4z86dx92nshfk-n0-0/_flytecheckpoints",
        "--prev-checkpoint",
        "\"\"",
        "--resolver",
        "flytekit.core.python_auto_container.default_task_resolver",
        "--",
        "task-module",
        "wf_tests.simple_db",
        "task-name",
        "test_task"
      ]
    }
  },
  "cluster_spec": {
    "existing_cluster_id": "0315-172340-xc0uhob5"
  },
  "cluster_instance": {
    "cluster_id": "0315-172340-xc0uhob5",
    "spark_context_id": "4678757461727715067"
  },
  "start_time": 1678901558860,
  "setup_duration": 1000,
  "execution_duration": 22000,
  "cleanup_duration": 0,
  "end_time": 1678901582290,
  "run_name": "test_db",
  "run_page_url": "https://wbd-dcp-cd-dev.cloud.databricks.com/?o=6475167273468992#job/1060228574312365/run/1077214",
  "run_type": "SUBMIT_RUN",
  "attempt_number": 0,
  "format": "SINGLE_TASK"
}
flyte-propeller
{"json":{"routine":"databricks-worker-0"},"level":"error","msg":"worker panic'd and is shutting down. Error: interface conversion: interface {} is nil, not map[string]interface {}","ts":"2023-03-16T15:23:45Z"}
{"json":{"routine":"databricks-worker-0"},"level":"error","msg":"Failed to sync. Error: worker panic'd and is shutting down. Error: interface conversion: interface {} is nil, not map[string]interface {}","ts":"2023-03-16T15:23:45Z"}
{"json":{"routine":"databricks-worker-2"},"level":"error","msg":"worker panic'd and is shutting down. Error: interface conversion: interface {} is nil, not map[string]interface {}","ts":"2023-03-16T15:24:15Z"}
{"json":{"routine":"databricks-worker-2"},"level":"error","msg":"Failed to sync. Error: worker panic'd and is shutting down. Error: interface conversion: interface {} is nil, not map[string]interface {}","ts":"2023-03-16T15:24:15Z"}
glamorous-carpet-83516
03/16/2023, 6:01 PMglamorous-carpet-83516
03/16/2023, 6:02 PMglamorous-carpet-83516
03/16/2023, 6:03 PMglamorous-carpet-83516
03/16/2023, 6:21 PMabundant-hamburger-66584
03/16/2023, 6:25 PMcurl