From 306a0394723d3d6dcbaacbc922b5d23433ffca4f Mon Sep 17 00:00:00 2001
From: Emma Anholt
Date: Mon, 20 Sep 2021 10:07:40 -0700
Subject: [PATCH] ci/baremetal: Retry if our network device spontaneously
 fails.

Seen in https://gitlab.freedesktop.org/mesa/mesa/-/jobs/13824132. It's
unlikely that graphics would kill the network, so just assume it's not our
fault and keep going.

Part-of:
---
 .gitlab-ci/bare-metal/cros_servo_run.py | 6 ++++++
 .gitlab-ci/bare-metal/fastboot_run.py   | 6 ++++++
 2 files changed, 12 insertions(+)

diff --git a/.gitlab-ci/bare-metal/cros_servo_run.py b/.gitlab-ci/bare-metal/cros_servo_run.py
index 8b3b807abb3..ecb6c460fcb 100755
--- a/.gitlab-ci/bare-metal/cros_servo_run.py
+++ b/.gitlab-ci/bare-metal/cros_servo_run.py
@@ -126,6 +126,12 @@ class CrosServoRun:
                 self.print_error("Detected cheza power management bus error, restarting run...")
                 return 2
 
+            # If the network device dies, it's probably not graphics's fault, just try again.
+            if re.search("NETDEV WATCHDOG", line):
+                self.print_error(
+                    "Detected network device failure, restarting run...")
+                return 2
+
             # These HFI response errors started appearing with the introduction
             # of piglit runs. CosmicPenguin says:
             #
diff --git a/.gitlab-ci/bare-metal/fastboot_run.py b/.gitlab-ci/bare-metal/fastboot_run.py
index 8b9ce1d591e..3654c7c8088 100755
--- a/.gitlab-ci/bare-metal/fastboot_run.py
+++ b/.gitlab-ci/bare-metal/fastboot_run.py
@@ -83,6 +83,12 @@ class FastbootRun:
                     "Detected kernel soft lockup, restarting run...")
                 return 2
 
+            # If the network device dies, it's probably not graphics's fault, just try again.
+            if re.search("NETDEV WATCHDOG", line):
+                self.print_error(
+                    "Detected network device failure, restarting run...")
+                return 2
+
             result = re.search("hwci: mesa: (\S*)", line)
             if result:
                 if result.group(1) == "pass":