From 08aa1e99a110f7b3b7edc1907debf0b0e1134d99 Mon Sep 17 00:00:00 2001 From: Gianluca Zuccarelli Date: Mon, 9 Jan 2023 16:18:02 +0000 Subject: [PATCH] worker/server: log unresponsive job removal Re-add the logging for when unresponsive heartbeats are being removed so we can verify that they are correctly being logged as 5xx errors. --- internal/worker/server.go | 3 +++ 1 file changed, 3 insertions(+) diff --git a/internal/worker/server.go b/internal/worker/server.go index 3c9dbefae..d9d93cd5c 100644 --- a/internal/worker/server.go +++ b/internal/worker/server.go @@ -114,6 +114,9 @@ func (s *Server) WatchHeartbeats() { //nolint:staticcheck // avoid SA1015, this is an endless function for range time.Tick(time.Second * 30) { for _, token := range s.jobs.Heartbeats(time.Second * 120) { + id, _ := s.jobs.IdFromToken(token) + logrus.Infof("Removing unresponsive job: %s\n", id) + missingHeartbeatResult := JobResult{ JobError: clienterrors.WorkerClientError(clienterrors.ErrorJobMissingHeartbeat, fmt.Sprintf("Workers running this job stopped responding more than %d times.", maxHeartbeatRetries),