Skip to content

Commit 9e8da3b

Browse files
authored
[supervisor] set pod failure reason when supervisor is reaped (#20318)
* [supervisor] set pod failed reason when supervisor been reap * Debug commit * upgrade pkg * Revert "Debug commit" This reverts commit 1b6bde8.
1 parent a836f97 commit 9e8da3b

File tree

3 files changed

+44
-12
lines changed

3 files changed

+44
-12
lines changed

components/supervisor/cmd/init.go

Lines changed: 39 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -22,8 +22,8 @@ import (
2222
"github.com/gitpod-io/gitpod/common-go/process"
2323
"github.com/gitpod-io/gitpod/supervisor/pkg/shared"
2424
"github.com/gitpod-io/gitpod/supervisor/pkg/supervisor"
25+
reaper "github.com/gitpod-io/go-reaper"
2526
"github.com/prometheus/procfs"
26-
reaper "github.com/ramr/go-reaper"
2727
"github.com/spf13/cobra"
2828
)
2929

@@ -77,25 +77,55 @@ var initCmd = &cobra.Command{
7777
}
7878

7979
supervisorDone := make(chan struct{})
80+
handledByReaper := make(chan int)
81+
handleSupervisorExit := func(exitCode int) {
82+
if exitCode == 0 {
83+
return
84+
}
85+
logs := extractFailureFromRun()
86+
if shared.IsExpectedShutdown(exitCode) {
87+
log.Fatal(logs)
88+
} else {
89+
log.WithError(fmt.Errorf(logs)).Fatal("supervisor run error with unexpected exit code")
90+
}
91+
}
8092
go func() {
8193
defer close(supervisorDone)
8294

8395
err := runCommand.Wait()
84-
if err != nil && !(strings.Contains(err.Error(), "signal: ") || strings.Contains(err.Error(), "no child processes")) {
96+
if err == nil {
97+
return
98+
}
99+
// exited by reaper
100+
if strings.Contains(err.Error(), "no child processes") {
101+
ctx, cancel := context.WithTimeout(context.Background(), time.Second*5)
102+
defer cancel()
103+
select {
104+
case <-ctx.Done(): // timeout
105+
case exitCode := <-handledByReaper:
106+
handleSupervisorExit(exitCode)
107+
}
108+
} else if !(strings.Contains(err.Error(), "signal: ")) {
85109
if eerr, ok := err.(*exec.ExitError); ok && eerr.ExitCode() != 0 {
86-
logs := extractFailureFromRun()
87-
if shared.IsExpectedShutdown(eerr.ExitCode()) {
88-
log.Fatal(logs)
89-
} else {
90-
log.WithError(fmt.Errorf(logs)).Fatal("supervisor run error with unexpected exit code")
91-
}
110+
handleSupervisorExit(eerr.ExitCode())
92111
}
93112
log.WithError(err).Error("supervisor run error")
94113
return
95114
}
96115
}()
97116
// start the reaper to clean up zombie processes
98-
reaper.Reap()
117+
reaper.Start(reaper.Config{
118+
Pid: -1,
119+
Options: 0,
120+
DisablePid1Check: false,
121+
OnReap: func(pid int, wstatus syscall.WaitStatus) {
122+
if pid != runCommand.Process.Pid {
123+
return
124+
}
125+
exitCode := wstatus.ExitStatus()
126+
handledByReaper <- exitCode
127+
},
128+
})
99129

100130
select {
101131
case <-supervisorDone:

components/supervisor/go.mod

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -16,6 +16,7 @@ require (
1616
github.com/gitpod-io/gitpod/ide-metrics-api v0.0.0-00010101000000-000000000000
1717
github.com/gitpod-io/gitpod/supervisor/api v0.0.0-00010101000000-000000000000
1818
github.com/gitpod-io/gitpod/ws-daemon/api v0.0.0-00010101000000-000000000000
19+
github.com/gitpod-io/go-reaper v0.0.0-20241024192051-78d04cc2e25f
1920
github.com/golang/mock v1.6.0
2021
github.com/google/go-cmp v0.6.0
2122
github.com/google/uuid v1.6.0
@@ -29,7 +30,6 @@ require (
2930
github.com/prometheus/common v0.42.0
3031
github.com/prometheus/procfs v0.10.1
3132
github.com/prometheus/pushgateway v1.5.1
32-
github.com/ramr/go-reaper v0.2.1
3333
github.com/sirupsen/logrus v1.9.3
3434
github.com/soheilhy/cmux v0.1.5
3535
github.com/spf13/cobra v1.4.0

components/supervisor/go.sum

Lines changed: 4 additions & 2 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

0 commit comments

Comments
 (0)