with '#' will be ignored, and an empty message aborts the commit. Author: Ethan Alicea <64653625+Tech-Gamer@users.noreply.github.com> On branch develop Your branch is up to date with 'origin/develop'. Changes to be committed: modified: .github/workflows/push.yaml modified: .github/workflows/release.yaml modified: CHANGELOG.md modified: Dockerfile modified: Makefile modified: README.md modified: cmd/configure.go modified: cmd/diagnostics.go modified: cmd/root.go modified: config/config.go modified: environment/allocations.go modified: environment/docker.go modified: environment/docker/api.go modified: environment/docker/container.go modified: environment/docker/environment.go modified: environment/docker/power.go modified: environment/docker/stats.go modified: environment/environment.go modified: environment/settings.go modified: events/events.go modified: go.mod modified: internal/cron/activity_cron.go modified: internal/cron/cron.go modified: internal/cron/sftp_cron.go modified: internal/database/database.go modified: internal/progress/progress.go modified: internal/progress/progress_test.go modified: loggers/cli/cli.go new file: oryxBuildBinary modified: parser/parser.go modified: remote/http.go modified: remote/servers.go modified: remote/types.go modified: router/downloader/downloader.go modified: router/middleware.go modified: router/middleware/middleware.go modified: router/middleware/request_error.go modified: router/router.go modified: router/router_download.go modified: router/router_server.go modified: router/router_server_backup.go modified: router/router_server_files.go modified: router/router_server_transfer.go modified: router/router_server_ws.go modified: router/router_system.go modified: router/router_transfer.go modified: router/tokens/parser.go modified: router/websocket/listeners.go modified: router/websocket/websocket.go modified: server/activity.go modified: server/backup.go modified: server/backup/backup.go modified: 
server/backup/backup_local.go modified: server/backup/backup_s3.go modified: server/configuration.go modified: server/console.go modified: server/crash.go modified: server/events.go modified: server/filesystem/archive.go modified: server/filesystem/filesystem.go modified: server/filesystem/filesystem_test.go modified: server/install.go modified: server/installer/installer.go modified: server/listeners.go modified: server/manager.go modified: server/mounts.go modified: server/power.go modified: server/power_test.go modified: server/resources.go modified: server/server.go modified: server/transfer/archive.go modified: server/transfer/source.go modified: server/transfer/transfer.go modified: server/update.go modified: sftp/event.go modified: sftp/handler.go modified: sftp/server.go modified: wings.go
93 lines
3.5 KiB
Go
93 lines
3.5 KiB
Go
package server
|
|
|
|
import (
|
|
"fmt"
|
|
"strconv"
|
|
"sync"
|
|
"time"
|
|
|
|
"emperror.dev/errors"
|
|
|
|
"github.com/Tech-Gamer/nwy-wings/config"
|
|
"github.com/Tech-Gamer/nwy-wings/environment"
|
|
)
|
|
|
|
// CrashHandler records when a server process last crashed. The zero value is
// usable as-is and reports a zero time until a crash has been recorded.
type CrashHandler struct {
	// mu serializes reads and writes of lastCrash.
	mu sync.RWMutex

	// lastCrash holds the time of the most recent server crash event.
	lastCrash time.Time
}
|
|
|
|
// Returns the time of the last crash for this server instance.
|
|
func (cd *CrashHandler) LastCrashTime() time.Time {
|
|
cd.mu.RLock()
|
|
defer cd.mu.RUnlock()
|
|
|
|
return cd.lastCrash
|
|
}
|
|
|
|
// Sets the last crash time for a server.
|
|
func (cd *CrashHandler) SetLastCrash(t time.Time) {
|
|
cd.mu.Lock()
|
|
cd.lastCrash = t
|
|
cd.mu.Unlock()
|
|
}
|
|
|
|
// Looks at the environment exit state to determine if the process exited cleanly or
|
|
// if it was the result of an event that we should try to recover from.
|
|
//
|
|
// This function assumes it is called under circumstances where a crash is suspected
|
|
// of occurring. It will not do anything to determine if it was actually a crash, just
|
|
// look at the exit state and check if it meets the criteria of being called a crash
|
|
// by Wings.
|
|
//
|
|
// If the server is determined to have crashed, the process will be restarted and the
|
|
// counter for the server will be incremented.
|
|
func (s *Server) handleServerCrash() error {
|
|
// No point in doing anything here if the server isn't currently offline, there
|
|
// is no reason to do a crash detection event. If the server crash detection is
|
|
// disabled we want to skip anything after this as well.
|
|
if s.Environment.State() != environment.ProcessOfflineState || !s.Config().CrashDetectionEnabled {
|
|
if !s.Config().CrashDetectionEnabled {
|
|
s.Log().Debug("server triggered crash detection but handler is disabled for server process")
|
|
s.PublishConsoleOutputFromDaemon("Aborting automatic restart, crash detection is disabled for this instance.")
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
exitCode, oomKilled, err := s.Environment.ExitState()
|
|
if err != nil {
|
|
return errors.Wrap(err, "failed to get exit state for server process")
|
|
}
|
|
|
|
// If the system is not configured to detect a clean exit code as a crash, and the
|
|
// crash is not the result of the program running out of memory, do nothing.
|
|
if exitCode == 0 && !oomKilled && !config.Get().System.CrashDetection.DetectCleanExitAsCrash {
|
|
s.Log().Debug("server exited with successful exit code; system is configured to not detect this as a crash")
|
|
return nil
|
|
}
|
|
|
|
s.PublishConsoleOutputFromDaemon("---------- Detected server process in a crashed state! ----------")
|
|
s.PublishConsoleOutputFromDaemon("---------- If you need help, please contact Nightway Hosting support. ----------")
|
|
s.PublishConsoleOutputFromDaemon(fmt.Sprintf("Exit code: %d", exitCode))
|
|
s.PublishConsoleOutputFromDaemon(fmt.Sprintf("Out of memory: %t", oomKilled))
|
|
|
|
c := s.crasher.LastCrashTime()
|
|
timeout := config.Get().System.CrashDetection.Timeout
|
|
|
|
// If the last crash time was within the last `timeout` seconds we do not want to perform
|
|
// an automatic reboot of the process. Return an error that can be handled.
|
|
//
|
|
// If timeout is set to 0, always reboot the server (this is probably a terrible idea, but some people want it)
|
|
if timeout != 0 && !c.IsZero() && c.Add(time.Second*time.Duration(config.Get().System.CrashDetection.Timeout)).After(time.Now()) {
|
|
s.PublishConsoleOutputFromDaemon("Aborting automatic restart, last crash occurred less than " + strconv.Itoa(timeout) + " seconds ago.")
|
|
return &crashTooFrequent{}
|
|
}
|
|
|
|
s.crasher.SetLastCrash(time.Now())
|
|
|
|
return errors.Wrap(s.HandlePowerAction(PowerActionStart), "failed to start server after crash detection")
|
|
}
|