Compare commits

...

4 Commits

3 changed files with 118 additions and 84 deletions

View File

@ -205,10 +205,10 @@ command="systemctl restart foo.service",no-port-forwarding,no-x11-forwarding,no-
<details> <details>
<summary>{{ .Name }} and other template variables</summary> <summary>{{ .Name }} and other template variables</summary>
`{{ .Name }}` is the name of your site. - `{{ .Name }}` is the name of your site.
`{{ .Message }}` is either `went down` or `came back up`. - `{{ .Message }}` is either `went down` or `came back up`.
`{{ .Status }}` is either `up` or `down`. - `{{ .Status }}` is either `up` or `down`.
`{{ .Watchdog }}` is the name of your watchdog (useful if you have multiple). - `{{ .Watchdog }}` is the name of your watchdog (useful if you have multiple).
It refers to the name of the watch, which is "Example Site" in the sample config below. It refers to the name of the watch, which is "Example Site" in the sample config below.

View File

@ -5,41 +5,44 @@
export CGO_ENABLED=0 export CGO_ENABLED=0
exe=watchdog exe=watchdog
distpre=../..
gocmd=. gocmd=.
echo "" echo ""
go generate -mod=vendor ./... go generate -mod=vendor ./...
pushd cmd/${exe}
echo "" echo ""
echo "Windows amd64" echo "Windows amd64"
#GOOS=windows GOARCH=amd64 go build -mod=vendor -o dist/windows/amd64/${exe}.exe -ldflags "-H=windowsgui" $gocmd #GOOS=windows GOARCH=amd64 go build -mod=vendor -o ${distpre}/dist/windows/amd64/${exe}.exe -ldflags "-H=windowsgui" $gocmd
#GOOS=windows GOARCH=amd64 go build -mod=vendor -o dist/windows/amd64/${exe}.debug.exe #GOOS=windows GOARCH=amd64 go build -mod=vendor -o ${distpre}/dist/windows/amd64/${exe}.debug.exe
GOOS=windows GOARCH=amd64 go build -mod=vendor -o dist/windows/amd64/${exe}.exe GOOS=windows GOARCH=amd64 go build -mod=vendor -o ${distpre}/dist/windows/amd64/${exe}.exe
echo "Windows 386" echo "Windows 386"
#GOOS=windows GOARCH=386 go build -mod=vendor -o dist/windows/386/${exe}.exe -ldflags "-H=windowsgui" $gocmd #GOOS=windows GOARCH=386 go build -mod=vendor -o ${distpre}/dist/windows/386/${exe}.exe -ldflags "-H=windowsgui" $gocmd
#GOOS=windows GOARCH=386 go build -mod=vendor -o dist/windows/386/${exe}.debug.exe #GOOS=windows GOARCH=386 go build -mod=vendor -o ${distpre}/dist/windows/386/${exe}.debug.exe
GOOS=windows GOARCH=386 go build -mod=vendor -o dist/windows/386/${exe}.exe GOOS=windows GOARCH=386 go build -mod=vendor -o ${distpre}/dist/windows/386/${exe}.exe
echo "" echo ""
echo "Darwin (macOS) amd64" echo "Darwin (macOS) amd64"
GOOS=darwin GOARCH=amd64 go build -mod=vendor -o dist/darwin/amd64/${exe} $gocmd GOOS=darwin GOARCH=amd64 go build -mod=vendor -o ${distpre}/dist/darwin/amd64/${exe} $gocmd
echo "" echo ""
echo "Linux amd64" echo "Linux amd64"
GOOS=linux GOARCH=amd64 go build -mod=vendor -o dist/linux/amd64/${exe} $gocmd GOOS=linux GOARCH=amd64 go build -mod=vendor -o ${distpre}/dist/linux/amd64/${exe} $gocmd
echo "Linux 386" echo "Linux 386"
GOOS=linux GOARCH=386 go build -mod=vendor -o dist/linux/386/${exe} $gocmd GOOS=linux GOARCH=386 go build -mod=vendor -o ${distpre}/dist/linux/386/${exe} $gocmd
echo "" echo ""
echo "RPi 4 (64-bit) ARMv8" echo "RPi 4 (64-bit) ARMv8"
GOOS=linux GOARCH=arm64 go build -mod=vendor -o dist/linux/armv8/${exe} $gocmd GOOS=linux GOARCH=arm64 go build -mod=vendor -o ${distpre}/dist/linux/armv8/${exe} $gocmd
echo "RPi 3 B+ ARMv7" echo "RPi 3 B+ ARMv7"
GOOS=linux GOARCH=arm GOARM=7 go build -mod=vendor -o dist/linux/armv7/${exe} $gocmd GOOS=linux GOARCH=arm GOARM=7 go build -mod=vendor -o ${distpre}/dist/linux/armv7/${exe} $gocmd
echo "ARMv6" echo "ARMv6"
GOOS=linux GOARCH=arm GOARM=6 go build -mod=vendor -o dist/linux/armv6/${exe} $gocmd GOOS=linux GOARCH=arm GOARM=6 go build -mod=vendor -o ${distpre}/dist/linux/armv6/${exe} $gocmd
echo "RPi Zero ARMv5" echo "RPi Zero ARMv5"
GOOS=linux GOARCH=arm GOARM=5 go build -mod=vendor -o dist/linux/armv5/${exe} $gocmd GOOS=linux GOARCH=arm GOARM=5 go build -mod=vendor -o ${distpre}/dist/linux/armv5/${exe} $gocmd
echo "" echo ""
popd
rsync -av ./dist/ ubuntu@rootprojects.org:/srv/www/rootprojects.org/$exe/dist/ rsync -av ./dist/ ubuntu@rootprojects.org:/srv/www/rootprojects.org/$exe/dist/
# https://rootprojects.org/serviceman/dist/windows/amd64/serviceman.exe # https://rootprojects.org/serviceman/dist/windows/amd64/serviceman.exe

View File

@ -33,6 +33,12 @@ func (s Status) String() string {
} }
} }
const (
MessageDown = "went down"
MessageUp = "came back up"
MessageHiccup = "hiccupped"
)
type Dog struct { type Dog struct {
Watchdog string Watchdog string
Name string Name string
@ -47,15 +53,15 @@ type Dog struct {
status Status status Status
changed bool changed bool
error error error error
failures int //failures int
passes int //passes int
lastFailed time.Time //lastFailed time.Time
lastPassed time.Time //lastPassed time.Time
lastNotified time.Time //lastNotified time.Time
} }
func New(d *Dog) *Dog { func New(d *Dog) *Dog {
d.lastPassed = time.Now().Add(-5 * time.Minute) //d.lastPassed = time.Now().Add(-5 * time.Minute)
d.status = StatusUp d.status = StatusUp
d.changed = false d.changed = false
return d return d
@ -70,88 +76,87 @@ func (d *Dog) Watch() {
} }
} }
// Now that I've added the ability to notify when a server is back up
// this definitely needs some refactoring. It's bad now.
func (d *Dog) watch() { func (d *Dog) watch() {
d.Logger <- fmt.Sprintf("Check: '%s'", d.Name) d.Logger <- fmt.Sprintf("Check: '%s'", d.Name)
err := d.check() // This may be up or down
err := d.hardcheck()
if nil == err { if nil == err {
d.Logger <- fmt.Sprintf("Up: '%s'", d.Name)
// if it's down, coming up, notify
if d.changed { if d.changed {
d.notify("came back up") d.notify(MessageUp)
} }
return return
} }
time.Sleep(time.Duration(5) * time.Second) // If being down is a change, check to see if it's just a hiccup
if d.changed {
err2 := d.check() time.Sleep(time.Duration(5) * time.Second)
if nil != err2 { err2 := d.softcheck()
d.Logger <- fmt.Sprintf("Down: '%s': %s", d.Name, err2) if nil != err2 {
} else { // it's really down
d.Logger <- fmt.Sprintf("Hiccup: '%s': %s", d.Name, err) d.Logger <- fmt.Sprintf("Down: '%s': %s", d.Name, err2)
return } else {
// it's not really down, so reset the change info
d.changed = false
d.status = StatusUp
// and notify of the hiccup
d.Logger <- fmt.Sprintf("Hiccup: '%s': %s", d.Name, err)
d.notify(MessageHiccup)
return
}
} }
// TODO what if the server is flip-flopping rapidly?
// how to rate limit?
// "{{ .Server }} is on cooldown for 30 minutes"
// * We've had success since the last notification
// * It's been at least 5 minutes since the last notification
//fiveMinutesAgo := time.Now().Add(-5 * time.Minute)
//if d.lastPassed.After(d.lastNotified) && d.lastNotified.Before(fiveMinutesAgo) {
//}
t := 10 t := 10
for { for {
// try to recover, then backoff exponentially
d.recover() d.recover()
time.Sleep(time.Duration(t) * time.Second) time.Sleep(time.Duration(t) * time.Second)
// backoff
t *= 2 t *= 2
err := d.check() if t > 120 {
if nil != err { t = 120
d.Logger <- fmt.Sprintf("Unrecoverable: '%s': %s", d.Name, err)
} }
// We should notify if err := d.softcheck()
// * The status has changed if nil != err {
// // this is down, and we know it's down
// TODO what if the server is flip-flopping rapidly? d.status = StatusDown
// how to rate limit? d.Logger <- fmt.Sprintf("Unrecoverable: '%s': %s", d.Name, err)
// "{{ .Server }} is on cooldown for 30 minutes" if d.changed {
if d.changed { d.changed = false
d.notify("went down") d.notify(MessageDown)
if StatusUp == d.status {
break
} }
} else {
// * We've had success since the last notification // it came back up
// * It's been at least 5 minutes since the last notification d.status = StatusUp
//fiveMinutesAgo := time.Now().Add(-5 * time.Minute) d.Logger <- fmt.Sprintf("Up: '%s'", d.Name)
//if d.lastPassed.After(d.lastNotified) && d.lastNotified.Before(fiveMinutesAgo) { if d.changed {
//} // and the downtime was short - just a recovery
//if !failure || d.failures >= 5 { d.notify(MessageHiccup)
// go back to the main 5-minute loop } else {
// break // and the downtime was some time
//} d.notify(MessageUp)
}
d.changed = false
break
} }
} }
} }
func (d *Dog) check() error { func (d *Dog) softcheck() error {
previousStatus := d.status
var err error
defer func() {
// Are we up, or down?
if nil != err {
d.status = StatusDown
d.failures += 1
d.lastFailed = time.Now()
} else {
d.status = StatusUp
d.lastPassed = time.Now()
d.passes += 1
d.Logger <- fmt.Sprintf("Up: '%s'", d.Name)
}
// Has that changed?
if previousStatus != d.status {
d.changed = true
} else {
d.changed = false
}
}()
client := NewHTTPClient() client := NewHTTPClient()
response, err := client.Get(d.CheckURL) response, err := client.Get(d.CheckURL)
if nil != err { if nil != err {
@ -174,7 +179,7 @@ func (d *Dog) check() error {
} }
if "" != d.Badwords { if "" != d.Badwords {
if !bytes.Contains(b, []byte(d.Badwords)) { if bytes.Contains(b, []byte(d.Badwords)) {
err = fmt.Errorf("Down: '%s' Found for '%s'", d.Badwords, d.Name) err = fmt.Errorf("Down: '%s' Found for '%s'", d.Badwords, d.Name)
d.Logger <- fmt.Sprintf("%s", err) d.Logger <- fmt.Sprintf("%s", err)
d.error = err d.error = err
@ -185,6 +190,32 @@ func (d *Dog) check() error {
return nil return nil
} }
func (d *Dog) hardcheck() error {
previousStatus := d.status
err := d.softcheck()
// Are we up, or down?
if nil != err {
d.status = StatusDown
//d.failures += 1
//d.lastFailed = time.Now()
} else {
d.status = StatusUp
//d.lastPassed = time.Now()
//d.passes += 1
}
// Has that changed?
if previousStatus != d.status {
d.changed = true
} else {
d.changed = false
}
return err
}
func (d *Dog) recover() { func (d *Dog) recover() {
if "" == d.Recover { if "" == d.Recover {
return return
@ -214,7 +245,7 @@ func (d *Dog) recover() {
func (d *Dog) notify(msg string) { func (d *Dog) notify(msg string) {
d.Logger <- fmt.Sprintf("Notifying the authorities of %s's status change", d.Name) d.Logger <- fmt.Sprintf("Notifying the authorities of %s's status change", d.Name)
d.lastNotified = time.Now() //d.lastNotified = time.Now()
for i := range d.Webhooks { for i := range d.Webhooks {
name := d.Webhooks[i] name := d.Webhooks[i]