2018-06-25 18:22:35 +08:00
|
|
|
// Copyright 2018 fatedier, fatedier@gmail.com
|
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
|
|
|
|
2018-12-09 22:06:22 +08:00
|
|
|
package health
|
2018-06-25 18:22:35 +08:00
|
|
|
|
|
|
|
import (
|
2018-07-16 01:21:29 +08:00
|
|
|
"context"
|
2018-12-07 17:05:36 +08:00
|
|
|
"errors"
|
|
|
|
"fmt"
|
2018-07-16 01:21:29 +08:00
|
|
|
"net"
|
|
|
|
"net/http"
|
|
|
|
"time"
|
2018-12-07 17:05:36 +08:00
|
|
|
|
|
|
|
"github.com/fatedier/frp/utils/log"
|
|
|
|
)
|
|
|
|
|
|
|
|
// ErrHealthCheckType is the error reported when a health check is requested
// for a check type other than "tcp" or "http".
var ErrHealthCheckType = errors.New("error health check type")
|
|
|
|
|
|
|
|
type HealthCheckMonitor struct {
|
2018-07-16 01:21:29 +08:00
|
|
|
checkType string
|
|
|
|
interval time.Duration
|
|
|
|
timeout time.Duration
|
|
|
|
maxFailedTimes int
|
|
|
|
|
|
|
|
// For tcp
|
|
|
|
addr string
|
|
|
|
|
|
|
|
// For http
|
|
|
|
url string
|
|
|
|
|
|
|
|
failedTimes uint64
|
|
|
|
statusOK bool
|
|
|
|
statusNormalFn func()
|
|
|
|
statusFailedFn func()
|
|
|
|
|
|
|
|
ctx context.Context
|
|
|
|
cancel context.CancelFunc
|
2018-12-07 17:05:36 +08:00
|
|
|
|
|
|
|
l log.Logger
|
2018-06-25 18:22:35 +08:00
|
|
|
}
|
|
|
|
|
2018-07-16 01:21:29 +08:00
|
|
|
func NewHealthCheckMonitor(checkType string, intervalS int, timeoutS int, maxFailedTimes int, addr string, url string,
|
|
|
|
statusNormalFn func(), statusFailedFn func()) *HealthCheckMonitor {
|
|
|
|
|
|
|
|
if intervalS <= 0 {
|
|
|
|
intervalS = 10
|
|
|
|
}
|
|
|
|
if timeoutS <= 0 {
|
|
|
|
timeoutS = 3
|
|
|
|
}
|
|
|
|
if maxFailedTimes <= 0 {
|
|
|
|
maxFailedTimes = 1
|
|
|
|
}
|
|
|
|
ctx, cancel := context.WithCancel(context.Background())
|
2018-06-25 18:22:35 +08:00
|
|
|
return &HealthCheckMonitor{
|
2018-07-16 01:21:29 +08:00
|
|
|
checkType: checkType,
|
|
|
|
interval: time.Duration(intervalS) * time.Second,
|
|
|
|
timeout: time.Duration(timeoutS) * time.Second,
|
|
|
|
maxFailedTimes: maxFailedTimes,
|
|
|
|
addr: addr,
|
|
|
|
url: url,
|
|
|
|
statusOK: false,
|
|
|
|
statusNormalFn: statusNormalFn,
|
|
|
|
statusFailedFn: statusFailedFn,
|
|
|
|
ctx: ctx,
|
|
|
|
cancel: cancel,
|
2018-06-25 18:22:35 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-12-07 17:05:36 +08:00
|
|
|
func (monitor *HealthCheckMonitor) SetLogger(l log.Logger) {
|
|
|
|
monitor.l = l
|
|
|
|
}
|
|
|
|
|
2018-06-25 18:22:35 +08:00
|
|
|
func (monitor *HealthCheckMonitor) Start() {
|
2018-07-16 01:21:29 +08:00
|
|
|
go monitor.checkWorker()
|
|
|
|
}
|
|
|
|
|
|
|
|
func (monitor *HealthCheckMonitor) Stop() {
|
|
|
|
monitor.cancel()
|
|
|
|
}
|
|
|
|
|
|
|
|
func (monitor *HealthCheckMonitor) checkWorker() {
|
|
|
|
for {
|
|
|
|
ctx, cancel := context.WithDeadline(monitor.ctx, time.Now().Add(monitor.timeout))
|
2018-12-07 17:05:36 +08:00
|
|
|
err := monitor.doCheck(ctx)
|
2018-07-16 01:21:29 +08:00
|
|
|
|
|
|
|
// check if this monitor has been closed
|
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
|
|
|
cancel()
|
|
|
|
return
|
|
|
|
default:
|
|
|
|
cancel()
|
|
|
|
}
|
|
|
|
|
2018-12-07 17:05:36 +08:00
|
|
|
if err == nil {
|
|
|
|
if monitor.l != nil {
|
|
|
|
monitor.l.Trace("do one health check success")
|
|
|
|
}
|
2018-07-16 01:21:29 +08:00
|
|
|
if !monitor.statusOK && monitor.statusNormalFn != nil {
|
2018-12-07 17:05:36 +08:00
|
|
|
if monitor.l != nil {
|
|
|
|
monitor.l.Info("health check status change to success")
|
|
|
|
}
|
2018-07-16 01:21:29 +08:00
|
|
|
monitor.statusOK = true
|
|
|
|
monitor.statusNormalFn()
|
|
|
|
}
|
|
|
|
} else {
|
2018-12-07 17:05:36 +08:00
|
|
|
if monitor.l != nil {
|
|
|
|
monitor.l.Warn("do one health check failed: %v", err)
|
|
|
|
}
|
2018-07-16 01:21:29 +08:00
|
|
|
monitor.failedTimes++
|
|
|
|
if monitor.statusOK && int(monitor.failedTimes) >= monitor.maxFailedTimes && monitor.statusFailedFn != nil {
|
2018-12-07 17:05:36 +08:00
|
|
|
if monitor.l != nil {
|
|
|
|
monitor.l.Warn("health check status change to failed")
|
|
|
|
}
|
2018-07-16 01:21:29 +08:00
|
|
|
monitor.statusOK = false
|
|
|
|
monitor.statusFailedFn()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
time.Sleep(monitor.interval)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-12-07 17:05:36 +08:00
|
|
|
func (monitor *HealthCheckMonitor) doCheck(ctx context.Context) error {
|
2018-07-16 01:21:29 +08:00
|
|
|
switch monitor.checkType {
|
|
|
|
case "tcp":
|
|
|
|
return monitor.doTcpCheck(ctx)
|
|
|
|
case "http":
|
|
|
|
return monitor.doHttpCheck(ctx)
|
|
|
|
default:
|
2018-12-07 17:05:36 +08:00
|
|
|
return ErrHealthCheckType
|
2018-07-16 01:21:29 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-12-07 17:05:36 +08:00
|
|
|
func (monitor *HealthCheckMonitor) doTcpCheck(ctx context.Context) error {
|
|
|
|
// if tcp address is not specified, always return nil
|
|
|
|
if monitor.addr == "" {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2018-07-16 01:21:29 +08:00
|
|
|
var d net.Dialer
|
|
|
|
conn, err := d.DialContext(ctx, "tcp", monitor.addr)
|
|
|
|
if err != nil {
|
2018-12-07 17:05:36 +08:00
|
|
|
return err
|
2018-07-16 01:21:29 +08:00
|
|
|
}
|
|
|
|
conn.Close()
|
2018-12-07 17:05:36 +08:00
|
|
|
return nil
|
2018-07-16 01:21:29 +08:00
|
|
|
}
|
|
|
|
|
2018-12-07 17:05:36 +08:00
|
|
|
func (monitor *HealthCheckMonitor) doHttpCheck(ctx context.Context) error {
|
2018-07-16 01:21:29 +08:00
|
|
|
req, err := http.NewRequest("GET", monitor.url, nil)
|
|
|
|
if err != nil {
|
2018-12-07 17:05:36 +08:00
|
|
|
return err
|
2018-07-16 01:21:29 +08:00
|
|
|
}
|
|
|
|
resp, err := http.DefaultClient.Do(req)
|
|
|
|
if err != nil {
|
2018-12-07 17:05:36 +08:00
|
|
|
return err
|
2018-07-16 01:21:29 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
if resp.StatusCode/100 != 2 {
|
2018-12-07 17:05:36 +08:00
|
|
|
return fmt.Errorf("do http health check, StatusCode is [%d] not 2xx", resp.StatusCode)
|
2018-07-16 01:21:29 +08:00
|
|
|
}
|
2018-12-07 17:05:36 +08:00
|
|
|
return nil
|
2018-06-25 18:22:35 +08:00
|
|
|
}
|