2019-06-07 07:10:43 -05:00
|
|
|
/*
|
|
|
|
*
|
|
|
|
* Copyright 2018 gRPC authors.
|
|
|
|
*
|
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
* you may not use this file except in compliance with the License.
|
|
|
|
* You may obtain a copy of the License at
|
|
|
|
*
|
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
*
|
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
* See the License for the specific language governing permissions and
|
|
|
|
* limitations under the License.
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
|
|
|
|
package health
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
|
|
|
"fmt"
|
|
|
|
"io"
|
|
|
|
"time"
|
|
|
|
|
|
|
|
"google.golang.org/grpc"
|
|
|
|
"google.golang.org/grpc/codes"
|
2019-08-14 10:41:27 -04:00
|
|
|
"google.golang.org/grpc/connectivity"
|
2019-06-07 07:10:43 -05:00
|
|
|
healthpb "google.golang.org/grpc/health/grpc_health_v1"
|
|
|
|
"google.golang.org/grpc/internal"
|
|
|
|
"google.golang.org/grpc/internal/backoff"
|
|
|
|
"google.golang.org/grpc/status"
|
|
|
|
)
|
|
|
|
|
2020-07-07 16:22:30 -05:00
|
|
|
var (
|
|
|
|
backoffStrategy = backoff.DefaultExponential
|
|
|
|
backoffFunc = func(ctx context.Context, retries int) bool {
|
|
|
|
d := backoffStrategy.Backoff(retries)
|
|
|
|
timer := time.NewTimer(d)
|
|
|
|
select {
|
|
|
|
case <-timer.C:
|
|
|
|
return true
|
|
|
|
case <-ctx.Done():
|
|
|
|
timer.Stop()
|
|
|
|
return false
|
|
|
|
}
|
2019-06-07 07:10:43 -05:00
|
|
|
}
|
2020-07-07 16:22:30 -05:00
|
|
|
)
|
2019-06-07 07:10:43 -05:00
|
|
|
|
|
|
|
func init() {
|
|
|
|
internal.HealthCheckFunc = clientHealthCheck
|
|
|
|
}
|
|
|
|
|
2019-08-14 10:41:27 -04:00
|
|
|
// healthCheckMethod is the full method name passed to newStream when
// clientHealthCheck opens a health-check stream.
const healthCheckMethod string = "/grpc.health.v1.Health/Watch"
|
|
|
|
|
|
|
|
// This function implements the protocol defined at:
|
|
|
|
// https://github.com/grpc/grpc/blob/master/doc/health-checking.md
|
|
|
|
func clientHealthCheck(ctx context.Context, newStream func(string) (interface{}, error), setConnectivityState func(connectivity.State), service string) error {
|
2019-06-07 07:10:43 -05:00
|
|
|
tryCnt := 0
|
|
|
|
|
|
|
|
retryConnection:
|
|
|
|
for {
|
|
|
|
// Backs off if the connection has failed in some way without receiving a message in the previous retry.
|
|
|
|
if tryCnt > 0 && !backoffFunc(ctx, tryCnt-1) {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
tryCnt++
|
|
|
|
|
|
|
|
if ctx.Err() != nil {
|
|
|
|
return nil
|
|
|
|
}
|
2019-08-14 10:41:27 -04:00
|
|
|
setConnectivityState(connectivity.Connecting)
|
|
|
|
rawS, err := newStream(healthCheckMethod)
|
2019-06-07 07:10:43 -05:00
|
|
|
if err != nil {
|
|
|
|
continue retryConnection
|
|
|
|
}
|
|
|
|
|
|
|
|
s, ok := rawS.(grpc.ClientStream)
|
|
|
|
// Ideally, this should never happen. But if it happens, the server is marked as healthy for LBing purposes.
|
|
|
|
if !ok {
|
2019-08-14 10:41:27 -04:00
|
|
|
setConnectivityState(connectivity.Ready)
|
2019-06-07 07:10:43 -05:00
|
|
|
return fmt.Errorf("newStream returned %v (type %T); want grpc.ClientStream", rawS, rawS)
|
|
|
|
}
|
|
|
|
|
|
|
|
if err = s.SendMsg(&healthpb.HealthCheckRequest{Service: service}); err != nil && err != io.EOF {
|
|
|
|
// Stream should have been closed, so we can safely continue to create a new stream.
|
|
|
|
continue retryConnection
|
|
|
|
}
|
|
|
|
s.CloseSend()
|
|
|
|
|
|
|
|
resp := new(healthpb.HealthCheckResponse)
|
|
|
|
for {
|
|
|
|
err = s.RecvMsg(resp)
|
|
|
|
|
|
|
|
// Reports healthy for the LBing purposes if health check is not implemented in the server.
|
|
|
|
if status.Code(err) == codes.Unimplemented {
|
2019-08-14 10:41:27 -04:00
|
|
|
setConnectivityState(connectivity.Ready)
|
2019-06-07 07:10:43 -05:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
// Reports unhealthy if server's Watch method gives an error other than UNIMPLEMENTED.
|
|
|
|
if err != nil {
|
2019-08-14 10:41:27 -04:00
|
|
|
setConnectivityState(connectivity.TransientFailure)
|
2019-06-07 07:10:43 -05:00
|
|
|
continue retryConnection
|
|
|
|
}
|
|
|
|
|
2020-07-07 16:22:30 -05:00
|
|
|
// As a message has been received, removes the need for backoff for the next retry by resetting the try count.
|
2019-06-07 07:10:43 -05:00
|
|
|
tryCnt = 0
|
2019-08-14 10:41:27 -04:00
|
|
|
if resp.Status == healthpb.HealthCheckResponse_SERVING {
|
|
|
|
setConnectivityState(connectivity.Ready)
|
|
|
|
} else {
|
|
|
|
setConnectivityState(connectivity.TransientFailure)
|
|
|
|
}
|
2019-06-07 07:10:43 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|