blob: 2df118738d7117bed171b9b079f9b23b795fb30d [file] [log] [blame]
Kent Hagerman2f0d0552020-04-23 17:28:52 -04001/*
Joey Armstrong7a9af442024-01-03 19:26:36 -05002 * Copyright 2018-2024 Open Networking Foundation (ONF) and the ONF Contributors
Kent Hagerman2f0d0552020-04-23 17:28:52 -04003
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7
8 * http://www.apache.org/licenses/LICENSE-2.0
9
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17package core
18
19import (
20 "context"
21 "errors"
22 "time"
23
khenaidood948f772021-08-11 17:49:24 -040024 "github.com/opencord/voltha-lib-go/v7/pkg/db"
25 "github.com/opencord/voltha-lib-go/v7/pkg/db/kvstore"
26 "github.com/opencord/voltha-lib-go/v7/pkg/log"
27 "github.com/opencord/voltha-lib-go/v7/pkg/probe"
Kent Hagerman2f0d0552020-04-23 17:28:52 -040028 "google.golang.org/grpc/codes"
29 "google.golang.org/grpc/status"
30)
31
Rohan Agrawal31f21802020-06-12 05:38:46 +000032func newKVClient(ctx context.Context, storeType string, address string, timeout time.Duration) (kvstore.Client, error) {
33 logger.Infow(ctx, "kv-store-type", log.Fields{"store": storeType})
Abhay Kumar4e0f37b2024-07-12 09:33:01 +053034 switch storeType {
35 case "etcd":
Rohan Agrawal31f21802020-06-12 05:38:46 +000036 return kvstore.NewEtcdClient(ctx, address, timeout, log.FatalLevel)
Abhay Kumar4e0f37b2024-07-12 09:33:01 +053037 case "redis":
38 return kvstore.NewRedisClient(address, timeout, false)
39 case "redis-sentinel":
40 return kvstore.NewRedisClient(address, timeout, true)
Kent Hagerman2f0d0552020-04-23 17:28:52 -040041 }
42 return nil, errors.New("unsupported-kv-store")
43}
44
45func stopKVClient(ctx context.Context, kvClient kvstore.Client) {
46 // Release all reservations
47 if err := kvClient.ReleaseAllReservations(ctx); err != nil {
Rohan Agrawal31f21802020-06-12 05:38:46 +000048 logger.Infow(ctx, "fail-to-release-all-reservations", log.Fields{"error": err})
Kent Hagerman2f0d0552020-04-23 17:28:52 -040049 }
50 // Close the DB connection
Rohan Agrawal31f21802020-06-12 05:38:46 +000051 kvClient.Close(ctx)
Kent Hagerman2f0d0552020-04-23 17:28:52 -040052}
53
54// waitUntilKVStoreReachableOrMaxTries will wait until it can connect to a KV store or until maxtries has been reached
khenaidood948f772021-08-11 17:49:24 -040055func waitUntilKVStoreReachableOrMaxTries(ctx context.Context, kvClient kvstore.Client, maxRetries int, retryInterval time.Duration, serviceName string) error {
Rohan Agrawal31f21802020-06-12 05:38:46 +000056 logger.Infow(ctx, "verifying-KV-store-connectivity", log.Fields{"retries": maxRetries, "retryInterval": retryInterval})
Kent Hagerman2f0d0552020-04-23 17:28:52 -040057 count := 0
58 for {
59 if !kvClient.IsConnectionUp(ctx) {
Rohan Agrawal31f21802020-06-12 05:38:46 +000060 logger.Info(ctx, "KV-store-unreachable")
Kent Hagerman2f0d0552020-04-23 17:28:52 -040061 if maxRetries != -1 {
62 if count >= maxRetries {
63 return status.Error(codes.Unavailable, "kv store unreachable")
64 }
65 }
66 count++
67
68 // Take a nap before retrying
69 select {
70 case <-ctx.Done():
71 //ctx canceled
72 return ctx.Err()
73 case <-time.After(retryInterval):
74 }
Rohan Agrawal31f21802020-06-12 05:38:46 +000075 logger.Infow(ctx, "retry-KV-store-connectivity", log.Fields{"retryCount": count, "maxRetries": maxRetries, "retryInterval": retryInterval})
Kent Hagerman2f0d0552020-04-23 17:28:52 -040076 } else {
77 break
78 }
79 }
khenaidood948f772021-08-11 17:49:24 -040080 probe.UpdateStatusFromContext(ctx, serviceName, probe.ServiceStatusRunning)
Rohan Agrawal31f21802020-06-12 05:38:46 +000081 logger.Info(ctx, "KV-store-reachable")
Kent Hagerman2f0d0552020-04-23 17:28:52 -040082 return nil
83}
84
85/*
86 * Thread to monitor kvstore Liveness (connection status)
87 *
88 * This function constantly monitors Liveness State of kvstore as reported
89 * periodically by backend and updates the Status of kv-store service registered
90 * with rw_core probe.
91 *
92 * If no liveness event has been seen within a timeout, then the thread will
93 * perform a "liveness" check attempt, which will in turn trigger a liveness event on
94 * the liveness channel, true or false depending on whether the attempt succeeded.
95 *
96 * The gRPC server in turn monitors the state of the readiness probe and will
97 * start issuing UNAVAILABLE response while the probe is not ready.
98 */
khenaidood948f772021-08-11 17:49:24 -040099func monitorKVStoreLiveness(ctx context.Context, backend *db.Backend, serviceName string, liveProbeInterval, notLiveProbeInterval time.Duration) {
Rohan Agrawal31f21802020-06-12 05:38:46 +0000100 logger.Info(ctx, "start-monitoring-kvstore-liveness")
Kent Hagerman2f0d0552020-04-23 17:28:52 -0400101
102 // Instruct backend to create Liveness channel for transporting state updates
Rohan Agrawal31f21802020-06-12 05:38:46 +0000103 livenessChannel := backend.EnableLivenessChannel(ctx)
Kent Hagerman2f0d0552020-04-23 17:28:52 -0400104
khenaidood948f772021-08-11 17:49:24 -0400105 logger.Infow(ctx, "enabled-liveness-channel", log.Fields{"service-name": serviceName})
Kent Hagerman2f0d0552020-04-23 17:28:52 -0400106
107 // Default state for kvstore is alive for rw_core
108 timeout := liveProbeInterval
109loop:
110 for {
111 timeoutTimer := time.NewTimer(timeout)
112 select {
113
114 case liveness := <-livenessChannel:
khenaidood948f772021-08-11 17:49:24 -0400115 logger.Debugw(ctx, "received-liveness-change-notification", log.Fields{"liveness": liveness, "service-name": serviceName})
Kent Hagerman2f0d0552020-04-23 17:28:52 -0400116
117 if !liveness {
khenaidood948f772021-08-11 17:49:24 -0400118 probe.UpdateStatusFromContext(ctx, serviceName, probe.ServiceStatusNotReady)
119 logger.Infow(ctx, "service-not-ready", log.Fields{"service-name": serviceName})
Kent Hagerman2f0d0552020-04-23 17:28:52 -0400120
121 timeout = notLiveProbeInterval
122
123 } else {
khenaidood948f772021-08-11 17:49:24 -0400124 probe.UpdateStatusFromContext(ctx, serviceName, probe.ServiceStatusRunning)
125 logger.Infow(ctx, "service-ready", log.Fields{"service-name": serviceName})
Kent Hagerman2f0d0552020-04-23 17:28:52 -0400126
127 timeout = liveProbeInterval
128 }
129
130 if !timeoutTimer.Stop() {
131 <-timeoutTimer.C
132 }
133
134 case <-ctx.Done():
135 break loop
136
137 case <-timeoutTimer.C:
khenaidood948f772021-08-11 17:49:24 -0400138 logger.Infow(ctx, "perform-liveness-check-on-timeout", log.Fields{"service-name": serviceName})
Kent Hagerman2f0d0552020-04-23 17:28:52 -0400139
140 // Trigger Liveness check if no liveness update received within the timeout period.
141 // The Liveness check will push Live state to same channel which this routine is
142 // reading and processing. This, do it asynchronously to avoid blocking for
143 // backend response and avoid any possibility of deadlock
144 go backend.PerformLivenessCheck(ctx)
145 }
146 }
147}