| /* |
| * Copyright 2018-present Open Networking Foundation |
| |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| package main |
| |
| import ( |
| //"os" |
| "fmt" |
| "time" |
| "regexp" |
| "errors" |
| "strconv" |
| //"io/ioutil" |
| //"encoding/json" |
| |
| "k8s.io/client-go/rest" |
| "google.golang.org/grpc" |
| "golang.org/x/net/context" |
| "k8s.io/client-go/kubernetes" |
| "github.com/golang/protobuf/ptypes" |
| //"k8s.io/apimachinery/pkg/api/errors" |
| "github.com/opencord/voltha-go/common/log" |
| kafka "github.com/opencord/voltha-go/kafka" |
| metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" |
| empty "github.com/golang/protobuf/ptypes/empty" |
| vpb "github.com/opencord/voltha-go/protos/voltha" |
| cmn "github.com/opencord/voltha-go/protos/common" |
| pb "github.com/opencord/voltha-go/protos/afrouter" |
| ic "github.com/opencord/voltha-go/protos/inter_container" |
| ) |
| |
| type configConn struct { |
| Server string `json:"Server"` |
| Cluster string `json:"Cluster"` |
| Backend string `json:"Backend"` |
| connections map[string]connection |
| } |
| |
// connection is a single named endpoint: an address and a port.
type connection struct {
	// Name is serialized under the JSON key "Connection".
	Name string `json:"Connection"`
	Addr string `json:"Addr"`
	Port uint64 `json:"Port"`
}
| |
// rwPod records what is known about one rw-core pod: its kubernetes name,
// IP address and node, the set of device ids it holds, and the router
// backend/connection names assigned to it.
type rwPod struct {
	name, ipAddr, node string
	// devIds is used as a set; only the keys carry information.
	devIds              map[string]struct{}
	backend, connection string
}
| |
| type podTrack struct { |
| pod *rwPod |
| dn bool |
| } |
| |
// nPods is the pod count used to size the core-group table; the table holds
// nPods>>1 groups.
var nPods = 6
| |
| // Topic is affinityRouter |
| // port: 9092 |
| |
| func newKafkaClient(clientType string, host string, port int, instanceID string) (kafka.Client, error) { |
| |
| log.Infow("kafka-client-type", log.Fields{"client": clientType}) |
| switch clientType { |
| case "sarama": |
| return kafka.NewSaramaClient( |
| kafka.Host(host), |
| kafka.Port(port), |
| kafka.ConsumerType(kafka.GroupCustomer), |
| kafka.ProducerReturnOnErrors(true), |
| kafka.ProducerReturnOnSuccess(true), |
| kafka.ProducerMaxRetries(6), |
| kafka.NumPartitions(3), |
| kafka.ConsumerGroupName(instanceID), |
| kafka.ConsumerGroupPrefix(instanceID), |
| kafka.AutoCreateTopic(false), |
| kafka.ProducerFlushFrequency(5), |
| kafka.ProducerRetryBackoff(time.Millisecond*30)), nil |
| } |
| return nil, errors.New("unsupported-client-type") |
| } |
| |
| |
| func k8sClientSet() *kubernetes.Clientset { |
| // creates the in-cluster config |
| config, err := rest.InClusterConfig() |
| if err != nil { |
| panic(err.Error()) |
| } |
| // creates the clientset |
| clientset, err := kubernetes.NewForConfig(config) |
| if err != nil { |
| panic(err.Error()) |
| } |
| |
| return clientset |
| } |
| |
| |
| func connect(addr string) (*grpc.ClientConn, error) { |
| for ctr :=0 ; ctr < 100; ctr++ { |
| log.Debugf("Trying to connect to %s", addr) |
| conn, err := grpc.Dial(addr, grpc.WithInsecure()) |
| if err != nil { |
| log.Debugf("Attempt to connect failed, retrying %v:", err) |
| } else { |
| log.Debugf("Connection succeeded") |
| return conn,err |
| } |
| time.Sleep(10 * time.Second) |
| } |
| log.Debugf("Too many connection attempts, giving up!") |
| return nil,errors.New("Timeout attempting to conect") |
| } |
| |
| func getRwPods(cs *kubernetes.Clientset, coreFilter * regexp.Regexp) []*rwPod { |
| var rtrn []*rwPod |
| |
| pods, err := cs.CoreV1().Pods("").List(metav1.ListOptions{}) |
| if err != nil { |
| panic(err.Error()) |
| } |
| //log.Debugf("There are a total of %d pods in the cluster\n", len(pods.Items)) |
| |
| for _,v := range pods.Items { |
| if v.Namespace == "voltha" && coreFilter.MatchString(v.Name) { |
| log.Debugf("Namespace: %s, PodName: %s, PodIP: %s, Host: %s\n", v.Namespace, v.Name, |
| v.Status.PodIP, v.Spec.NodeName) |
| // Only add the pod if it has an IP address. If it doesn't then it likely crashed and |
| // and is still in the process of getting re-started. |
| if v.Status.PodIP != "" { |
| rtrn = append(rtrn, &rwPod{name:v.Name,ipAddr:v.Status.PodIP,node:v.Spec.NodeName, |
| devIds:make(map[string]struct{}), backend:"", connection:""}) |
| } |
| } |
| } |
| return rtrn |
| } |
| |
| func reconcilePodDeviceIds(pod * rwPod, ids map[string]struct{}) bool { |
| var idList cmn.IDs |
| for k,_ := range ids { |
| idList.Items = append(idList.Items, &cmn.ID{Id:k}) |
| } |
| conn,err := connect(pod.ipAddr+":50057") |
| defer conn.Close() |
| if err != nil { |
| log.Debugf("Could not query devices from %s, could not connect", pod.name) |
| return false |
| } |
| client := vpb.NewVolthaServiceClient(conn) |
| _,err = client.ReconcileDevices(context.Background(), &idList) |
| if err != nil { |
| log.Error(err) |
| return false |
| } |
| |
| return true |
| } |
| |
| func queryPodDeviceIds(pod * rwPod) map[string]struct{} { |
| var rtrn map[string]struct{} = make(map[string]struct{}) |
| // Open a connection to the pod |
| // port 50057 |
| conn, err := connect(pod.ipAddr+":50057") |
| if err != nil { |
| log.Debugf("Could not query devices from %s, could not connect", pod.name) |
| return rtrn |
| } |
| defer conn.Close() |
| client := vpb.NewVolthaServiceClient(conn) |
| devs,err := client.ListDeviceIds(context.Background(), &empty.Empty{}) |
| if err != nil { |
| log.Error(err) |
| return rtrn |
| } |
| for _,dv := range devs.Items { |
| rtrn[dv.Id]=struct{}{} |
| } |
| |
| return rtrn |
| } |
| |
| func queryDeviceIds(pods []*rwPod) { |
| for pk,_ := range pods { |
| // Keep the old Id list if a new list is not returned |
| if idList := queryPodDeviceIds(pods[pk]); len(idList) != 0 { |
| pods[pk].devIds = idList |
| } |
| } |
| } |
| |
| func allEmpty(pods []*rwPod) bool { |
| for k,_ := range pods { |
| if len(pods[k].devIds) != 0 { |
| return false |
| } |
| } |
| return true |
| } |
| |
| //func groupEmptyCores(pods []*rwPod) [][]*rwPod { |
| // return [][]*rwPod{} |
| //} |
| |
| //func groupPods(pods []*rwPod) [][]*rwPod { |
| |
| // if allEmpty(pods) == true { |
| // return groupEmptyCores(pods) |
| // } else { |
| // return groupPopulatedCores(pods) |
| // } |
| //} |
| |
| func rmPod(pods []*rwPod, idx int) []*rwPod { |
| return append(pods[:idx],pods[idx+1:]...) |
| } |
| |
| func groupIntersectingPods1(pods []*rwPod, podCt int) ([][]*rwPod,[]*rwPod) { |
| var rtrn [][]*rwPod |
| var out []*rwPod |
| |
| for { |
| if len(pods) == 0 { |
| break |
| } |
| if len(pods[0].devIds) == 0 { // Ignore pods with no devices |
| ////log.Debugf("%s empty pod", pd[k].pod.name) |
| out = append(out, pods[0]) |
| pods = rmPod(pods, 0) |
| continue |
| } |
| // Start a pod group with this pod |
| var grp []*rwPod |
| grp = append(grp, pods[0]) |
| pods = rmPod(pods,0) |
| //log.Debugf("Creating new group %s", pd[k].pod.name) |
| // Find the peer pod based on device overlap |
| // It's ok if one isn't found, an empty one will be used instead |
| for k,_ := range pods { |
| if len(pods[k].devIds) == 0 { // Skip pods with no devices |
| //log.Debugf("%s empty pod", pd[k1].pod.name) |
| continue |
| } |
| if intersect(grp[0].devIds, pods[k].devIds) == true { |
| //log.Debugf("intersection found %s:%s", pd[k].pod.name, pd[k1].pod.name) |
| if grp[0].node == pods[k].node { |
| // This should never happen |
| log.Errorf("pods %s and %s intersect and are on the same server!! Not pairing", |
| grp[0].name, pods[k].name) |
| continue |
| } |
| grp = append(grp, pods[k]) |
| pods = rmPod(pods, k) |
| break |
| |
| } |
| } |
| rtrn = append(rtrn, grp) |
| //log.Debugf("Added group %s", grp[0].name) |
| // Check if the number of groups = half the pods, if so all groups are started. |
| if len(rtrn) == podCt >> 1 { |
| // Append any remaining pods to out |
| out = append(out,pods[0:]...) |
| break |
| } |
| } |
| return rtrn,out |
| } |
| |
| func groupIntersectingPods(pd []*podTrack) ([][]*rwPod,[]*podTrack) { |
| var rtrn [][]*rwPod |
| |
| for k,_ := range pd { |
| if pd[k].dn == true { // Already processed? |
| //log.Debugf("%s already processed", pd[k].pod.name) |
| continue |
| } |
| if len(pd[k].pod.devIds) == 0 { // Ignore pods with no devices |
| ////log.Debugf("%s empty pod", pd[k].pod.name) |
| continue |
| } |
| // Start a pod group with this pod |
| var grp []*rwPod |
| grp = append(grp, pd[k].pod) |
| pd[k].dn = true |
| //log.Debugf("Creating new group %s", pd[k].pod.name) |
| // Find the peer pod based on device overlap |
| // It's ok if one isn't found, an empty one will be used instead |
| for k1,_ := range pd { |
| if pd[k1].dn == true { // Skip over eliminated pods |
| //log.Debugf("%s eliminated pod", pd[k1].pod.name) |
| continue |
| } |
| if len(pd[k1].pod.devIds) == 0 { // Skip pods with no devices |
| //log.Debugf("%s empty pod", pd[k1].pod.name) |
| continue |
| } |
| if intersect(pd[k].pod.devIds, pd[k1].pod.devIds) == true { |
| //log.Debugf("intersection found %s:%s", pd[k].pod.name, pd[k1].pod.name) |
| if pd[k].pod.node == pd[k1].pod.node { |
| // This should never happen |
| log.Errorf("pods %s and %s intersect and are on the same server!! Not pairing", |
| pd[k].pod.name, pd[k1].pod.name) |
| continue |
| } |
| pd[k1].dn = true |
| grp = append(grp, pd[k1].pod) |
| break |
| } |
| } |
| rtrn = append(rtrn, grp) |
| //log.Debugf("Added group %s", grp[0].name) |
| // Check if the number of groups = half the pods, if so all groups are started. |
| if len(rtrn) == len(pd) >> 1 { |
| break |
| } |
| } |
| return rtrn,pd |
| } |
| |
| func unallocPodCount(pd []*podTrack) int { |
| var rtrn int = 0 |
| for _,v := range pd { |
| if v.dn == false { |
| rtrn++ |
| } |
| } |
| return rtrn |
| } |
| |
| |
| func sameNode(pod *rwPod, grps [][]*rwPod) bool { |
| for _,v := range grps { |
| if v[0].node == pod.node { |
| return true |
| } |
| if len(v) == 2 && v[1].node == pod.node { |
| return true |
| } |
| } |
| return false |
| } |
| |
| func startRemainingGroups1(grps [][]*rwPod, pods []*rwPod, podCt int) ([][]*rwPod, []*rwPod) { |
| var grp []*rwPod |
| |
| for k,_ := range pods { |
| if sameNode(pods[k], grps) { |
| continue |
| } |
| grp = []*rwPod{} |
| grp = append(grp, pods[k]) |
| pods = rmPod(pods, k) |
| grps = append(grps, grp) |
| if len(grps) == podCt >> 1 { |
| break |
| } |
| } |
| return grps, pods |
| } |
| |
| func startRemainingGroups(grps [][]*rwPod, pd []*podTrack) ([][]*rwPod, []*podTrack) { |
| var grp []*rwPod |
| |
| for k,_ := range pd { |
| if sameNode(pd[k].pod, grps) == true { |
| continue |
| } |
| grp = append(grp, pd[k].pod) |
| grps = append(grps, grp) |
| pd[k].dn = true |
| if len(grps) == len(pd) >> 1 { |
| break |
| } |
| } |
| return grps, pd |
| } |
| |
| func hasSingleSecondNode(grp []*rwPod) bool { |
| var srvrs map[string]struct{} = make(map[string]struct{}) |
| for k,_ := range grp { |
| if k == 0 { |
| continue // Ignore the first item |
| } |
| srvrs[grp[k].node] = struct{}{} |
| } |
| if len(srvrs) == 1 { |
| return true |
| } |
| return false |
| } |
| |
| func addNode(grps [][]*rwPod, idx *rwPod, item *rwPod) [][]*rwPod { |
| for k,_ := range grps { |
| if grps[k][0].name == idx.name { |
| grps[k] = append(grps[k], item) |
| return grps |
| } |
| } |
| // TODO: Error checking required here. |
| return grps |
| } |
| |
| func removeNode(grps [][]*rwPod, item *rwPod) [][]*rwPod { |
| for k,_ := range grps { |
| for k1,_ := range grps[k] { |
| if grps[k][k1].name == item.name { |
| grps[k] = append(grps[k][:k1],grps[k][k1+1:]...) |
| break |
| } |
| } |
| } |
| return grps |
| } |
| |
| func groupRemainingPods1(grps [][]*rwPod, pods []*rwPod) [][]*rwPod { |
| var lgrps [][]*rwPod |
| // All groups must be started when this function is called. |
| // Copy incomplete groups |
| for k,_ := range grps { |
| if len(grps[k]) != 2 { |
| lgrps = append(lgrps, grps[k]) |
| } |
| } |
| |
| // Add all pairing candidates to each started group. |
| for k,_ := range pods { |
| for k2,_ := range lgrps { |
| if lgrps[k2][0].node != pods[k].node { |
| lgrps[k2] = append(lgrps[k2], pods[k]) |
| } |
| } |
| } |
| |
| //TODO: If any member of lgrps doesn't have at least 2 |
| // nodes something is wrong. Check for that here |
| |
| for { |
| for { // Address groups with only a single server choice |
| var ssn bool = false |
| |
| for k,_ := range lgrps { |
| // Now if any of the groups only have a single |
| // node as the choice for the second member |
| // address that one first. |
| if hasSingleSecondNode(lgrps[k]) == true { |
| ssn = true |
| // Add this pairing to the groups |
| grps = addNode(grps, lgrps[k][0], lgrps[k][1]) |
| // Since this node is now used, remove it from all |
| // remaining tenative groups |
| lgrps = removeNode(lgrps, lgrps[k][1]) |
| // Now remove this group completely since |
| // it's been addressed |
| lgrps = append(lgrps[:k],lgrps[k+1:]...) |
| break |
| } |
| } |
| if ssn == false { |
| break |
| } |
| } |
| // Now adress one of the remaining groups |
| if len(lgrps) == 0 { |
| break // Nothing left to do, exit the loop |
| } |
| grps = addNode(grps, lgrps[0][0], lgrps[0][1]) |
| lgrps = removeNode(lgrps, lgrps[0][1]) |
| lgrps = append(lgrps[:0],lgrps[1:]...) |
| } |
| return grps |
| } |
| |
| func groupRemainingPods(grps [][]*rwPod, pd []*podTrack) [][]*rwPod{ |
| var lgrps [][]*rwPod |
| // All groups must be started when this function is called. |
| // Copy incomplete groups |
| for k,_ := range grps { |
| if len(grps[k]) != 2 { |
| lgrps = append(lgrps, grps[k]) |
| } |
| } |
| |
| // Add all pairing candidates to each started group. |
| for k,_ := range pd { |
| if pd[k].dn == true { |
| continue |
| } |
| for k2,_ := range lgrps { |
| if lgrps[k2][0].node != pd[k].pod.node { |
| lgrps[k2] = append(lgrps[k2], pd[k].pod) |
| } |
| } |
| } |
| |
| //TODO: If any member of lgrps doesn't have at least 2 |
| // nodes something is wrong. Check for that here |
| |
| for { |
| for { // Address groups with only a single server choice |
| var ssn bool = false |
| |
| for k,_ := range lgrps { |
| // Now if any of the groups only have a single |
| // node as the choice for the second member |
| // address that one first. |
| if hasSingleSecondNode(lgrps[k]) == true { |
| ssn = true |
| // Add this pairing to the groups |
| grps = addNode(grps, lgrps[k][0], lgrps[k][1]) |
| // Since this node is now used, remove it from all |
| // remaining tenative groups |
| lgrps = removeNode(lgrps, lgrps[k][1]) |
| // Now remove this group completely since |
| // it's been addressed |
| lgrps = append(lgrps[:k],lgrps[k+1:]...) |
| break |
| } |
| } |
| if ssn == false { |
| break |
| } |
| } |
| // Now adress one of the remaining groups |
| if len(lgrps) == 0 { |
| break // Nothing left to do, exit the loop |
| } |
| grps = addNode(grps, lgrps[0][0], lgrps[0][1]) |
| lgrps = removeNode(lgrps, lgrps[0][1]) |
| lgrps = append(lgrps[:0],lgrps[1:]...) |
| } |
| return grps |
| } |
| |
| func groupPods1(pods []*rwPod) [][]*rwPod { |
| var rtrn [][]*rwPod |
| var podCt int = len(pods) |
| |
| rtrn,pods = groupIntersectingPods1(pods, podCt) |
| // There are several outcomes here |
| // 1) All pods have been paired and we're done |
| // 2) Some un-allocated pods remain |
| // 2.a) All groups have been started |
| // 2.b) Not all groups have been started |
| if len(pods) == 0 { |
| return rtrn |
| } else if len(rtrn) == podCt >> 1 { // All groupings started |
| // Allocate the remaining (presumably empty) pods to the started groups |
| return groupRemainingPods1(rtrn, pods) |
| } else { // Some groupings started |
| // Start empty groups with remaining pods |
| // each grouping is on a different server then |
| // allocate remaining pods. |
| rtrn, pods = startRemainingGroups1(rtrn, pods, podCt) |
| return groupRemainingPods1(rtrn, pods) |
| } |
| } |
| |
| func groupPods(pods []*rwPod) [][]*rwPod { |
| var rtrn [][]*rwPod |
| var pd []*podTrack |
| |
| // Tracking of the grouping process |
| for k,_ := range pods { |
| pd = append(pd, &podTrack{pods[k],false}) |
| } |
| |
| |
| rtrn,pd = groupIntersectingPods(pd) |
| // There are several outcomes here |
| // 1) All pods have been paired and we're done |
| // 2) Some un-allocated pods remain |
| // 2.a) All groups have been started |
| // 2.b) Not all groups have been started |
| if unallocPodCount(pd) == 0 { |
| return rtrn |
| } else if len(rtrn) == len(pd) >> 1 { // All groupings started |
| // Allocate the remaining (presumably empty) pods to the started groups |
| return groupRemainingPods(rtrn, pd) |
| } else { // Some groupings started |
| // Start empty groups with remaining pods |
| // each grouping is on a different server then |
| // allocate remaining pods. |
| rtrn, pd = startRemainingGroups(rtrn, pd) |
| return groupRemainingPods(rtrn, pd) |
| } |
| |
| |
| // Establish groupings of non-empty pods that have overlapping devices. |
| for k,_ := range pd { |
| if pd[k].dn == true { // Already processed? |
| //log.Debugf("%s already processed", pd[k].pod.name) |
| continue |
| } |
| if len(pd[k].pod.devIds) == 0 { // Ignore pods with no devices |
| ////log.Debugf("%s empty pod", pd[k].pod.name) |
| continue |
| } |
| // Start a pod group with this pod |
| var grp []*rwPod |
| grp = append(grp, pd[k].pod) |
| pd[k].dn = true |
| //log.Debugf("Creating new group %s", pd[k].pod.name) |
| // Find the peer pod based on device overlap |
| // It's ok if one isn't found, an empty one will be used instead |
| for k1,_ := range pd { |
| if pd[k1].dn == true { // Skip over eliminated pods |
| //log.Debugf("%s eliminated pod", pd[k1].pod.name) |
| continue |
| } |
| if len(pd[k1].pod.devIds) == 0 { // Skip pods with no devices |
| //log.Debugf("%s empty pod", pd[k1].pod.name) |
| continue |
| } |
| if intersect(pd[k].pod.devIds, pd[k1].pod.devIds) == true { |
| //log.Debugf("intersection found %s:%s", pd[k].pod.name, pd[k1].pod.name) |
| pd[k1].dn = true |
| grp = append(grp, pd[k1].pod) |
| break |
| } |
| } |
| rtrn = append(rtrn, grp) |
| //log.Debugf("Added group %s", grp[0].name) |
| } |
| // Now find any grouping without 2 members and assign one of the |
| // pods with no devices and on a different server to it. |
| // If there are no pods with no devices left before all |
| // groups are filled report an exception but leave one of the |
| // groups with only one pod. |
| for k,_ := range rtrn { |
| if len(rtrn[k]) < 2 { |
| for k2,_ := range pd { |
| if pd[k2].dn == true { |
| continue |
| } |
| // There should be only empty pods here |
| if len(pd[k2].pod.devIds) != 0 { |
| log.Error("Non empty pod found where empty pod was expected") |
| continue |
| } |
| if pd[k2].pod.node == rtrn[k][0].node { |
| //log.Error("Pods aren't on different servers, continuing") |
| continue |
| } |
| // Add this empty and unused pod to the group |
| //log.Debugf("Adding empty pod %s", pd[k2].pod.name) |
| rtrn[k] = append(rtrn[k], pd[k2].pod) |
| pd[k2].dn = true |
| break |
| } |
| } |
| } |
| return rtrn |
| } |
| |
// intersect reports whether the two sets have at least one key in common.
func intersect(d1 map[string]struct{}, d2 map[string]struct{}) bool {
	for id := range d1 {
		if _, shared := d2[id]; shared {
			return true
		}
	}
	return false
}
| |
| func setConnection(client pb.ConfigurationClient, backend string, connection string, addr string, port uint64) { |
| log.Debugf("Configuring backend %s : connection %s\n\n", backend, connection) |
| cnf := &pb.Conn{Server:"grpc_command",Cluster:"vcore",Backend:backend, |
| Connection:connection,Addr:addr, |
| Port:port} |
| if res, err := client.SetConnection(context.Background(), cnf); err != nil { |
| log.Debugf("failed SetConnection RPC call: %s", err) |
| } else { |
| log.Debugf("Result: %v", res) |
| } |
| } |
| |
| func setAffinity(client pb.ConfigurationClient, ids map[string]struct{}, backend string) { |
| log.Debugf("Configuring backend %s : affinities \n", backend) |
| aff := &pb.Affinity{Router:"vcore",Route:"dev_manager",Cluster:"vcore",Backend:backend} |
| for k,_ := range ids { |
| log.Debugf("Setting affinity for id %s", k) |
| aff.Id = k |
| if res, err := client.SetAffinity(context.Background(), aff); err != nil { |
| log.Debugf("failed affinity RPC call: %s", err) |
| } else { |
| log.Debugf("Result: %v", res) |
| } |
| } |
| } |
| |
| func getBackendForCore(coreId string, coreGroups [][]*rwPod) string { |
| for _,v := range coreGroups { |
| for _,v2 := range v { |
| if v2.name == coreId { |
| return v2.backend |
| } |
| } |
| } |
| log.Errorf("No backend found for core %s\n", coreId) |
| return "" |
| } |
| |
| func monitorDiscovery(client pb.ConfigurationClient, |
| ch <-chan *ic.InterContainerMessage, |
| coreGroups [][]*rwPod) { |
| var id map[string]struct{} = make(map[string]struct{}) |
| |
| select { |
| case msg := <-ch: |
| log.Debugf("Received a device discovery notification") |
| device := &ic.DeviceDiscovered{} |
| if err := ptypes.UnmarshalAny(msg.Body, device); err != nil { |
| log.Errorf("Could not unmarshal received notification %v", msg) |
| } else { |
| // Set the affinity of the discovered device. |
| if be := getBackendForCore(device.Id, coreGroups); be != "" { |
| id[device.Id]=struct{}{} |
| setAffinity(client, id, be) |
| } else { |
| log.Error("Cant use an empty string as a backend name") |
| } |
| } |
| break |
| } |
| } |
| |
| func startDiscoveryMonitor(client pb.ConfigurationClient, |
| coreGroups [][]*rwPod) error { |
| var ch <-chan *ic.InterContainerMessage |
| // Connect to kafka for discovery events |
| topic := &kafka.Topic{Name: "AffinityRouter"} |
| kc,err := newKafkaClient("sarama", "kafka", 9092, "arouterd") |
| kc.Start() |
| |
| if ch, err = kc.Subscribe(topic); err != nil { |
| log.Error("Could not subscribe to the 'AffinityRouter' channel, discovery disabled") |
| return err |
| } |
| go monitorDiscovery(client, ch, coreGroups) |
| return nil |
| } |
| |
| // Determines which items in core groups |
| // have changed based on the list provided |
| // and returns a coreGroup with only the changed |
| // items and a pod list with the new items |
| func getAddrDiffs(coreGroups [][]*rwPod, rwPods []*rwPod) ([][]*rwPod, []*rwPod) { |
| var nList []*rwPod |
| var rtrn [][]*rwPod = make([][]*rwPod, nPods>>1) |
| var ipAddrs map[string]struct{} = make(map[string]struct{}) |
| |
| log.Debug("Get addr diffs") |
| |
| // Start with an empty array |
| for k,_ := range rtrn { |
| rtrn[k] = make([]*rwPod, 2) |
| } |
| |
| // Build a list with only the new items |
| for _,v := range rwPods { |
| if hasIpAddr(coreGroups, v.ipAddr) == false { |
| nList = append(nList, v) |
| } |
| ipAddrs[v.ipAddr] = struct{}{} // for the search below |
| } |
| |
| // Now build the coreGroups with only the changed items |
| for k1,v1 := range coreGroups { |
| for k2,v2 := range v1 { |
| if _,ok := ipAddrs[v2.ipAddr]; ok == false { |
| rtrn[k1][k2] = v2 |
| } |
| } |
| } |
| return rtrn, nList |
| } |
| |
| // Figure out where best to put the new pods |
| // in the coreGroup array based on the old |
| // pods being replaced. The criteria is that |
| // the new pod be on the same server as the |
| // old pod was. |
| func reconcileAddrDiffs(coreGroupDiffs [][]*rwPod, rwPodDiffs []*rwPod) ([][]*rwPod) { |
| var srvrs map[string][]*rwPod = make(map[string][]*rwPod) |
| |
| log.Debug("Reconciling diffs") |
| log.Debug("Building server list") |
| for _,v := range rwPodDiffs { |
| log.Debugf("Adding %v to the server list", *v) |
| srvrs[v.node] = append(srvrs[v.node], v) |
| } |
| |
| for k1,v1 := range coreGroupDiffs { |
| log.Debugf("k1:%v, v1:%v", k1,v1) |
| for k2,v2 := range v1 { |
| log.Debugf("k2:%v, v2:%v", k2,v2) |
| if v2 == nil { // Nothing to do here |
| continue |
| } |
| if _,ok := srvrs[v2.node]; ok == true { |
| coreGroupDiffs[k1][k2] = srvrs[v2.node][0] |
| if len(srvrs[v2.node]) > 1 { // remove one entry from the list |
| srvrs[v2.node] = append(srvrs[v2.node][:0], srvrs[v2.node][1:]...) |
| } else { // Delete the endtry from the map |
| delete(srvrs, v2.node) |
| } |
| } else { |
| log.Error("This should never happen, node appears to have changed names") |
| // attempt to limp along by keeping this old entry |
| } |
| } |
| } |
| |
| return coreGroupDiffs |
| } |
| |
| func applyAddrDiffs(client pb.ConfigurationClient, coreGroups [][]*rwPod, rwPods []*rwPod) { |
| var newEntries [][]*rwPod |
| |
| log.Debug("Applying diffs") |
| newEntries = reconcileAddrDiffs(getAddrDiffs(coreGroups, rwPods)) |
| |
| // Now replace the information in coreGropus with the new |
| // entries and then reconcile the device ids on the core |
| // that's in the new entry with the device ids of it's |
| // active-active peer. |
| for k1,v1 := range coreGroups { |
| for k2,v2 := range v1 { |
| if newEntries[k1][k2] != nil { |
| // TODO: Missing is the case where bothe the primary |
| // and the secondary core crash and come back. |
| // Pull the device ids from the active-active peer |
| ids := queryPodDeviceIds(coreGroups[k1][k2^1]) |
| if len(ids) != 0 { |
| if reconcilePodDeviceIds(newEntries[k1][k2], ids) == false { |
| log.Errorf("Attempt to reconcile ids on pod %v failed",newEntries[k1][k2]) |
| } |
| } |
| // Send the affininty router new connection information |
| setConnection(client, v2.backend, v2.connection, newEntries[k1][k2].ipAddr, 50057) |
| // Copy the new entry information over |
| coreGroups[k1][k2].ipAddr = newEntries[k1][k2].ipAddr |
| coreGroups[k1][k2].name = newEntries[k1][k2].name |
| coreGroups[k1][k2].devIds = ids |
| } |
| } |
| } |
| } |
| |
| func startCoreMonitor(client pb.ConfigurationClient, |
| clientset *kubernetes.Clientset, |
| coreFltr *regexp.Regexp, |
| coreGroups [][]*rwPod) error { |
| // Now that initial allocation has been completed, monitor the pods |
| // for IP changes |
| // The main loop needs to do the following: |
| // 1) Periodically query the pods and filter out |
| // the vcore ones |
| // 2) Validate that the pods running are the same |
| // as the previous check |
| // 3) Validate that the IP addresses are the same |
| // as the last check. |
| // If the pod name(s) ha(s/ve) changed then remove |
| // the unused pod names and add in the new pod names |
| // maintaining the cluster/backend information. |
| // If an IP address has changed (which shouldn't |
| // happen unless a pod is re-started) it should get |
| // caught by the pod name change. |
| for { |
| time.Sleep(10 * time.Second) // Wait a while |
| // Get the rw core list from k8s |
| rwPods := getRwPods(clientset, coreFltr) |
| queryDeviceIds(rwPods) |
| // If we didn't get 2n+1 pods then wait since |
| // something is down and will hopefully come |
| // back up at some point. |
| // TODO: remove the 6 pod hardcoding |
| if len(rwPods) != 6 { |
| continue |
| } |
| // We have all pods, check if any IP addresses |
| // have changed. |
| for _,v := range rwPods { |
| if hasIpAddr(coreGroups, v.ipAddr) == false { |
| log.Debug("Address has changed...") |
| applyAddrDiffs(client, coreGroups, rwPods) |
| |
| } |
| } |
| } |
| } |
| |
| func hasIpAddr(coreGroups [][]*rwPod, ipAddr string) bool { |
| for _,v1 := range coreGroups { |
| for _,v2 := range v1 { |
| if v2.ipAddr == ipAddr { |
| return true |
| } |
| } |
| } |
| return false |
| } |
| |
| |
| func main() { |
| // This is currently hard coded to a cluster with 3 servers |
| //var connections map[string]configConn = make(map[string]configConn) |
| //var rwCorePodsPrev map[string]rwPod = make(map[string]rwPod) |
| var rwCoreNodesPrev map[string][]rwPod = make(map[string][]rwPod) |
| var firstTime bool = true |
| var err error |
| var conn *grpc.ClientConn |
| |
| |
| // Set up the regular expression to identify the voltha cores |
| coreFltr := regexp.MustCompile(`rw-core[0-9]-`) |
| |
| // Set up logging |
| if _, err := log.SetDefaultLogger(log.JSON, 0, nil); err != nil { |
| log.With(log.Fields{"error": err}).Fatal("Cannot setup logging") |
| } |
| |
| // Set up kubernetes api |
| clientset := k8sClientSet() |
| |
| // Connect to the affinity router and set up the client |
| conn, err = connect("localhost:55554") // This is a sidecar container so communicating over localhost |
| if err != nil { |
| panic(err.Error()) |
| } |
| client := pb.NewConfigurationClient(conn) |
| |
| // Get the voltha rw-core podes |
| rwPods := getRwPods(clientset, coreFltr) |
| |
| // Fetch the devices held by each running core |
| queryDeviceIds(rwPods) |
| |
| // For debugging... comment out l8r |
| for _,v := range rwPods { |
| log.Debugf("Pod list %v", *v) |
| } |
| |
| coreGroups := groupPods1(rwPods) |
| |
| |
| // Assign the groupings to the the backends and connections |
| for k,_ := range coreGroups { |
| for k1,_ := range coreGroups[k] { |
| coreGroups[k][k1].backend = "vcore"+strconv.Itoa(k+1) |
| coreGroups[k][k1].connection = "vcore"+strconv.Itoa(k+1)+strconv.Itoa(k1+1) |
| } |
| } |
| log.Debug("Core gouping completed") |
| |
| // TODO: Debugging code, comment out for production |
| for k,v := range coreGroups { |
| for k2,v2 := range v { |
| log.Debugf("Core group %d,%d: %v", k, k2, v2) |
| } |
| } |
| log.Debug("Setting affinities") |
| // Now set the affinities for exising devices in the cores |
| for _,v := range coreGroups { |
| setAffinity(client, v[0].devIds, v[0].backend) |
| setAffinity(client, v[1].devIds, v[1].backend) |
| } |
| log.Debug("Setting connections") |
| // Configure the backeds based on the calculated core groups |
| for _,v := range coreGroups { |
| setConnection(client, v[0].backend, v[0].connection, v[0].ipAddr, 50057) |
| setConnection(client, v[1].backend, v[1].connection, v[1].ipAddr, 50057) |
| } |
| |
| log.Debug("Starting discovery monitoring") |
| startDiscoveryMonitor(client, coreGroups) |
| |
| log.Debugf("Starting core monitoring") |
| startCoreMonitor(client, clientset, coreFltr, coreGroups) // Never returns |
| return |
| |
| |
| // The main loop needs to do the following: |
| // 1) Periodically query the pods and filter out |
| // the vcore ones |
| // 2) Validate that the pods running are the same |
| // as the previous check |
| // 3) Validate that the IP addresses are the same |
| // as the last check. |
| // If the pod name(s) ha(s/ve) changed then remove |
| // the unused pod names and add in the new pod names |
| // maintaining the cluster/backend information. |
| // If an IP address has changed (which shouldn't |
| // happen unless a pod is re-started) it should get |
| // caught by the pod name change. |
| for { |
| var rwCorePods map[string]rwPod = make(map[string]rwPod) |
| var rwCoreNodes map[string][]rwPod = make(map[string][]rwPod) |
| pods, err := clientset.CoreV1().Pods("").List(metav1.ListOptions{}) |
| if err != nil { |
| panic(err.Error()) |
| } |
| log.Debugf("There are %d pods in the cluster\n", len(pods.Items)) |
| |
| /* |
| for k,v := range pods.Items { |
| if v.Namespace == "voltha" && coreFltr.MatchString(v.Name) { |
| fmt.Printf("Namespace: %s, PodName: %s, PodIP: %s, Host: %s\n", v.Namespace, v.Name, |
| v.Status.PodIP, v.Spec.NodeName) |
| //fmt.Printf("Pod %v,%v\n\n\n",k,v) |
| _ = k |
| // Add this pod to the core structure. |
| if firstTime == true { |
| rwCorePodsPrev[v.Name] = rwPod{name:v.Name,node:v.Spec.NodeName} |
| rwCoreNodesPrev[v.Spec.NodeName] = |
| append(rwCoreNodesPrev[v.Spec.NodeName], rwPod{name:v.Name,node:v.Spec.NodeName}) |
| } |
| rwCorePods[v.Name] = rwPod{v.Name,v.Status.PodIP,v.Spec.NodeName, "", ""} |
| rwCoreNodes[v.Spec.NodeName] = |
| append(rwCoreNodes[v.Spec.NodeName], rwPod{v.Name,v.Status.PodIP,v.Spec.NodeName,"",""}) |
| } |
| } |
| */ |
| |
| if len(rwCorePods) != 6 { |
| continue |
| } |
| |
| //fmt.Printf("Pod map: %v\n", rwCorePods) |
| //fmt.Printf("Pod map2: %v\n", rwCoreNodes) |
| |
| // Examples for error handling: |
| // - Use helper functions like e.g. errors.IsNotFound() |
| // - And/or cast to StatusError and use its properties like e.g. ErrStatus.Message |
| /* |
| _, err = clientset.CoreV1().Pods("default").Get("example-xxxxx", metav1.GetOptions{}) |
| if errors.IsNotFound(err) { |
| fmt.Printf("Pod not found\n") |
| } else if statusError, isStatus := err.(*errors.StatusError); isStatus { |
| fmt.Printf("Error getting pod %v\n", statusError.ErrStatus.Message) |
| } else if err != nil { |
| panic(err.Error()) |
| } else { |
| fmt.Printf("Found pod\n") |
| } |
| */ |
| // Set the association to backends and connections only once. |
| // TODO: This needs to be reworked for when a pod crashes |
| // and it's name changes. |
| if firstTime == true { |
| be := 1 |
| for k,_ := range rwCoreNodesPrev { // Each node has 2 cores running on it |
| // Use a pretty dumb distribution algorithm. |
| log.Debugf("Processing core node %s:%d\n", k,be) |
| rwCoreNodesPrev[k][0].backend = "vcore"+strconv.Itoa(be) |
| rwCoreNodesPrev[k][0].connection = "vcore"+strconv.Itoa(be)+strconv.Itoa(1) |
| rwCoreNodesPrev[k][1].backend = "vcore"+strconv.Itoa(be%3+1) |
| rwCoreNodesPrev[k][1].connection = "vcore"+strconv.Itoa(be%3+1)+strconv.Itoa(2) |
| be++ |
| } |
| } |
| |
| log.Debugf("Backend Allocation: %v",rwCoreNodesPrev) |
| // Compare the current node IPs with the previous node IPs and if they differ |
| // then set the new one and send the command to configure the router with the |
| // new backend connection. |
| for k,v := range rwCoreNodesPrev { |
| if rwCoreNodes[k][0].ipAddr != rwCoreNodesPrev[k][0].ipAddr { |
| log.Debugf("Configuring backend %s : connection %s\n\n", v[0].backend, v[0].connection) |
| cnf := &pb.Conn{Server:"grpc_command",Cluster:"vcore",Backend:rwCoreNodesPrev[k][0].backend, |
| Connection:rwCoreNodesPrev[k][0].connection,Addr:rwCoreNodes[k][0].ipAddr, |
| Port:50057} |
| if res, err := client.SetConnection(context.Background(), cnf); err != nil { |
| log.Debugf("failed SetConnection RPC call: %s", err) |
| } else { |
| log.Debugf("Result: %v", res) |
| rwCoreNodesPrev[k][0].ipAddr = rwCoreNodes[k][0].ipAddr |
| } |
| } |
| if rwCoreNodes[k][1].ipAddr != rwCoreNodesPrev[k][1].ipAddr { |
| log.Debugf("Configuring backend %s : connection %s\n\n", v[1].backend, v[1].connection) |
| cnf := &pb.Conn{Server:"grpc_command",Cluster:"vcore",Backend:rwCoreNodesPrev[k][1].backend, |
| Connection:rwCoreNodesPrev[k][1].connection,Addr:rwCoreNodes[k][1].ipAddr, |
| Port:50057} |
| if res, err := client.SetConnection(context.Background(), cnf); err != nil { |
| log.Debugf("failed SetConnection RPC call: %s", err) |
| } else { |
| log.Debugf("Result: %v", res) |
| rwCoreNodesPrev[k][1].ipAddr = rwCoreNodes[k][1].ipAddr |
| } |
| } |
| } |
| |
| |
| fmt.Printf("The structure for setting the connections is: %v\n", rwCoreNodesPrev) |
| firstTime = false |
| |
| // Now make the API calls |
| time.Sleep(10 * time.Second) |
| } |
| conn.Close() |
| |
| } |
| |