refactor error reporting
This commit is contained in:
parent
85e8dea086
commit
3fb58e9077
|
|
@ -76,8 +76,9 @@ func (c *Controller) nodeIsReady(node *v1.Node) bool {
|
|||
}
|
||||
|
||||
func (c *Controller) moveMasterPodsOffNode(node *v1.Node) {
|
||||
|
||||
nodeName := util.NameFromMeta(node.ObjectMeta)
|
||||
c.logger.Infof("moving pods: node %q became unschedulable and does not have a ready label: %q",
|
||||
c.logger.Infof("moving pods: node %q became unschedulable and does not have a ready label %q",
|
||||
nodeName, c.opConfig.NodeReadinessLabel)
|
||||
|
||||
opts := metav1.ListOptions{
|
||||
|
|
@ -85,7 +86,7 @@ func (c *Controller) moveMasterPodsOffNode(node *v1.Node) {
|
|||
}
|
||||
podList, err := c.KubeClient.Pods(c.opConfig.WatchedNamespace).List(opts)
|
||||
if err != nil {
|
||||
c.logger.Errorf("could not fetch list of the pods: %v", err)
|
||||
c.logger.Errorf("could not fetch the list of Spilo pods: %v", err)
|
||||
return
|
||||
}
|
||||
|
||||
|
|
@ -96,21 +97,25 @@ func (c *Controller) moveMasterPodsOffNode(node *v1.Node) {
|
|||
}
|
||||
}
|
||||
|
||||
clusters := make(map[*cluster.Cluster]bool)
|
||||
movedMasterPods := 0
|
||||
movableMasterPods := make(map[*v1.Pod]*cluster.Cluster)
|
||||
movedPods := 0
|
||||
unmovableMasterPods := make(map[spec.NamespacedName]string) // podName -> reason
|
||||
unmovablePods := make(map[spec.NamespacedName]string)
|
||||
|
||||
clusters := make(map[*cluster.Cluster]bool)
|
||||
|
||||
for _, pod := range nodePods {
|
||||
|
||||
podName := util.NameFromMeta(pod.ObjectMeta)
|
||||
|
||||
role, ok := pod.Labels[c.opConfig.PodRoleLabel]
|
||||
|
||||
if !ok {
|
||||
unmovableMasterPods[podName] = fmt.Sprintf("could not move pod %q from node %q: pod has no role label %q", podName, nodeName, c.opConfig.PodRoleLabel)
|
||||
// pods with an unknown role cannot be safely moved to another node
|
||||
unmovablePods[podName] = fmt.Sprintf("could not move pod %q from node %q: pod has no role label %q", podName, nodeName, c.opConfig.PodRoleLabel)
|
||||
continue
|
||||
}
|
||||
|
||||
if cluster.PostgresRole(role) != cluster.Master {
|
||||
// deployments can transparently re-create replicas so we do not move away such pods
|
||||
if cluster.PostgresRole(role) == cluster.Replica {
|
||||
continue
|
||||
}
|
||||
|
||||
|
|
@ -120,7 +125,7 @@ func (c *Controller) moveMasterPodsOffNode(node *v1.Node) {
|
|||
cl, ok := c.clusters[clusterName]
|
||||
c.clustersMu.RUnlock()
|
||||
if !ok {
|
||||
unmovableMasterPods[podName] = fmt.Sprintf("could not move pod %q from node %q: pod belongs to the unknown Postgres cluster %q", podName, nodeName, clusterName)
|
||||
unmovablePods[podName] = fmt.Sprintf("could not move master pod %q from node %q: pod belongs to an unknown Postgres cluster %q", podName, nodeName, clusterName)
|
||||
continue
|
||||
}
|
||||
|
||||
|
|
@ -136,12 +141,12 @@ func (c *Controller) moveMasterPodsOffNode(node *v1.Node) {
|
|||
}
|
||||
|
||||
for pod, cl := range movableMasterPods {
|
||||
podName := util.NameFromMeta(pod.ObjectMeta)
|
||||
|
||||
if err := cl.MigrateMasterPod(podName); err != nil {
|
||||
unmovableMasterPods[podName] = fmt.Sprintf("could not move master pod %q from node %q: %v", podName, nodeName, err)
|
||||
podName := util.NameFromMeta(pod.ObjectMeta)
|
||||
if err := cl.MigrateMasterPod(podName); err == nil {
|
||||
movedMasterPods++
|
||||
} else {
|
||||
movedPods++
|
||||
unmovablePods[podName] = fmt.Sprintf("could not move master pod %q from node %q: %v", podName, nodeName, err)
|
||||
}
|
||||
}
|
||||
|
||||
|
|
@ -149,18 +154,16 @@ func (c *Controller) moveMasterPodsOffNode(node *v1.Node) {
|
|||
cl.Unlock()
|
||||
}
|
||||
|
||||
totalPods := len(nodePods)
|
||||
|
||||
c.logger.Infof("%d out of %d master pods have been moved out from the node %q",
|
||||
movedPods, totalPods, nodeName)
|
||||
|
||||
if leftPods := totalPods - movedPods; leftPods > 0 {
|
||||
c.logger.Warnf("could not move %d master pods from the node %q, you may have to delete them manually:",
|
||||
leftPods, totalPods, nodeName)
|
||||
for _, reason := range unmovableMasterPods {
|
||||
if leftPods := len(unmovablePods); leftPods > 0 {
|
||||
c.logger.Warnf("could not move %d master or unknown role pods from the node %q, you may have to delete them manually",
|
||||
leftPods, nodeName)
|
||||
for _, reason := range unmovablePods {
|
||||
c.logger.Warning(reason)
|
||||
}
|
||||
}
|
||||
|
||||
c.logger.Infof("%d master pods have been moved out from the node %q", movedMasterPods, nodeName)
|
||||
|
||||
}
|
||||
|
||||
func (c *Controller) nodeDelete(obj interface{}) {
|
||||
|
|
|
|||
Loading…
Reference in New Issue