cs-codex-dist-tests/Framework/KubernetesWorkflow/K8sController.cs

712 lines
26 KiB
C#
Raw Normal View History

using k8s;
using k8s.Models;
2023-04-25 09:31:15 +00:00
using Logging;
using Utils;
namespace KubernetesWorkflow
2023-04-12 11:53:55 +00:00
{
public class K8sController
{
2023-09-12 08:31:55 +00:00
private readonly ILog log;
2023-04-12 11:53:55 +00:00
private readonly K8sCluster cluster;
private readonly KnownK8sPods knownPods;
private readonly WorkflowNumberSource workflowNumberSource;
2023-05-04 06:25:48 +00:00
private readonly K8sClient client;
2023-04-12 11:53:55 +00:00
2023-09-12 08:31:55 +00:00
public K8sController(ILog log, K8sCluster cluster, KnownK8sPods knownPods, WorkflowNumberSource workflowNumberSource, string k8sNamespace)
2023-04-12 11:53:55 +00:00
{
2023-04-25 09:31:15 +00:00
this.log = log;
2023-04-12 11:53:55 +00:00
this.cluster = cluster;
this.knownPods = knownPods;
this.workflowNumberSource = workflowNumberSource;
2023-05-04 06:25:48 +00:00
client = new K8sClient(cluster.GetK8sClientConfig());
2023-09-12 08:31:55 +00:00
K8sNamespace = k8sNamespace;
}
public void Dispose()
{
client.Dispose();
}
2023-09-25 06:47:19 +00:00
public RunningPod BringOnline(ContainerRecipe[] containerRecipes, ILocation location)
{
2023-04-25 09:31:15 +00:00
log.Debug();
EnsureNamespace();
2023-04-13 09:07:36 +00:00
var deploymentName = CreateDeployment(containerRecipes, location);
var (serviceName, servicePortsMap) = CreateService(containerRecipes);
var podInfo = FetchNewPod();
2023-06-27 13:28:00 +00:00
return new RunningPod(cluster, podInfo, deploymentName, serviceName, servicePortsMap.ToArray());
2023-04-13 09:07:36 +00:00
}
public void Stop(RunningPod pod)
{
2023-04-25 09:31:15 +00:00
log.Debug();
2023-04-13 09:07:36 +00:00
if (!string.IsNullOrEmpty(pod.ServiceName)) DeleteService(pod.ServiceName);
DeleteDeployment(pod.DeploymentName);
WaitUntilDeploymentOffline(pod.DeploymentName);
WaitUntilPodOffline(pod.PodInfo.Name);
}
2023-08-16 14:13:29 +00:00
public void DownloadPodLog(RunningPod pod, ContainerRecipe recipe, ILogHandler logHandler, int? tailLines)
2023-04-13 09:30:19 +00:00
{
2023-04-25 09:31:15 +00:00
log.Debug();
2023-09-12 08:31:55 +00:00
using var stream = client.Run(c => c.ReadNamespacedPodLog(pod.PodInfo.Name, K8sNamespace, recipe.Name, tailLines: tailLines));
2023-04-13 09:30:19 +00:00
logHandler.Log(stream);
}
2023-04-14 07:54:07 +00:00
public string ExecuteCommand(RunningPod pod, string containerName, string command, params string[] args)
{
var cmdAndArgs = $"{containerName}: {command} ({string.Join(",", args)})";
log.Debug(cmdAndArgs);
2023-09-12 08:31:55 +00:00
var runner = new CommandRunner(client, K8sNamespace, pod, containerName, command, args);
2023-04-14 07:54:07 +00:00
runner.Run();
var result = runner.GetStdOut();
log.Debug($"{cmdAndArgs} = '{result}'");
return result;
2023-04-14 07:54:07 +00:00
}
2023-09-12 08:31:55 +00:00
public void DeleteAllNamespacesStartingWith(string prefix)
{
2023-04-25 09:31:15 +00:00
log.Debug();
2023-05-04 06:25:48 +00:00
var all = client.Run(c => c.ListNamespace().Items);
2023-09-12 08:31:55 +00:00
var namespaces = all.Select(n => n.Name()).Where(n => n.StartsWith(prefix));
2023-05-03 12:18:37 +00:00
foreach (var ns in namespaces)
{
DeleteNamespace(ns);
}
}
2023-09-12 08:31:55 +00:00
public void DeleteNamespace()
2023-05-03 12:18:37 +00:00
{
log.Debug();
if (IsNamespaceOnline(K8sNamespace))
2023-05-03 12:18:37 +00:00
{
2023-09-12 08:31:55 +00:00
client.Run(c => c.DeleteNamespace(K8sNamespace, null, null, gracePeriodSeconds: 0));
2023-05-03 12:18:37 +00:00
}
}
2023-05-03 12:18:37 +00:00
public void DeleteNamespace(string ns)
{
log.Debug();
if (IsNamespaceOnline(ns))
{
2023-05-04 06:25:48 +00:00
client.Run(c => c.DeleteNamespace(ns, null, null, gracePeriodSeconds: 0));
2023-05-03 12:18:37 +00:00
}
}
#region Discover K8s Nodes
2023-09-25 06:47:19 +00:00
public K8sNodeLabel[] GetAvailableK8sNodes()
{
var nodes = client.Run(c => c.ListNode());
var optionals = nodes.Items.Select(i => CreateNodeLabel(i));
return optionals.Where(n => n != null).Select(n => n!).ToArray();
}
private K8sNodeLabel? CreateNodeLabel(V1Node i)
{
var keys = i.Metadata.Labels.Keys;
var hostnameKey = keys.SingleOrDefault(k => k.ToLowerInvariant().Contains("hostname"));
if (hostnameKey != null)
{
var hostnameValue = i.Metadata.Labels[hostnameKey];
return new K8sNodeLabel(hostnameKey, hostnameValue);
}
return null;
}
#endregion
#region Namespace management
2023-09-12 08:31:55 +00:00
private string K8sNamespace { get; }
2023-05-04 06:25:48 +00:00
private void EnsureNamespace()
{
if (IsNamespaceOnline(K8sNamespace)) return;
var namespaceSpec = new V1Namespace
{
ApiVersion = "v1",
Metadata = new V1ObjectMeta
{
2023-09-12 08:31:55 +00:00
Name = K8sNamespace,
Labels = new Dictionary<string, string> { { "name", K8sNamespace } }
}
};
2023-05-04 06:25:48 +00:00
client.Run(c => c.CreateNamespace(namespaceSpec));
WaitUntilNamespaceCreated();
CreatePolicy();
}
2023-05-03 12:18:37 +00:00
private bool IsNamespaceOnline(string name)
{
2023-05-04 06:25:48 +00:00
return client.Run(c => c.ListNamespace().Items.Any(n => n.Metadata.Name == name));
}
private void CreatePolicy()
{
client.Run(c =>
{
var body = new V1NetworkPolicy
{
Metadata = new V1ObjectMeta
{
Name = "isolate-policy",
2023-09-12 08:31:55 +00:00
NamespaceProperty = K8sNamespace
},
Spec = new V1NetworkPolicySpec
{
2023-05-30 19:41:34 +00:00
PodSelector = new V1LabelSelector {},
PolicyTypes = new[]
{
"Ingress",
"Egress"
},
Ingress = new List<V1NetworkPolicyIngressRule>
{
new V1NetworkPolicyIngressRule
{
FromProperty = new List<V1NetworkPolicyPeer>
{
new V1NetworkPolicyPeer
{
2023-05-30 19:41:34 +00:00
PodSelector = new V1LabelSelector {}
}
}
},
new V1NetworkPolicyIngressRule
{
FromProperty = new List<V1NetworkPolicyPeer>
{
new V1NetworkPolicyPeer
{
NamespaceSelector = new V1LabelSelector
{
MatchLabels = GetRunnerNamespaceSelector()
}
}
}
},
new V1NetworkPolicyIngressRule
{
FromProperty = new List<V1NetworkPolicyPeer>
{
new V1NetworkPolicyPeer
{
NamespaceSelector = new V1LabelSelector
{
MatchLabels = GetPrometheusNamespaceSelector()
}
}
}
}
},
Egress = new List<V1NetworkPolicyEgressRule>
{
2023-05-30 19:41:34 +00:00
new V1NetworkPolicyEgressRule
{
To = new List<V1NetworkPolicyPeer>
{
new V1NetworkPolicyPeer
{
PodSelector = new V1LabelSelector {}
}
}
},
new V1NetworkPolicyEgressRule
{
To = new List<V1NetworkPolicyPeer>
{
new V1NetworkPolicyPeer
{
NamespaceSelector = new V1LabelSelector
{
2023-05-30 19:41:34 +00:00
MatchLabels = new Dictionary<string, string> { { "kubernetes.io/metadata.name", "kube-system" } }
}
},
new V1NetworkPolicyPeer
{
PodSelector = new V1LabelSelector
{
MatchLabels = new Dictionary<string, string> { { "k8s-app", "kube-dns" } }
}
}
2023-05-30 19:41:34 +00:00
},
Ports = new List<V1NetworkPolicyPort>
{
new V1NetworkPolicyPort
{
Port = new IntstrIntOrString
{
Value = "53"
},
Protocol = "UDP"
}
}
},
new V1NetworkPolicyEgressRule
{
To = new List<V1NetworkPolicyPeer>
{
new V1NetworkPolicyPeer
{
IpBlock = new V1IPBlock
{
Cidr = "0.0.0.0/0"
2023-05-30 19:41:34 +00:00
}
}
},
Ports = new List<V1NetworkPolicyPort>
{
new V1NetworkPolicyPort
{
Port = new IntstrIntOrString
{
Value = "80"
},
Protocol = "TCP"
},
new V1NetworkPolicyPort
{
Port = new IntstrIntOrString
{
Value = "443"
},
Protocol = "TCP"
}
}
}
2023-05-30 19:41:34 +00:00
}
}
};
2023-09-12 08:31:55 +00:00
c.CreateNamespacedNetworkPolicy(body, K8sNamespace);
});
}
#endregion
#region Deployment management
2023-09-25 06:47:19 +00:00
private string CreateDeployment(ContainerRecipe[] containerRecipes, ILocation location)
{
var deploymentSpec = new V1Deployment
{
ApiVersion = "apps/v1",
Metadata = CreateDeploymentMetadata(containerRecipes),
Spec = new V1DeploymentSpec
{
Replicas = 1,
Selector = new V1LabelSelector
{
MatchLabels = GetSelector(containerRecipes)
},
Template = new V1PodTemplateSpec
{
Metadata = new V1ObjectMeta
{
Labels = GetSelector(containerRecipes),
Annotations = GetAnnotations(containerRecipes)
},
Spec = new V1PodSpec
{
NodeSelector = CreateNodeSelector(location),
Containers = CreateDeploymentContainers(containerRecipes),
Volumes = CreateVolumes(containerRecipes)
}
}
}
};
2023-09-12 08:31:55 +00:00
client.Run(c => c.CreateNamespacedDeployment(deploymentSpec, K8sNamespace));
2023-04-13 09:07:36 +00:00
WaitUntilDeploymentOnline(deploymentSpec.Metadata.Name);
return deploymentSpec.Metadata.Name;
}
private void DeleteDeployment(string deploymentName)
{
2023-09-12 08:31:55 +00:00
client.Run(c => c.DeleteNamespacedDeployment(deploymentName, K8sNamespace));
2023-04-13 09:07:36 +00:00
WaitUntilDeploymentOffline(deploymentName);
}
2023-09-25 06:47:19 +00:00
private IDictionary<string, string> CreateNodeSelector(ILocation location)
{
2023-09-25 06:47:19 +00:00
var nodeLabel = GetNodeLabelForLocation(location);
if (nodeLabel == null) return new Dictionary<string, string>();
return new Dictionary<string, string>
{
{ nodeLabel.Key, nodeLabel.Value }
};
}
2023-09-25 06:47:19 +00:00
private K8sNodeLabel? GetNodeLabelForLocation(ILocation location)
{
var l = (Location)location;
return l.NodeLabel;
}
private IDictionary<string, string> GetSelector(ContainerRecipe[] containerRecipes)
{
return containerRecipes.First().PodLabels.GetLabels();
}
private IDictionary<string, string> GetRunnerNamespaceSelector()
{
return new Dictionary<string, string> { { "kubernetes.io/metadata.name", "default" } };
}
private IDictionary<string, string> GetPrometheusNamespaceSelector()
{
return new Dictionary<string, string> { { "kubernetes.io/metadata.name", "monitoring" } };
}
private IDictionary<string, string> GetAnnotations(ContainerRecipe[] containerRecipes)
{
return containerRecipes.First().PodAnnotations.GetAnnotations();
}
private V1ObjectMeta CreateDeploymentMetadata(ContainerRecipe[] containerRecipes)
{
return new V1ObjectMeta
{
2023-09-15 10:25:10 +00:00
Name = string.Join('-',containerRecipes.Select(r => r.Name)),
2023-09-12 08:31:55 +00:00
NamespaceProperty = K8sNamespace,
Labels = GetSelector(containerRecipes),
Annotations = GetAnnotations(containerRecipes)
};
}
private List<V1Container> CreateDeploymentContainers(ContainerRecipe[] containerRecipes)
{
return containerRecipes.Select(CreateDeploymentContainer).ToList();
}
private V1Container CreateDeploymentContainer(ContainerRecipe recipe)
{
return new V1Container
{
Name = recipe.Name,
Image = recipe.Image,
2023-06-06 14:10:30 +00:00
ImagePullPolicy = "Always",
Ports = CreateContainerPorts(recipe),
Env = CreateEnv(recipe),
2023-09-08 08:14:52 +00:00
VolumeMounts = CreateContainerVolumeMounts(recipe),
Resources = CreateResourceLimits(recipe)
};
}
2023-09-08 08:14:52 +00:00
private V1ResourceRequirements CreateResourceLimits(ContainerRecipe recipe)
{
return new V1ResourceRequirements
{
2023-09-08 11:47:49 +00:00
Requests = CreateResourceQuantities(recipe.Resources.Requests),
Limits = CreateResourceQuantities(recipe.Resources.Limits)
2023-09-08 08:14:52 +00:00
};
}
2023-09-08 11:47:49 +00:00
private Dictionary<string, ResourceQuantity> CreateResourceQuantities(ContainerResourceSet set)
2023-09-08 08:14:52 +00:00
{
var result = new Dictionary<string, ResourceQuantity>();
2023-09-08 11:47:49 +00:00
if (set.MilliCPUs != 0)
2023-09-08 08:14:52 +00:00
{
2023-09-08 11:47:49 +00:00
result.Add("cpu", new ResourceQuantity($"{set.MilliCPUs}m"));
2023-09-08 08:14:52 +00:00
}
2023-09-08 11:47:49 +00:00
if (set.Memory.SizeInBytes != 0)
2023-09-08 08:14:52 +00:00
{
2023-09-08 11:47:49 +00:00
result.Add("memory", new ResourceQuantity(set.Memory.ToSuffixNotation()));
2023-09-08 08:14:52 +00:00
}
return result;
}
private List<V1VolumeMount> CreateContainerVolumeMounts(ContainerRecipe recipe)
{
return recipe.Volumes.Select(CreateContainerVolumeMount).ToList();
}
private V1VolumeMount CreateContainerVolumeMount(VolumeMount v)
{
return new V1VolumeMount
{
Name = v.VolumeName,
MountPath = v.MountPath
};
}
private List<V1Volume> CreateVolumes(ContainerRecipe[] containerRecipes)
{
return containerRecipes.Where(c => c.Volumes.Any()).SelectMany(CreateVolumes).ToList();
}
private List<V1Volume> CreateVolumes(ContainerRecipe recipe)
{
return recipe.Volumes.Select(CreateVolume).ToList();
}
private V1Volume CreateVolume(VolumeMount v)
{
client.Run(c => c.CreateNamespacedPersistentVolumeClaim(new V1PersistentVolumeClaim
{
ApiVersion = "v1",
Metadata = new V1ObjectMeta
{
Name = v.VolumeName
},
Spec = new V1PersistentVolumeClaimSpec
{
AccessModes = new List<string>
{
2023-09-07 08:55:35 +00:00
"ReadWriteOnce"
},
Resources = new V1ResourceRequirements
{
Requests = new Dictionary<string, ResourceQuantity>
{
{"storage", new ResourceQuantity(v.ResourceQuantity) }
}
}
}
2023-09-12 08:31:55 +00:00
}, K8sNamespace));
return new V1Volume
{
Name = v.VolumeName,
PersistentVolumeClaim = new V1PersistentVolumeClaimVolumeSource
{
ClaimName = v.VolumeName
}
};
2023-04-12 11:53:55 +00:00
}
private List<V1EnvVar> CreateEnv(ContainerRecipe recipe)
2023-04-12 11:53:55 +00:00
{
return recipe.EnvVars.Select(CreateEnvVar).ToList();
}
private V1EnvVar CreateEnvVar(EnvVar envVar)
{
return new V1EnvVar
{
Name = envVar.Name,
Value = envVar.Value,
};
}
private List<V1ContainerPort> CreateContainerPorts(ContainerRecipe recipe)
{
var exposedPorts = recipe.ExposedPorts.Select(p => CreateContainerPort(recipe, p));
var internalPorts = recipe.InternalPorts.Select(p => CreateContainerPort(recipe, p));
return exposedPorts.Concat(internalPorts).ToList();
}
private V1ContainerPort CreateContainerPort(ContainerRecipe recipe, Port port)
{
return new V1ContainerPort
{
Name = GetNameForPort(recipe, port),
ContainerPort = port.Number
};
}
private string GetNameForPort(ContainerRecipe recipe, Port port)
{
2023-04-13 07:33:10 +00:00
return $"p{workflowNumberSource.WorkflowNumber}-{recipe.Number}-{port.Number}";
}
#endregion
#region Service management
2023-06-27 13:28:00 +00:00
private (string, List<ContainerRecipePortMapEntry>) CreateService(ContainerRecipe[] containerRecipes)
{
2023-06-27 13:28:00 +00:00
var result = new List<ContainerRecipePortMapEntry>();
var ports = CreateServicePorts(containerRecipes);
if (!ports.Any())
{
2023-05-30 19:41:34 +00:00
// None of these container-recipes wish to expose anything via a service port.
// So, we don't have to create a service.
2023-04-13 09:07:36 +00:00
return (string.Empty, result);
}
var serviceSpec = new V1Service
{
ApiVersion = "v1",
Metadata = CreateServiceMetadata(),
Spec = new V1ServiceSpec
{
Type = "NodePort",
Selector = GetSelector(containerRecipes),
Ports = ports
}
};
2023-09-12 08:31:55 +00:00
client.Run(c => c.CreateNamespacedService(serviceSpec, K8sNamespace));
2023-04-13 09:07:36 +00:00
ReadBackServiceAndMapPorts(serviceSpec, containerRecipes, result);
2023-04-13 09:07:36 +00:00
return (serviceSpec.Metadata.Name, result);
}
2023-06-27 13:28:00 +00:00
private void ReadBackServiceAndMapPorts(V1Service serviceSpec, ContainerRecipe[] containerRecipes, List<ContainerRecipePortMapEntry> result)
{
// For each container-recipe, we need to figure out which service-ports it was assigned by K8s.
2023-09-12 08:31:55 +00:00
var readback = client.Run(c => c.ReadNamespacedService(serviceSpec.Metadata.Name, K8sNamespace));
foreach (var r in containerRecipes)
{
2023-10-19 12:03:36 +00:00
foreach (var port in r.ExposedPorts)
{
2023-10-19 12:03:36 +00:00
var portName = GetNameForPort(r, port);
var matchingServicePorts = readback.Spec.Ports.Where(p => p.Name == portName);
if (matchingServicePorts.Any())
{
// These service ports belongs to this recipe.
2023-10-19 13:48:49 +00:00
var optionals = matchingServicePorts.Select(p => MapNodePortIfAble(p, port.Tag));
var ports = optionals.Where(p => p != null).Select(p => p!).ToArray();
2023-06-27 13:28:00 +00:00
result.Add(new ContainerRecipePortMapEntry(r.Number, ports));
}
}
}
}
private Port? MapNodePortIfAble(V1ServicePort p, string tag)
{
if (p.NodePort == null) return null;
return new Port(p.NodePort.Value, tag);
}
2023-04-13 09:07:36 +00:00
private void DeleteService(string serviceName)
{
2023-09-12 08:31:55 +00:00
client.Run(c => c.DeleteNamespacedService(serviceName, K8sNamespace));
}
private V1ObjectMeta CreateServiceMetadata()
{
return new V1ObjectMeta
{
2023-04-13 08:11:33 +00:00
Name = "service-" + workflowNumberSource.WorkflowNumber,
2023-09-12 08:31:55 +00:00
NamespaceProperty = K8sNamespace
};
}
private List<V1ServicePort> CreateServicePorts(ContainerRecipe[] recipes)
{
var result = new List<V1ServicePort>();
foreach (var recipe in recipes)
{
result.AddRange(CreateServicePorts(recipe));
}
return result;
}
private List<V1ServicePort> CreateServicePorts(ContainerRecipe recipe)
{
var result = new List<V1ServicePort>();
foreach (var port in recipe.ExposedPorts)
{
result.Add(new V1ServicePort
{
Name = GetNameForPort(recipe, port),
Protocol = "TCP",
Port = port.Number,
TargetPort = GetNameForPort(recipe, port),
});
}
return result;
}
#endregion
#region Waiting
private void WaitUntilNamespaceCreated()
{
2023-10-04 08:37:18 +00:00
WaitUntil(() => IsNamespaceOnline(K8sNamespace));
}
private void WaitUntilDeploymentOnline(string deploymentName)
{
WaitUntil(() =>
{
2023-09-12 08:31:55 +00:00
var deployment = client.Run(c => c.ReadNamespacedDeployment(deploymentName, K8sNamespace));
return deployment?.Status.AvailableReplicas != null && deployment.Status.AvailableReplicas > 0;
});
}
2023-04-13 09:07:36 +00:00
private void WaitUntilDeploymentOffline(string deploymentName)
{
WaitUntil(() =>
{
2023-09-12 08:31:55 +00:00
var deployments = client.Run(c => c.ListNamespacedDeployment(K8sNamespace));
2023-04-13 09:07:36 +00:00
var deployment = deployments.Items.SingleOrDefault(d => d.Metadata.Name == deploymentName);
return deployment == null || deployment.Status.AvailableReplicas == 0;
});
}
private void WaitUntilPodOffline(string podName)
{
WaitUntil(() =>
{
2023-09-12 08:31:55 +00:00
var pods = client.Run(c => c.ListNamespacedPod(K8sNamespace)).Items;
2023-04-13 09:07:36 +00:00
var pod = pods.SingleOrDefault(p => p.Metadata.Name == podName);
return pod == null;
});
}
private void WaitUntil(Func<bool> predicate)
{
2023-04-25 09:31:15 +00:00
var sw = Stopwatch.Begin(log, true);
try
{
Time.WaitUntil(predicate, cluster.K8sOperationTimeout(), cluster.K8sOperationRetryDelay());
2023-04-25 09:31:15 +00:00
}
finally
{
sw.End("", 1);
}
}
#endregion
2023-08-15 09:01:18 +00:00
public CrashWatcher CreateCrashWatcher(RunningContainer container)
2023-08-14 13:10:36 +00:00
{
2023-09-12 08:31:55 +00:00
return new CrashWatcher(log, cluster.GetK8sClientConfig(), K8sNamespace, container);
2023-08-14 13:10:36 +00:00
}
private PodInfo FetchNewPod()
{
2023-09-12 08:31:55 +00:00
var pods = client.Run(c => c.ListNamespacedPod(K8sNamespace)).Items;
var newPods = pods.Where(p => !knownPods.Contains(p.Name())).ToArray();
if (newPods.Length != 1) throw new InvalidOperationException("Expected only 1 pod to be created. Test infra failure.");
var newPod = newPods.Single();
var name = newPod.Name();
var ip = newPod.Status.PodIP;
var k8sNodeName = newPod.Spec.NodeName;
2023-04-12 11:53:55 +00:00
if (string.IsNullOrEmpty(name)) throw new InvalidOperationException("Invalid pod name received. Test infra failure.");
if (string.IsNullOrEmpty(ip)) throw new InvalidOperationException("Invalid pod IP received. Test infra failure.");
2023-04-12 11:53:55 +00:00
knownPods.Add(name);
return new PodInfo(name, ip, k8sNodeName);
2023-04-12 11:53:55 +00:00
}
}
}