Skip to content

Commit

Permalink
integration test suite for Custom Networking + Security Groups for Pods
Browse files Browse the repository at this point in the history
  • Loading branch information
jdn5126 committed Mar 4, 2024
1 parent bcd7214 commit b7ed952
Show file tree
Hide file tree
Showing 7 changed files with 635 additions and 11 deletions.
2 changes: 1 addition & 1 deletion test/framework/resources/agent/traffic_tester.go
Original file line number Diff line number Diff line change
Expand Up @@ -93,7 +93,7 @@ func (t *TrafficTest) TestTraffic() (float64, error) {
if t.ValidateServerPods != nil {
err = t.ValidateServerPods(podList)
if err != nil {
return 0, fmt.Errorf("pod list %v validation failed %v", podList, err)
return 0, fmt.Errorf("pod list validation failed %v", err)
}
fmt.Fprintln(GinkgoWriter, "successfully validated the server pod list")
}
Expand Down
21 changes: 14 additions & 7 deletions test/integration/README.md
Original file line number Diff line number Diff line change
Expand Up @@ -74,22 +74,21 @@ In order to test a custom image you need pass the following tags along with the

*IMPORTANT*: Should use an IPv6 cluster with Prefix Delegation enabled. VPC CNI only supports IPv6 mode with Prefix Delegation.

### Custom Networking
### Custom Networking tests (custom_networking)

Custom networking tests validate use of the `AWS_VPC_K8S_CNI_CUSTOM_NETWORK_CFG` environment variable.

Test info:
- No existing node group should be present. The test creates a self managed node group with the reduced MAX_POD value.
- Pass `custom-networking-cidr-range` flag with *allowed* VPC CIDR that does not conflict with an existing one. So if existing VPC CIDR is `192.168.0.0/16`, you can use `custom-networking-cidr-range=100.64.0.0/16`. You can go to your cluster VPC to check existing/allowed CIDRs.

### SNAT tests
### SNAT tests (snat)

SNAT tests cover pod source NAT behavior with various deployment scenarios.

Test info:
- EKS Cluster should have at least one private subnet and at least one public subnet. These tests modify the SNAT related variables in `aws-node` pod, validate the IP table SNAT rules, and check for Internet Connectivity.

### Calico tests
### Calico tests (calico)

`calico` helps validate compatibility with calico network policies. It does so by running the Calico Stars policy demo.

Expand All @@ -99,10 +98,18 @@ Test info:

Test info:
- Requires at least one Nitro-based instance.
- EKS Cluster should be v1.16+. This tests creates an additional Trunk ENI on all Nitro-based instances present in the cluster. This could interfere with running integration tests that expect specific values of `WARM_ENI_TARGET`.
- For this reason, the test should either be run without any node groups present in the cluster or at the very end.
- EKS Cluster should be v1.16+. This test creates an additional Trunk ENI on all Nitro-based instances present in the cluster.

### Multus tests
### Custom Networking and Security Groups for Pods tests (custom_networking_sgpp)

`custom_networking_sgpp` test suite validates the combination of Custom Networking and Security Groups for Pods.

Test info:
- Pass `custom-networking-cidr-range` flag with *allowed* VPC CIDR that does not conflict with an existing one. So if existing VPC CIDR is `192.168.0.0/16`, you can use `custom-networking-cidr-range=100.64.0.0/16`. You can go to your cluster VPC to check existing/allowed CIDRs.
- Requires at least one Nitro-based instance.
- EKS Cluster should be v1.16+. This test creates an additional Trunk ENI on all Nitro-based instances present in the cluster.

### Multus tests (multus)
These tests require multus to be deployed to your cluster using the [manifest](https://raw.githubusercontent.com/aws/amazon-vpc-cni-k8s/master/config/multus/v3.9.2-eksbuild.1/aws-k8s-multus.yaml) file. Alternatively, the tests can be triggered by running `run-multus-tests.sh` located under the scripts directory. This script installs the multus manifest first and then runs the ginkgo test suite.
You can optionally provide a multus tag to install the manifest. If not provided, the default tag is used.

Expand Down
Original file line number Diff line number Diff line change
@@ -0,0 +1,219 @@
// Copyright Amazon.com Inc. or its affiliates. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License"). You may
// not use this file except in compliance with the License. A copy of the
// License is located at
//
// http://aws.amazon.com/apache2.0/
//
// or in the "license" file accompanying this file. This file is distributed
// on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either
// express or implied. See the License for the specific language governing
// permissions and limitations under the License.

package custom_networking_sgpp

import (
"flag"
"fmt"
"net"
"testing"

"github.com/aws/amazon-vpc-cni-k8s/pkg/apis/crd/v1alpha1"
"github.com/aws/amazon-vpc-cni-k8s/test/framework"
awsUtils "github.com/aws/amazon-vpc-cni-k8s/test/framework/resources/aws/utils"
"github.com/aws/amazon-vpc-cni-k8s/test/framework/resources/k8s/manifest"
k8sUtils "github.com/aws/amazon-vpc-cni-k8s/test/framework/resources/k8s/utils"
"github.com/aws/amazon-vpc-cni-k8s/test/framework/utils"
"github.com/aws/amazon-vpc-resource-controller-k8s/pkg/aws/vpc"
"github.com/prometheus/client_golang/prometheus"
corev1 "k8s.io/api/core/v1"

"github.com/apparentlymart/go-cidr/cidr"
. "github.com/onsi/ginkgo/v2"
. "github.com/onsi/gomega"
)

// TestCustomNetworkingSGPP is the `go test` entry point for this package. It
// wires Ginkgo's Fail function into Gomega as the failure handler and then
// runs every spec registered in the package under a single suite name.
func TestCustomNetworkingSGPP(t *testing.T) {
	const suiteDescription = "CNI Custom Networking + Security Groups for Pods Test Suite"

	RegisterFailHandler(Fail)
	RunSpecs(t, suiteDescription)
}

// Suite-wide state. These variables are populated by BeforeSuite and read by
// AfterSuite (and presumably by the specs in this package) so that every
// resource created during setup can be found again for teardown.
var (
// Test framework handle, created in BeforeSuite from framework.GlobalOptions
f *framework.Framework
// VPC Configuration with the details of public subnet and availability zone present in the cluster's subnets
clusterVPCConfig *awsUtils.ClusterVPCConfig
// The CIDR Range that will be associated with the VPC to create new subnet for Custom Networking
// cidrRangeString is the raw flag value; cidrRange is its parsed form and
// cidrBlockAssociationID identifies the VPC association so it can be removed in AfterSuite
cidrRangeString string
cidrRange *net.IPNet
cidrBlockAssociationID string
// Security Group that will be used in ENIConfig
customNetworkingSGID string
// IDs of the subnets created for Custom Networking (one per availability zone), kept for deletion in AfterSuite
customNetworkingSubnetIDList []string
// List of ENIConfig per Availability Zone
eniConfigList []*v1alpha1.ENIConfig
// Builders that produced the ENIConfigs above, kept alongside them for later updates
eniConfigBuilderList []*manifest.ENIConfigBuilder
// Security Group that will be used to create Security Group Policy
podEniSGID string
// Port that will be opened for Security Groups for Pods testing
podEniOpenPort = 80
// NOTE(review): presumably the port used to scrape metrics; it is not referenced by the setup code in this file — confirm against the specs
metricsPort = 8080
// Maximum number of branch interfaces that can be created across all nodes
totalBranchInterface int
// Cluster security group ID for node to node communication
clusterSGID string

// First node returned by the node manager after instances are recycled in BeforeSuite
targetNode corev1.Node
// IPv4 catch-all CIDR used when authorizing security group rules in BeforeSuite
v4Zero = "0.0.0.0/0"
// IPv6 catch-all CIDR; not referenced by the setup code in this file
v6Zero = "::/0"
numNodes int // number of nodes in cluster
)

// init registers the suite-specific command line flag. The flag value is
// stored in cidrRangeString and falls back to the default below when the flag
// is not supplied on the command line.
func init() {
	const (
		flagName     = "custom-networking-cidr-range"
		defaultRange = "100.64.0.0/16"
		usage        = "custom networking cidr range to be associated with the VPC"
	)
	flag.StringVar(&cidrRangeString, flagName, defaultRange, usage)
}

// BeforeSuite provisions everything the suite needs before any spec runs:
//
//  1. Custom Networking: a dedicated security group, an extra CIDR block
//     associated with the VPC, and one subnet + ENIConfig per availability zone.
//  2. Security Groups for Pods: a second security group that only opens
//     podEniOpenPort, plus the total branch interface budget of the node group.
//  3. aws-node DaemonSet: custom networking and pod ENI are enabled, then the
//     instances are recycled so that nodes come up with the new configuration.
//
// Every created resource ID is stored in a package-level variable so that
// AfterSuite can delete it.
var _ = BeforeSuite(func() {
	f = framework.New(framework.GlobalOptions)

	// NOTE(review): err is assigned with "=" here, so it is presumably a
	// package-level variable declared in a sibling file — confirm.
	_, cidrRange, err = net.ParseCIDR(cidrRangeString)
	Expect(err).ToNot(HaveOccurred())

	By("getting the cluster VPC Config")
	clusterVPCConfig, err = awsUtils.GetClusterVPCConfig(f)
	Expect(err).ToNot(HaveOccurred())

	By("Getting Cluster Security Group ID")
	clusterRes, err := f.CloudServices.EKS().DescribeCluster(f.Options.ClusterName)
	Expect(err).NotTo(HaveOccurred())
	clusterSGID = *(clusterRes.Cluster.ResourcesVpcConfig.ClusterSecurityGroupId)
	fmt.Fprintf(GinkgoWriter, "cluster security group is %s\n", clusterSGID)

	// Custom Networking setup
	// TODO: Ideally, we would clone the Custom Networking SG from the cluster SG. Unfortunately, the EC2 API does not support this.
	By("creating security group to be used by custom networking")
	createSecurityGroupOutput, err := f.CloudServices.EC2().
		CreateSecurityGroup("custom-networking-test", "custom networking", f.Options.AWSVPCID)
	Expect(err).ToNot(HaveOccurred())
	customNetworkingSGID = *createSecurityGroupOutput.GroupId

	By("authorizing egress and ingress for security group in ENIConfig")
	// NOTE(review): the results of these two calls are not checked; presumably
	// best-effort because a rule may already exist on the new group — confirm.
	f.CloudServices.EC2().AuthorizeSecurityGroupEgress(customNetworkingSGID, "-1", -1, -1, v4Zero)
	f.CloudServices.EC2().AuthorizeSecurityGroupIngress(customNetworkingSGID, "-1", -1, -1, v4Zero)

	By("associating cidr range to the VPC")
	association, err := f.CloudServices.EC2().AssociateVPCCIDRBlock(f.Options.AWSVPCID, cidrRange.String())
	Expect(err).ToNot(HaveOccurred())
	cidrBlockAssociationID = *association.CidrBlockAssociation.AssociationId

	for i, az := range clusterVPCConfig.AvailZones {
		By(fmt.Sprintf("creating the subnet in %s", az))

		// Carve a distinct subnet out of the custom CIDR for each availability
		// zone: 8 extra prefix bits, subnet number 5*i.
		subnetCidr, err := cidr.Subnet(cidrRange, 8, 5*i)
		Expect(err).ToNot(HaveOccurred())

		createSubnetOutput, err := f.CloudServices.EC2().
			CreateSubnet(subnetCidr.String(), f.Options.AWSVPCID, az)
		Expect(err).ToNot(HaveOccurred())

		subnetID := *createSubnetOutput.Subnet.SubnetId

		By("associating the route table with the newly created subnet")
		err = f.CloudServices.EC2().AssociateRouteTableToSubnet(clusterVPCConfig.PublicRouteTableID, subnetID)
		Expect(err).ToNot(HaveOccurred())

		// The ENIConfig is named after the availability zone.
		eniConfigBuilder := manifest.NewENIConfigBuilder().
			Name(az).
			SubnetID(subnetID).
			SecurityGroup([]string{customNetworkingSGID})
		eniConfig, err := eniConfigBuilder.Build()
		Expect(err).ToNot(HaveOccurred())

		// For updating/deleting later
		customNetworkingSubnetIDList = append(customNetworkingSubnetIDList, subnetID)
		eniConfigBuilderList = append(eniConfigBuilderList, eniConfigBuilder)
		eniConfigList = append(eniConfigList, eniConfig.DeepCopy())

		By("creating the ENIConfig with az name")
		err = f.K8sResourceManagers.CustomResourceManager().CreateResource(eniConfig)
		Expect(err).ToNot(HaveOccurred())
	}

	// Security Groups for Pods setup
	// Note that Custom Networking only supports IPv4 clusters, so IPv4 setup can be assumed.
	By("creating a new security group for use in Security Group Policy")
	podEniSGName := "pod-eni-automation-v4"
	securityGroupOutput, err := f.CloudServices.EC2().CreateSecurityGroup(podEniSGName,
		"test created by vpc cni automation test suite", f.Options.AWSVPCID)
	Expect(err).ToNot(HaveOccurred())
	podEniSGID = *securityGroupOutput.GroupId

	By("authorizing egress and ingress on security group for client-server communication")
	// NOTE(review): results are not checked here either, matching the calls above.
	f.CloudServices.EC2().AuthorizeSecurityGroupEgress(podEniSGID, "tcp", podEniOpenPort, podEniOpenPort, v4Zero)
	f.CloudServices.EC2().AuthorizeSecurityGroupIngress(podEniSGID, "tcp", podEniOpenPort, podEniOpenPort, v4Zero)

	By("getting branch ENI limits")
	nodeList, err := f.K8sResourceManagers.NodeManager().GetNodes(f.Options.NgNameLabelKey, f.Options.NgNameLabelVal)
	Expect(err).ToNot(HaveOccurred())
	numNodes = len(nodeList.Items)
	Expect(numNodes).Should(BeNumerically(">=", 1))

	// The branch interface budget is derived from the first node's instance
	// type multiplied by the node count.
	node := nodeList.Items[0]
	instanceID := k8sUtils.GetInstanceIDFromNode(node)
	nodeInstance, err := f.CloudServices.EC2().DescribeInstance(instanceID)
	// Fail with a clear assertion instead of a nil-pointer panic on the
	// dereference below when the instance lookup fails.
	Expect(err).ToNot(HaveOccurred())
	instanceType := *nodeInstance.InstanceType
	totalBranchInterface = vpc.Limits[instanceType].BranchInterface * numNodes

	By("enabling custom networking and sgpp on aws-node DaemonSet")
	k8sUtils.AddEnvVarToDaemonSetAndWaitTillUpdated(f, utils.AwsNodeName,
		utils.AwsNodeNamespace, utils.AwsNodeName, map[string]string{
			"AWS_VPC_K8S_CNI_CUSTOM_NETWORK_CFG": "true",
			"ENI_CONFIG_LABEL_DEF":               "topology.kubernetes.io/zone",
			"ENABLE_POD_ENI":                     "true",
		})

	By("terminating instances")
	err = awsUtils.TerminateInstances(f)
	Expect(err).ToNot(HaveOccurred())

	By("getting target node")
	nodeList, err = f.K8sResourceManagers.NodeManager().GetNodes(f.Options.NgNameLabelKey, f.Options.NgNameLabelVal)
	Expect(err).ToNot(HaveOccurred())
	// Guard the index below: an empty list after recycling the instances should
	// be reported as a failed expectation, not an index-out-of-range panic.
	Expect(nodeList.Items).ToNot(BeEmpty())
	targetNode = nodeList.Items[0]
})

// AfterSuite tears down the resources recorded by BeforeSuite: the ENIConfigs,
// the aws-node environment overrides, both security groups, the custom
// networking subnets and finally the VPC CIDR association. Errors returned by
// the cleanup calls are accumulated and asserted once at the very end.
var _ = AfterSuite(func() {
	var cleanupErrs prometheus.MultiError

	for _, cfg := range eniConfigList {
		By("deleting ENIConfig")
		cleanupErrs.Append(f.K8sResourceManagers.CustomResourceManager().DeleteResource(cfg))
	}

	By("disabling custom networking and pod eni on aws-node DaemonSet")
	// Same three variables that BeforeSuite added to the DaemonSet.
	envVarsToRemove := map[string]struct{}{
		"AWS_VPC_K8S_CNI_CUSTOM_NETWORK_CFG": {},
		"ENI_CONFIG_LABEL_DEF":               {},
		"ENABLE_POD_ENI":                     {},
	}
	k8sUtils.RemoveVarFromDaemonSetAndWaitTillUpdated(
		f, utils.AwsNodeName, utils.AwsNodeNamespace, utils.AwsNodeName, envVarsToRemove)

	By("terminating instances")
	cleanupErrs.Append(awsUtils.TerminateInstances(f))

	By("deleting Custom Networking security group")
	cleanupErrs.Append(f.CloudServices.EC2().DeleteSecurityGroup(customNetworkingSGID))

	By("deleting pod ENI security group")
	cleanupErrs.Append(f.CloudServices.EC2().DeleteSecurityGroup(podEniSGID))

	for _, subnetID := range customNetworkingSubnetIDList {
		By(fmt.Sprintf("deleting the subnet %s", subnetID))
		cleanupErrs.Append(f.CloudServices.EC2().DeleteSubnet(subnetID))
	}

	By("disassociating the CIDR range to the VPC")
	cleanupErrs.Append(f.CloudServices.EC2().DisAssociateVPCCIDRBlock(cidrBlockAssociationID))

	Expect(cleanupErrs.MaybeUnwrap()).ToNot(HaveOccurred())
})
Loading

0 comments on commit b7ed952

Please sign in to comment.