mirror of
https://github.com/kubernetes/kubernetes.git
synced 2026-06-11 01:41:54 -04:00
Add server-side streaming RPCs to bypass the gRPC 16MB message size limit on nodes with many containers/pods. This implements KEP-5825. New RuntimeService streaming RPCs: - StreamPodSandboxes - StreamContainers - StreamContainerStats - StreamPodSandboxStats - StreamPodSandboxMetrics New ImageService streaming RPC: - StreamImages Each streaming RPC accepts the same filter as its unary counterpart and streams results one item at a time. Feature gate: CRIListStreaming KEP: https://kep.k8s.io/5825 🤖 Generated with [Claude Code](https://claude.com/claude-code) Signed-off-by: Ayato Tokubi <atokubi@redhat.com>
505 lines
18 KiB
Go
505 lines
18 KiB
Go
//go:build linux
|
|
|
|
/*
|
|
Copyright 2024 The Kubernetes Authors.
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
you may not use this file except in compliance with the License.
|
|
You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
*/
|
|
|
|
package e2enode
|
|
|
|
import (
|
|
"context"
|
|
"errors"
|
|
"fmt"
|
|
"os"
|
|
"strings"
|
|
"sync/atomic"
|
|
"time"
|
|
|
|
"github.com/onsi/ginkgo/v2"
|
|
"github.com/onsi/gomega"
|
|
"google.golang.org/grpc/codes"
|
|
"google.golang.org/grpc/status"
|
|
|
|
v1 "k8s.io/api/core/v1"
|
|
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
|
|
"k8s.io/apimachinery/pkg/util/uuid"
|
|
"k8s.io/kubernetes/pkg/features"
|
|
kubeletevents "k8s.io/kubernetes/pkg/kubelet/events"
|
|
"k8s.io/kubernetes/pkg/kubelet/images"
|
|
"k8s.io/kubernetes/test/e2e/feature"
|
|
"k8s.io/kubernetes/test/e2e/framework"
|
|
e2epod "k8s.io/kubernetes/test/e2e/framework/pod"
|
|
"k8s.io/kubernetes/test/e2e_node/criproxy"
|
|
imageutils "k8s.io/kubernetes/test/utils/image"
|
|
admissionapi "k8s.io/pod-security-admission/api"
|
|
)
|
|
|
|
// Examples of using CRI proxy
|
|
var _ = SIGDescribe(feature.CriProxy, framework.WithSerial(), func() {
|
|
f := framework.NewDefaultFramework("cri-proxy-example")
|
|
f.NamespacePodSecurityLevel = admissionapi.LevelPrivileged
|
|
|
|
ginkgo.Context("Inject a pull image error exception into the CriProxy", func() {
|
|
ginkgo.BeforeEach(func() {
|
|
if err := resetCRIProxyInjector(e2eCriProxy); err != nil {
|
|
ginkgo.Skip("Skip the test since the CRI Proxy is undefined.")
|
|
}
|
|
ginkgo.DeferCleanup(func() error {
|
|
return resetCRIProxyInjector(e2eCriProxy)
|
|
})
|
|
})
|
|
|
|
ginkgo.It("Pod failed to start due to an image pull error.", func(ctx context.Context) {
|
|
expectedErr := fmt.Errorf("PullImage failed")
|
|
err := addCRIProxyInjector(e2eCriProxy, func(apiName string) error {
|
|
if apiName == criproxy.PullImage {
|
|
return expectedErr
|
|
}
|
|
return nil
|
|
})
|
|
framework.ExpectNoError(err)
|
|
|
|
pod := e2epod.NewPodClient(f).Create(ctx, newPullImageAlwaysPod())
|
|
podErr := e2epod.WaitForPodCondition(ctx, f.ClientSet, f.Namespace.Name, pod.Name, "ImagePullBackOff", 1*time.Minute, func(pod *v1.Pod) (bool, error) {
|
|
if len(pod.Status.ContainerStatuses) > 0 && pod.Status.Reason == images.ErrImagePullBackOff.Error() {
|
|
return true, nil
|
|
}
|
|
return false, nil
|
|
})
|
|
gomega.Expect(podErr).To(gomega.HaveOccurred())
|
|
|
|
eventMsg, err := getFailedToPullImageMsg(ctx, f, pod.Name)
|
|
framework.ExpectNoError(err)
|
|
isExpectedErrMsg := strings.Contains(eventMsg, expectedErr.Error())
|
|
gomega.Expect(isExpectedErrMsg).To(gomega.BeTrueBecause("we injected an exception into the PullImage interface of the cri proxy"))
|
|
})
|
|
})
|
|
|
|
ginkgo.Context("Image pull backoff", func() {
|
|
ginkgo.BeforeEach(func() {
|
|
if err := resetCRIProxyInjector(e2eCriProxy); err != nil {
|
|
ginkgo.Skip("Skip the test since the CRI Proxy is undefined.")
|
|
}
|
|
ginkgo.DeferCleanup(func() error {
|
|
return resetCRIProxyInjector(e2eCriProxy)
|
|
})
|
|
})
|
|
|
|
})
|
|
|
|
framework.Context("Image volume digest error handling", feature.CriProxy, framework.WithFeatureGate(features.ImageVolumeWithDigest), func() {
|
|
ginkgo.BeforeEach(func() {
|
|
if e2eCriProxy == nil {
|
|
ginkgo.Skip("Skip the test since the CRI Proxy is undefined. Please run with --cri-proxy-enabled=true")
|
|
}
|
|
if err := resetCRIProxyInjector(e2eCriProxy); err != nil {
|
|
ginkgo.Skip("Skip the test since the CRI Proxy is undefined.")
|
|
}
|
|
ginkgo.DeferCleanup(func() error {
|
|
return resetCRIProxyInjector(e2eCriProxy)
|
|
})
|
|
})
|
|
|
|
getImageVolumePod := func() *v1.Pod {
|
|
return &v1.Pod{
|
|
ObjectMeta: metav1.ObjectMeta{
|
|
Name: "image-vol-test-" + string(uuid.NewUUID()),
|
|
Namespace: f.Namespace.Name,
|
|
},
|
|
Spec: v1.PodSpec{
|
|
Containers: []v1.Container{
|
|
{
|
|
Name: "image-vol-container-" + string(uuid.NewUUID()),
|
|
Image: imageutils.GetPauseImageName(),
|
|
VolumeMounts: []v1.VolumeMount{
|
|
{
|
|
Name: volumeName,
|
|
MountPath: "/image-volume-" + string(uuid.NewUUID()),
|
|
},
|
|
},
|
|
},
|
|
},
|
|
Volumes: []v1.Volume{
|
|
{
|
|
Name: volumeName,
|
|
VolumeSource: v1.VolumeSource{
|
|
Image: &v1.ImageVolumeSource{
|
|
Reference: imageutils.GetPauseImageName(),
|
|
PullPolicy: v1.PullAlways,
|
|
},
|
|
},
|
|
},
|
|
},
|
|
},
|
|
}
|
|
}
|
|
|
|
waitForPodContainerStatuses := func(pod *v1.Pod) *v1.Pod {
|
|
ginkgo.By("Waiting for the pod container statuses")
|
|
|
|
var err error
|
|
gomega.Eventually(func() []v1.ContainerStatus {
|
|
pod, err = f.ClientSet.CoreV1().Pods(f.Namespace.Name).Get(context.Background(), pod.Name, metav1.GetOptions{})
|
|
framework.ExpectNoError(err)
|
|
|
|
return pod.Status.ContainerStatuses
|
|
}).WithPolling(5*time.Second).WithTimeout(2*time.Minute).Should(gomega.HaveLen(1), "couldn't find expected container status")
|
|
|
|
return pod
|
|
}
|
|
|
|
getVolumeMountStatus := func(pod *v1.Pod) v1.VolumeMountStatus {
|
|
ginkgo.By("Finding the pod volume mount status")
|
|
|
|
var volMountStatus *v1.VolumeMountStatus
|
|
containerStatus := pod.Status.ContainerStatuses[0]
|
|
|
|
for i := range pod.Status.ContainerStatuses[0].VolumeMounts {
|
|
if containerStatus.VolumeMounts[i].Name == volumeName {
|
|
volMountStatus = &containerStatus.VolumeMounts[i]
|
|
break
|
|
}
|
|
}
|
|
gomega.ExpectWithOffset(1, volMountStatus).ToNot(gomega.BeNil(), "couldn't find expected volume mount status")
|
|
|
|
return *volMountStatus
|
|
}
|
|
|
|
ginkgo.It("should expect error log when ImageStatus fails for image volume digest", func(ctx context.Context) {
|
|
const imageStatusErrMsg = "mock error message - ImageStatus failed"
|
|
|
|
err := addCRIProxyInjector(e2eCriProxy, func(apiName string) error {
|
|
if apiName == criproxy.ImageStatus {
|
|
return errors.New(imageStatusErrMsg)
|
|
}
|
|
return nil
|
|
})
|
|
framework.ExpectNoError(err)
|
|
|
|
pod := getImageVolumePod()
|
|
pod = e2epod.NewPodClient(f).Create(ctx, pod)
|
|
pod = waitForPodContainerStatuses(pod)
|
|
|
|
volMountStatus := getVolumeMountStatus(pod)
|
|
|
|
if volMountStatus.VolumeStatus != nil && volMountStatus.VolumeStatus.Image != nil {
|
|
ginkgo.Fail(fmt.Sprintf("ImageRef should not be set when ImageStatus fails, but got: %s", volMountStatus.VolumeStatus.Image.ImageRef))
|
|
}
|
|
|
|
ginkgo.By("Expecting an error when ImageStatus fails")
|
|
gomega.Eventually(func() error {
|
|
return verifyErrorInKubeletLogs(imageStatusErrMsg)
|
|
}).WithPolling(5*time.Second).WithTimeout(20*time.Second).ToNot(gomega.HaveOccurred(), "Could not verify error in kubelet logs")
|
|
})
|
|
|
|
ginkgo.It("should expect error log for image volume with empty Image.Image", func(ctx context.Context) {
|
|
// This test verifies error handling when imageSpec.Image is empty (curVolumeMount.Image.Image == "").
|
|
|
|
pod := getImageVolumePod()
|
|
pod = e2epod.NewPodClient(f).Create(ctx, pod)
|
|
pod = waitForPodContainerStatuses(pod)
|
|
|
|
volMountStatus := getVolumeMountStatus(pod)
|
|
|
|
if volMountStatus.VolumeStatus != nil && volMountStatus.VolumeStatus.Image != nil {
|
|
ginkgo.Fail(fmt.Sprintf("ImageRef should not be set when ImageStatus fails, but got: %s", volMountStatus.VolumeStatus.Image.ImageRef))
|
|
}
|
|
|
|
ginkgo.By("Expecting an error when imageSpec.Image is empty")
|
|
gomega.Eventually(func() error {
|
|
return verifyErrorInKubeletLogs("Failed to inspect image")
|
|
}).WithPolling(5*time.Second).WithTimeout(20*time.Second).ToNot(gomega.HaveOccurred(), "Could not verify error in kubelet logs")
|
|
})
|
|
})
|
|
|
|
ginkgo.Context("Inject a pull image timeout exception into the CriProxy", func() {
|
|
ginkgo.BeforeEach(func() {
|
|
if err := resetCRIProxyInjector(e2eCriProxy); err != nil {
|
|
ginkgo.Skip("Skip the test since the CRI Proxy is undefined.")
|
|
}
|
|
ginkgo.DeferCleanup(func() error {
|
|
return resetCRIProxyInjector(e2eCriProxy)
|
|
})
|
|
})
|
|
|
|
ginkgo.It("Image pull time exceeded 10 seconds", func(ctx context.Context) {
|
|
const delayTime = 10 * time.Second
|
|
err := addCRIProxyInjector(e2eCriProxy, func(apiName string) error {
|
|
if apiName == criproxy.PullImage {
|
|
time.Sleep(10 * time.Second)
|
|
}
|
|
return nil
|
|
})
|
|
framework.ExpectNoError(err)
|
|
|
|
pod := e2epod.NewPodClient(f).Create(ctx, newPullImageAlwaysPod())
|
|
podErr := e2epod.WaitForPodRunningInNamespace(ctx, f.ClientSet, pod)
|
|
framework.ExpectNoError(podErr)
|
|
|
|
imagePullDuration, err := getPodImagePullDuration(ctx, f, pod.Name)
|
|
framework.ExpectNoError(err)
|
|
|
|
gomega.Expect(imagePullDuration).To(gomega.BeNumerically(">=", delayTime), "PullImages should take more than 10 seconds")
|
|
})
|
|
})
|
|
|
|
// CRI streaming API tests
|
|
framework.Context("CRI streaming list operations", feature.CriProxy, framework.WithFeatureGate(features.CRIListStreaming), func() {
|
|
ginkgo.BeforeEach(func() {
|
|
if err := resetCRIProxyInjector(e2eCriProxy); err != nil {
|
|
ginkgo.Skip("Skip the test since the CRI Proxy is undefined.")
|
|
}
|
|
ginkgo.DeferCleanup(func() error {
|
|
return resetCRIProxyInjector(e2eCriProxy)
|
|
})
|
|
})
|
|
|
|
ginkgo.It("should use streaming RPCs for listing pods and containers", func(ctx context.Context) {
|
|
// Track which streaming APIs were called
|
|
apiCalled := make(map[string]bool)
|
|
err := addCRIProxyInjector(e2eCriProxy, func(apiName string) error {
|
|
apiCalled[apiName] = true
|
|
return nil
|
|
})
|
|
framework.ExpectNoError(err)
|
|
|
|
// Wait for kubelet to make list calls (which should use streaming when enabled)
|
|
gomega.Eventually(func(g gomega.Gomega) {
|
|
g.Expect(apiCalled[criproxy.StreamContainers]).To(gomega.BeTrueBecause("StreamContainers should be called"))
|
|
g.Expect(apiCalled[criproxy.StreamPodSandboxes]).To(gomega.BeTrueBecause("StreamPodSandboxes should be called"))
|
|
g.Expect(apiCalled[criproxy.ListContainers]).To(gomega.BeFalseBecause("ListContainers should not be called"))
|
|
g.Expect(apiCalled[criproxy.ListPodSandbox]).To(gomega.BeFalseBecause("ListPodSandbox should not be called"))
|
|
}).WithPolling(1 * time.Second).WithTimeout(1 * time.Minute).Should(gomega.Succeed())
|
|
})
|
|
|
|
ginkgo.It("should handle mid-stream errors", func(ctx context.Context) {
|
|
// Create a pod so that StreamContainersSend is called at least twice
|
|
// (once per container), allowing us to inject a mid-stream error
|
|
// after the first item is successfully sent.
|
|
e2epod.NewPodClient(f).CreateSync(ctx, newPausePodWithContainers(2))
|
|
|
|
// Track per-call send count so we can fail after the first item
|
|
// is successfully sent, simulating a mid-stream failure.
|
|
var perCallSendCount atomic.Int32
|
|
var midStreamErrors atomic.Int32
|
|
var listFallbackCalls atomic.Int32
|
|
|
|
err := addCRIProxyInjector(e2eCriProxy, func(apiName string) error {
|
|
switch apiName {
|
|
case criproxy.StreamContainers:
|
|
// Reset per-call counter at the start of each streaming call
|
|
perCallSendCount.Store(0)
|
|
case criproxy.StreamContainersSend:
|
|
if perCallSendCount.Add(1) > 1 {
|
|
midStreamErrors.Add(1)
|
|
return status.Error(codes.Internal, "injected mid-stream error")
|
|
}
|
|
case criproxy.ListContainers:
|
|
listFallbackCalls.Add(1)
|
|
}
|
|
return nil
|
|
})
|
|
framework.ExpectNoError(err)
|
|
|
|
// Wait for the mid-stream error to be triggered at least once
|
|
gomega.Eventually(func() bool {
|
|
return midStreamErrors.Load() > 0
|
|
}).WithPolling(1 * time.Second).WithTimeout(1 * time.Minute).Should(
|
|
gomega.BeTrueBecause("Expected mid-stream error to be triggered during StreamContainers"))
|
|
|
|
// Verify no fallback to unary RPC (Internal errors should NOT trigger fallback)
|
|
gomega.Expect(listFallbackCalls.Load()).To(gomega.Equal(int32(0)),
|
|
"Non-Unimplemented errors should not trigger fallback to ListContainers")
|
|
})
|
|
|
|
ginkgo.It("should handle streaming timeout", func(ctx context.Context) {
|
|
// Create a pod so that StreamContainersSend is called at least twice,
|
|
// allowing us to block on the second send to simulate a timeout.
|
|
e2epod.NewPodClient(f).CreateSync(ctx, newPausePodWithContainers(5))
|
|
|
|
var perCallSendCount atomic.Int32
|
|
var listFallbackCalls atomic.Int32
|
|
|
|
err := addCRIProxyInjector(e2eCriProxy, func(apiName string) error {
|
|
switch apiName {
|
|
case criproxy.StreamContainers:
|
|
// Reset per-call counter at the start of each streaming call
|
|
perCallSendCount.Store(0)
|
|
case criproxy.StreamContainersSend:
|
|
// Simulate a slow runtime by waiting one minute per item;
|
|
// the client's context timeout will fire and the Recv()
|
|
// will return DeadlineExceeded.
|
|
time.Sleep(1 * time.Minute)
|
|
perCallSendCount.Add(1)
|
|
case criproxy.ListContainers:
|
|
listFallbackCalls.Add(1)
|
|
}
|
|
return nil
|
|
})
|
|
framework.ExpectNoError(err)
|
|
|
|
// Ensure the number of containers sent per streaming call never exceeds 2,
|
|
// because the connection timeout is set to 2 mins.
|
|
// It confirms the client times out behave the same as List methods.
|
|
gomega.Eventually(func() bool {
|
|
return perCallSendCount.Load() > 0
|
|
}).WithPolling(1 * time.Second).WithTimeout(3 * time.Minute).Should(
|
|
gomega.BeTrueBecause("Expected at least one StreamContainersSend call"))
|
|
gomega.Expect(perCallSendCount.Load()).To(gomega.BeNumerically("<=", int32(2)),
|
|
"Expected no more than 2 containers to be sent before timeout")
|
|
|
|
// Wait for the kubelet to log the streaming recv failure caused by the timeout
|
|
gomega.Eventually(func() error {
|
|
return verifyErrorInKubeletLogs("StreamContainers recv failed")
|
|
}).WithPolling(5*time.Second).WithTimeout(3*time.Minute).Should(gomega.Succeed(),
|
|
"Expected kubelet to log a StreamContainers recv failure due to timeout")
|
|
|
|
// Verify no fallback to unary RPC (timeout errors should NOT trigger fallback)
|
|
gomega.Expect(listFallbackCalls.Load()).To(gomega.Equal(int32(0)),
|
|
"Timeout errors should not trigger fallback to ListContainers")
|
|
})
|
|
|
|
// Each fallback test restarts the kubelet to ensure a fresh CRI client
|
|
// with useStreaming=true, since triggering the Unimplemented fallback
|
|
// permanently disables streaming on the kubelet's CRI client.
|
|
ginkgo.It("should fall back to unary RPC when streaming returns Unimplemented", func(ctx context.Context) {
|
|
// Restart kubelet on cleanup to reset the useStreaming flag,
|
|
// which is cached from the first streaming attempt.
|
|
ginkgo.DeferCleanup(func(ctx context.Context) error {
|
|
err := resetCRIProxyInjector(e2eCriProxy)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
restartKubelet(ctx, true)
|
|
waitForKubeletToStart(ctx, f)
|
|
return nil
|
|
})
|
|
|
|
var streamCallCount atomic.Int32
|
|
var listCallCount atomic.Int32
|
|
|
|
err := addCRIProxyInjector(e2eCriProxy, func(apiName string) error {
|
|
switch apiName {
|
|
case criproxy.StreamContainers:
|
|
streamCallCount.Add(1)
|
|
return status.Error(codes.Unimplemented, "streaming not supported")
|
|
case criproxy.ListContainers:
|
|
listCallCount.Add(1)
|
|
}
|
|
return nil
|
|
})
|
|
framework.ExpectNoError(err)
|
|
|
|
gomega.Eventually(func() bool {
|
|
return listCallCount.Load() > 0
|
|
}).WithPolling(1 * time.Second).WithTimeout(1 * time.Minute).Should(
|
|
gomega.BeTrueBecause("Expected fallback to ListContainers after StreamContainers returned Unimplemented"))
|
|
|
|
gomega.Expect(streamCallCount.Load()).To(gomega.BeNumerically(">=", int32(1)),
|
|
"Expected StreamContainers to be attempted at least once before falling back")
|
|
})
|
|
})
|
|
})
|
|
|
|
func getFailedToPullImageMsg(ctx context.Context, f *framework.Framework, podName string) (string, error) {
|
|
events, err := f.ClientSet.CoreV1().Events(f.Namespace.Name).List(ctx, metav1.ListOptions{})
|
|
if err != nil {
|
|
return "", err
|
|
}
|
|
|
|
for _, event := range events.Items {
|
|
if event.Reason == kubeletevents.FailedToPullImage && event.InvolvedObject.Name == podName {
|
|
return event.Message, nil
|
|
}
|
|
}
|
|
|
|
return "", fmt.Errorf("failed to find FailedToPullImage event for pod: %s", podName)
|
|
}
|
|
|
|
func getPodImagePullDuration(ctx context.Context, f *framework.Framework, podName string) (time.Duration, error) {
|
|
events, err := f.ClientSet.CoreV1().Events(f.Namespace.Name).List(ctx, metav1.ListOptions{})
|
|
if err != nil {
|
|
return 0, err
|
|
}
|
|
|
|
var startTime, endTime time.Time
|
|
for _, event := range events.Items {
|
|
if event.InvolvedObject.Name == podName {
|
|
switch event.Reason {
|
|
case kubeletevents.PullingImage:
|
|
startTime = event.FirstTimestamp.Time
|
|
case kubeletevents.PulledImage:
|
|
endTime = event.FirstTimestamp.Time
|
|
}
|
|
}
|
|
}
|
|
|
|
if startTime.IsZero() || endTime.IsZero() {
|
|
return 0, fmt.Errorf("failed to find both PullingImage and PulledImage events for pod: %s", podName)
|
|
}
|
|
|
|
return endTime.Sub(startTime), nil
|
|
}
|
|
|
|
func newPullImageAlwaysPod() *v1.Pod {
|
|
podName := "cri-proxy-test-" + string(uuid.NewUUID())
|
|
pod := &v1.Pod{
|
|
ObjectMeta: metav1.ObjectMeta{
|
|
Name: podName,
|
|
},
|
|
Spec: v1.PodSpec{
|
|
Containers: []v1.Container{
|
|
{
|
|
Image: imageutils.GetPauseImageName(),
|
|
Name: podName,
|
|
ImagePullPolicy: v1.PullAlways,
|
|
},
|
|
},
|
|
},
|
|
}
|
|
return pod
|
|
}
|
|
|
|
func newPausePodWithContainers(count int) *v1.Pod {
|
|
podName := "cri-proxy-test-" + string(uuid.NewUUID())
|
|
var containers []v1.Container
|
|
for i := range count {
|
|
containers = append(containers, v1.Container{
|
|
Name: fmt.Sprintf("pause-%d", i),
|
|
Image: imageutils.GetPauseImageName(),
|
|
})
|
|
}
|
|
return &v1.Pod{
|
|
ObjectMeta: metav1.ObjectMeta{
|
|
Name: podName,
|
|
},
|
|
Spec: v1.PodSpec{
|
|
Containers: containers,
|
|
},
|
|
}
|
|
}
|
|
|
|
func verifyErrorInKubeletLogs(errorMsg string) error {
|
|
kubeletLog, err := os.ReadFile(framework.TestContext.ReportDir + "/kubelet.log")
|
|
if err != nil {
|
|
return fmt.Errorf("could not read kubelet logs: %w", err)
|
|
}
|
|
|
|
if !strings.Contains(string(kubeletLog), errorMsg) {
|
|
return fmt.Errorf("error message \"%s\" not found in kubelet logs", errorMsg)
|
|
}
|
|
|
|
return nil
|
|
}
|