注意: 急于开始的读者可以直接前往快速入门

正在使用 Kubebuilder v1 或 v2 吗?请查看 v1 和 v2 的旧版文档。

适用对象

Kubernetes 用户

Kubernetes 用户将通过学习 API 的设计与实现所依据的基本概念,对 Kubernetes 形成更深入的认识。本书将教会读者如何开发自己的 Kubernetes API,以及核心 Kubernetes API 设计的原则。

包括:

  • Kubernetes API 和资源的结构
  • API 版本语义
  • 自愈
  • 垃圾回收和终结器
  • 声明式 vs 命令式 API
  • 基于级别 vs 基于边缘的 API
  • 资源 vs 子资源

Kubernetes API 扩展开发者

API 扩展开发者将学习实现规范 Kubernetes API 背后的原则和概念,以及快速执行的简单工具和库。本书涵盖了扩展开发者常遇到的陷阱和误解。

包括:

  • 如何将多个事件批量处理为单个协调调用
  • 如何配置定期协调
  • 即将推出
    • 何时使用列表缓存 vs 实时查找
    • 垃圾回收 vs 终结器
    • 如何使用声明式 vs Webhook 验证
    • 如何实现 API 版本管理

为什么选择 Kubernetes API

Kubernetes API 为对象提供了一致和明确定义的端点,这些对象遵循一致和丰富的结构。

这种方法培育了一个丰富的工具和库生态系统,用于处理 Kubernetes API。

用户通过将对象声明为 yaml 或 json 配置,并使用常见工具来管理对象,从而使用这些 API。

将服务构建为 Kubernetes API 相比于普通的 REST,提供了许多优势,包括:

  • 托管的 API 端点、存储和验证。
  • 丰富的工具和 CLI,如 kubectl 和 kustomize。
  • 对 AuthN 和细粒度 AuthZ 的支持。
  • 通过 API 版本控制和转换支持 API 演进。
  • 促进自适应/自愈 API 的发展,这些 API 可以持续响应系统状态的变化,而无需用户干预。
  • Kubernetes 作为托管环境

开发人员可以构建并发布自己的 Kubernetes API,以安装到运行中的 Kubernetes 集群中。

贡献

如果您想要为本书或代码做出贡献,请先阅读我们的贡献指南。

资源

架构概念图

下图将帮助您更好地理解 Kubebuilder 的概念和架构。

快速入门

本快速入门指南将涵盖以下内容:

先决条件

  • go 版本 v1.20.0+
  • docker 版本 17.03+。
  • kubectl 版本 v1.11.3+。
  • 访问 Kubernetes v1.11.3+ 集群。

安装

安装 kubebuilder

# 下载 kubebuilder 并在本地安装。
curl -L -o kubebuilder "https://go.kubebuilder.io/dl/latest/$(go env GOOS)/$(go env GOARCH)"
chmod +x kubebuilder && mv kubebuilder /usr/local/bin/

创建项目

创建一个目录,然后在其中运行 init 命令以初始化一个新项目。以下是一个示例。

mkdir -p ~/projects/guestbook
cd ~/projects/guestbook
kubebuilder init --domain my.domain --repo my.domain/guestbook

创建 API

运行以下命令以创建一个名为 webapp/v1 的新 API(组/版本),并在其中创建一个名为 Guestbook 的新 Kind(CRD):

kubebuilder create api --group webapp --version v1 --kind Guestbook

可选步骤: 编辑 API 定义和调和业务逻辑。有关更多信息,请参阅设计 API 和控制器概述。

如果您正在编辑 API 定义,可以使用以下命令生成诸如自定义资源(CRs)或自定义资源定义(CRDs)之类的清单:

make manifests
示例(api/v1/guestbook_types.go):

// GuestbookSpec 定义了 Guestbook 的期望状态
type GuestbookSpec struct {
	// 插入其他规范字段 - 集群的期望状态
	// 重要提示:在修改此文件后运行 "make" 以重新生成代码

	// 实例数量
	// +kubebuilder:validation:Minimum=1
	// +kubebuilder:validation:Maximum=10
	Size int32 `json:"size"`

	// GuestbookSpec 配置的 ConfigMap 名称
	// +kubebuilder:validation:MaxLength=15
	// +kubebuilder:validation:MinLength=1
	ConfigMapName string `json:"configMapName"`

	// +kubebuilder:validation:Enum=Phone;Address;Name
	Type string `json:"alias,omitempty"`
}

// GuestbookStatus 定义了 Guestbook 的观察状态
type GuestbookStatus struct {
	// 插入其他状态字段 - 定义集群的观察状态
	// 重要提示:在修改此文件后运行 "make" 以重新生成代码

	// 活动的 Guestbook 节点的 PodName
	Active string `json:"active"`

	// 待机的 Guestbook 节点的 PodNames
	Standby []string `json:"standby"`
}

// +kubebuilder:object:root=true
// +kubebuilder:subresource:status
// +kubebuilder:resource:scope=Cluster

// Guestbook 是 guestbooks API 的架构
type Guestbook struct {
	metav1.TypeMeta   `json:",inline"`
	metav1.ObjectMeta `json:"metadata,omitempty"`

	Spec   GuestbookSpec   `json:"spec,omitempty"`
	Status GuestbookStatus `json:"status,omitempty"`
}

测试

您需要一个 Kubernetes 集群来运行控制器。您可以使用 KIND 创建本地集群进行测试,也可以使用远程集群。

将 CRD 安装到集群中:

make install

为了快速反馈和代码级调试,运行您的控制器(这将在前台运行,如果要保持运行状态,请切换到新终端):

make run

安装自定义资源实例

如果在创建 API 时对 “Create Resource [y/n]” 选择了 y,则会在 config/samples 中为您的 CRD 生成一个示例 CR(如果已更改 API 定义,请确保先编辑这些示例):

kubectl apply -k config/samples/

在集群上运行

当您的控制器准备好打包并在其他集群中进行测试时,请按以下步骤操作。

构建并将您的镜像推送到 IMG 指定的位置:

make docker-build docker-push IMG=<some-registry>/<project-name>:tag

使用由 IMG 指定的镜像将控制器部署到集群中:

make deploy IMG=<some-registry>/<project-name>:tag

卸载 CRD

从集群中删除您的 CRD:

make uninstall

卸载控制器

从集群中卸载控制器:

make undeploy

下一步

现在,查看架构概念图以获得更好的概述,并跟随 CronJob 教程,通过开发一个演示示例项目来更好地了解其工作原理。

入门指南

概述

通过遵循Operator 模式,不仅可以提供所有预期的资源,还可以在执行时动态、以编程方式管理它们。为了说明这个想法,想象一下,如果有人意外更改了配置或者误删了某个资源;在这种情况下,操作员可以在没有任何人工干预的情况下进行修复。

示例项目

我们将创建一个示例项目,以便让您了解它是如何工作的。这个示例将会:

  • 对账一个 Memcached CR - 代表着在集群上部署/管理的 Memcached 实例
  • 创建一个使用 Memcached 镜像的 Deployment
  • 不允许超过 CR 中定义的大小的实例
  • 更新 Memcached CR 的状态

请按照以下步骤操作。

创建项目

首先,创建一个用于您的项目的目录,并进入该目录,然后使用 kubebuilder 进行初始化:

mkdir $GOPATH/memcached-operator
cd $GOPATH/memcached-operator
kubebuilder init --domain=example.com

创建 Memcached API (CRD)

接下来,我们将创建一个新的 API,负责部署和管理我们的 Memcached 解决方案。在这个示例中,我们将使用 Deploy Image 插件来获取我们解决方案的完整代码实现。

kubebuilder create api --group cache \
  --version v1alpha1 \
  --kind Memcached \
  --image=memcached:1.4.36-alpine \
  --image-container-command="memcached,-m=64,-o,modern,-v" \
  --image-container-port="11211" \
  --run-as-user="1001" \
  --plugins="deploy-image/v1-alpha" \
  --make=false

理解 API

这个命令的主要目的是为 Memcached 类型生成自定义资源(CR)和自定义资源定义(CRD)。它使用 group cache.example.com 和 version v1alpha1 来唯一标识 Memcached 类型的新 CRD。通过利用 Kubebuilder 工具,我们可以为这些平台定义我们的 API 和对象。虽然在这个示例中我们只添加了一种资源类型,但您可以根据需要拥有任意多个 Group 和 Kind。简而言之,CRD 是我们自定义对象的定义,而 CR 是它们的实例。

定义您的 API

在这个示例中,可以看到 Memcached 类型(CRD)具有一些特定规格。这些规格是由 Deploy Image 插件为管理目的而默认脚手架生成的:

状态和规格

MemcachedSpec 部分是我们封装所有可用规格和配置的地方,用于我们的自定义资源(CR)。此外,值得注意的是,我们使用了状态条件。这确保了对 Memcached CR 的有效管理。当发生任何更改时,这些条件为我们提供了必要的数据,以便在 Kubernetes 集群中了解此资源的当前状态。这类似于我们为 Deployment 资源获取的状态信息。

从:api/v1alpha1/memcached_types.go

// MemcachedSpec 定义了 Memcached 的期望状态
type MemcachedSpec struct {
	// 插入其他规格字段 - 集群的期望状态
	// 重要:修改此文件后运行 "make" 以重新生成代码
	// Size 定义了 Memcached 实例的数量
	// 以下标记将使用 OpenAPI v3 schema 来验证该值
	// 了解更多信息:https://book.kubebuilder.io/reference/markers/crd-validation.html
	// +kubebuilder:validation:Minimum=1
	// +kubebuilder:validation:Maximum=3
	// +kubebuilder:validation:ExclusiveMaximum=false
	Size int32 `json:"size,omitempty"`

	// Port 定义了将用于使用镜像初始化容器的端口
	ContainerPort int32 `json:"containerPort,omitempty"`
}

// MemcachedStatus 定义了 Memcached 的观察状态
type MemcachedStatus struct {
	// 代表了 Memcached 当前状态的观察结果
	// Memcached.status.conditions.type 为:"Available"、"Progressing" 和 "Degraded"
	// Memcached.status.conditions.status 为 True、False、Unknown 中的一个
	// Memcached.status.conditions.reason 的值应为驼峰字符串,特定条件类型的产生者可以为此字段定义预期值和含义,以及这些值是否被视为 API 的保证
	// Memcached.status.conditions.Message 是一个人类可读的消息,指示有关转换的详细信息
	// 了解更多信息:https://github.com/kubernetes/community/blob/master/contributors/devel/sig-architecture/api-conventions.md#typical-status-properties

	Conditions []metav1.Condition `json:"conditions,omitempty" patchStrategy:"merge" patchMergeKey:"type" protobuf:"bytes,1,rep,name=conditions"`
}

因此,当我们向此文件添加新规格并执行 make generate 命令时,我们使用 controller-gen 生成了 CRD 清单,该清单位于 config/crd/bases 目录下。

标记和验证

此外,值得注意的是,我们正在使用 标记,例如 +kubebuilder:validation:Minimum=1。这些标记有助于定义验证和标准,确保用户提供的数据 - 当他们为 Memcached 类型创建或编辑自定义资源时 - 得到适当的验证。有关可用标记的全面列表和详细信息,请参阅标记文档

观察 CRD 中的验证模式;此模式确保 Kubernetes API 正确验证应用的自定义资源(CR):

从:config/crd/bases/cache.example.com_memcacheds.yaml

description: MemcachedSpec 定义了 Memcached 的期望状态
properties:
  containerPort:
    description: Port 定义了将用于使用镜像初始化容器的端口
    format: int32
    type: integer
  size:
    description: 'Size 定义了 Memcached 实例的数量 以下标记将使用 OpenAPI v3 schema 来验证该值 了解更多信息:https://book.kubebuilder.io/reference/markers/crd-validation.html'
    format: int32
    maximum: 3 ## 从标记 +kubebuilder:validation:Maximum=3 生成
    minimum: 1 ## 从标记 +kubebuilder:validation:Minimum=1 生成
    type: integer

自定义资源示例

位于 “config/samples” 目录下的清单作为可以应用于集群的自定义资源的示例。 在这个特定示例中,通过将给定资源应用到集群中,我们将生成一个大小为 1 的 Deployment 实例(参见 size: 1)。

从:config/samples/cache_v1alpha1_memcached.yaml

apiVersion: cache.example.com/v1alpha1
kind: Memcached
metadata:
  name: memcached-sample
spec:
  # TODO(用户):编辑以下值,确保 Operand 在集群上必须拥有的 Pod/实例数量
  size: 1

  # TODO(用户):编辑以下值,确保容器具有正确的端口进行初始化
  containerPort: 11211

对账过程

对账函数在依据其中嵌入的业务逻辑,保持资源与其规格同步方面起着关键作用。它像一个循环,不断检查条件并执行操作,直到实际状态符合业务逻辑的要求。下面用伪代码来说明这一点:

reconcile App {

  // 检查应用的 Deployment 是否存在,如果不存在则创建一个
  // 如果出现错误,则重新开始对账
  if err != nil {
    return reconcile.Result{}, err
  }

  // 检查应用的 Service 是否存在,如果不存在则创建一个
  // 如果出现错误,则重新开始对账
  if err != nil {
    return reconcile.Result{}, err
  }

  // 查找数据库 CR/CRD
  // 检查数据库 Deployment 的副本大小
  // 如果 deployment.replicas 的大小与 cr.size 不匹配,则更新它
  // 然后,从头开始对账。例如,通过返回 `reconcile.Result{Requeue: true}, nil`。
  if err != nil {
    return reconcile.Result{Requeue: true}, nil
  }
  ...

  // 如果循环结束时:
  // 所有操作都成功执行,对账就可以停止了
  return reconcile.Result{}, nil

}

返回选项

以下是重新开始对账的一些可能返回选项:

  • 带有错误:
return ctrl.Result{}, err
  • 没有错误:
return ctrl.Result{Requeue: true}, nil
  • 停止对账(在成功执行之后,或不需要再次对账时使用):
return ctrl.Result{}, nil
  • X 时间后重新开始对账:
return ctrl.Result{RequeueAfter: nextRun.Sub(r.Now())}, nil

在我们的示例中

当将自定义资源应用到集群时,有一个指定的控制器来管理 Memcached 类型。您可以检查其对账是如何实现的:

从:internal/controller/memcached_controller.go

func (r *MemcachedReconciler) Reconcile(ctx context.Context, req ctrl.Request) (ctrl.Result, error) {
	log := log.FromContext(ctx)

	// 获取 Memcached 实例
	// 目的是检查是否在集群上应用了 Memcached 类型的自定义资源
	// 如果没有,我们将返回 nil 以停止对账过程
	memcached := &examplecomv1alpha1.Memcached{}
	err := r.Get(ctx, req.NamespacedName, memcached)
	if err != nil {
		if apierrors.IsNotFound(err) {
			// 如果找不到自定义资源,通常意味着它已被删除或尚未创建
			// 这样,我们将停止对账过程
			log.Info("未找到 memcached 资源。忽略,因为对象可能已被删除")
			return ctrl.Result{}, nil
		}
		// 读取对象时出错 - 重新排队请求
		log.Error(err, "获取 memcached 失败")
		return ctrl.Result{}, err
	}

	// 当没有状态可用时,让我们将状态设置为 Unknown
	if memcached.Status.Conditions == nil || len(memcached.Status.Conditions) == 0 {
		meta.SetStatusCondition(&memcached.Status.Conditions,
			metav1.Condition{
				Type:    typeAvailableMemcached,
				Status:  metav1.ConditionUnknown,
				Reason:  "Reconciling",
				Message: "开始对账",
			})
		if err = r.Status().Update(ctx, memcached); err != nil {
			log.Error(err, "更新 Memcached 状态失败")
			return ctrl.Result{}, err
		}

		// 更新状态后,让我们重新获取 memcached 自定义资源
		// 以便我们在集群上拥有资源的最新状态,并且避免
		// 引发错误 "对象已被修改,请将您的更改应用到最新版本,然后重试"
		// 如果我们尝试在后续操作中再次更新它,这将重新触发对账过程
		if err := r.Get(ctx, req.NamespacedName, memcached); err != nil {
			log.Error(err, "重新获取 memcached 失败")
			return ctrl.Result{}, err
		}
	}

	// 添加 finalizer。然后,我们可以定义在删除自定义资源之前应执行的一些操作。
	// 更多信息:https://kubernetes.io/docs/concepts/overview/working-with-objects/finalizers
	if !controllerutil.ContainsFinalizer(memcached, memcachedFinalizer) {
		log.Info("为 Memcached 添加 Finalizer")
		if ok := controllerutil.AddFinalizer(memcached, memcachedFinalizer); !ok {
			log.Error(err, "无法将 finalizer 添加到自定义资源")
			return ctrl.Result{Requeue: true}, nil
		}

		if err = r.Update(ctx, memcached); err != nil {
			log.Error(err, "更新自定义资源以添加 finalizer 失败")
			return ctrl.Result{}, err
		}
	}

	// 检查是否标记要删除 Memcached 实例,这通过设置删除时间戳来表示。
	isMemcachedMarkedToBeDeleted := memcached.GetDeletionTimestamp() != nil
	if isMemcachedMarkedToBeDeleted {
		if controllerutil.ContainsFinalizer(memcached, memcachedFinalizer) {
			log.Info("在删除 CR 之前执行 Finalizer 操作")

			// 在这里添加一个状态 "Downgrade",以反映该资源开始其终止过程。
			meta.SetStatusCondition(&memcached.Status.Conditions,
				metav1.Condition{
					Type:    typeDegradedMemcached,
					Status:  metav1.ConditionUnknown,
					Reason:  "Finalizing",
					Message: fmt.Sprintf("执行自定义资源的 finalizer 操作:%s", memcached.Name),
				})

			if err := r.Status().Update(ctx, memcached); err != nil {
				log.Error(err, "更新 Memcached 状态失败")
				return ctrl.Result{}, err
			}

			// 执行在删除 finalizer 之前需要的所有操作,并允许
			// Kubernetes API 删除自定义资源。
			r.doFinalizerOperationsForMemcached(memcached)

			// TODO(用户):如果您在 doFinalizerOperationsForMemcached 方法中添加操作
			// 那么您需要确保一切顺利,然后再删除和更新 Downgrade 状态
			// 否则,您应该在此重新排队。

			// 在更新状态前重新获取 memcached 自定义资源
			// 以便我们在集群上拥有资源的最新状态,并且避免
			// 引发错误 "对象已被修改,请将您的更改应用到最新版本,然后重试"
			// 如果我们尝试在后续操作中再次更新它,这将重新触发对账过程
			if err := r.Get(ctx, req.NamespacedName, memcached); err != nil {
				log.Error(err, "重新获取 memcached 失败")
				return ctrl.Result{}, err
			}

			meta.SetStatusCondition(&memcached.Status.Conditions,
				metav1.Condition{
					Type:    typeDegradedMemcached,
					Status:  metav1.ConditionTrue,
					Reason:  "Finalizing",
					Message: fmt.Sprintf("自定义资源 %s 的 finalizer 操作已成功完成", memcached.Name),
				})

			if err := r.Status().Update(ctx, memcached); err != nil {
				log.Error(err, "更新 Memcached 状态失败")
				return ctrl.Result{}, err
			}

			log.Info("成功执行操作后移除 Memcached 的 Finalizer")
			if ok := controllerutil.RemoveFinalizer(memcached, memcachedFinalizer); !ok {
				log.Error(err, "移除 Memcached 的 finalizer 失败")
				return ctrl.Result{Requeue: true}, nil
			}

			if err := r.Update(ctx, memcached); err != nil {
				log.Error(err, "移除 Memcached 的 finalizer 失败")
				return ctrl.Result{}, err
			}
		}
		return ctrl.Result{}, nil
	}

	// 检查部署是否已经存在,如果不存在则创建新的
	found := &appsv1.Deployment{}
	err = r.Get(ctx, types.NamespacedName{Name: memcached.Name, Namespace: memcached.Namespace}, found)
	if err != nil && apierrors.IsNotFound(err) {
		// 定义一个新的部署
		dep, err := r.deploymentForMemcached(memcached)
		if err != nil {
			log.Error(err, "为 Memcached 定义新的 Deployment 资源失败")

			// 以下实现将更新状态
			meta.SetStatusCondition(&memcached.Status.Conditions, metav1.Condition{
				Type:    typeAvailableMemcached,
				Status:  metav1.ConditionFalse,
				Reason:  "Reconciling",
				Message: fmt.Sprintf("为自定义资源创建 Deployment 失败 (%s): (%s)", memcached.Name, err)})

			if err := r.Status().Update(ctx, memcached); err != nil {
				log.Error(err, "更新 Memcached 状态失败")
				return ctrl.Result{}, err
			}

			return ctrl.Result{}, err
		}

		log.Info("创建新的 Deployment",
			"Deployment.Namespace", dep.Namespace, "Deployment.Name", dep.Name)
		if err = r.Create(ctx, dep); err != nil {
			log.Error(err, "创建新的 Deployment 失败",
				"Deployment.Namespace", dep.Namespace, "Deployment.Name", dep.Name)
			return ctrl.Result{}, err
		}

		// 部署成功创建
		// 我们将重新排队对账,以便确保状态
		// 并继续进行下一步操作
		return ctrl.Result{RequeueAfter: time.Minute}, nil
	} else if err != nil {
		log.Error(err, "获取 Deployment 失败")
		// 让我们返回错误以重新触发对账
		return ctrl.Result{}, err
	}

	// CRD API 定义了 Memcached 类型具有 MemcachedSpec.Size 字段
	// 以设置集群上所需的 Deployment 实例数量。
	// 因此,以下代码将确保 Deployment 大小与我们对账的自定义资源的 Size spec 相同。
	size := memcached.Spec.Size
	if *found.Spec.Replicas != size {
		found.Spec.Replicas = &size
		if err = r.Update(ctx, found); err != nil {
			log.Error(err, "更新 Deployment 失败",
				"Deployment.Namespace", found.Namespace, "Deployment.Name", found.Name)

			// 在更新状态前重新获取 memcached 自定义资源
			// 以便我们在集群上拥有资源的最新状态,并且避免
			// 引发错误 "对象已被修改,请将您的更改应用到最新版本,然后重试"
			// 如果我们尝试在后续操作中再次更新它,这将重新触发对账过程
			if err := r.Get(ctx, req.NamespacedName, memcached); err != nil {
				log.Error(err, "重新获取 memcached 失败")
				return ctrl.Result{}, err
			}

			// 以下实现将更新状态
			meta.SetStatusCondition(&memcached.Status.Conditions, 
				metav1.Condition{
					Type:    typeAvailableMemcached,
					Status:  metav1.ConditionFalse,
					Reason:  "Resizing",
					Message: fmt.Sprintf("更新自定义资源的大小失败 (%s): (%s)", memcached.Name, err),
				})

			if err := r.Status().Update(ctx, memcached); err != nil {
				log.Error(err, "更新 Memcached 状态失败")
				return ctrl.Result{}, err
			}

			return ctrl.Result{}, err
		}

		// 现在,我们更新大小后,希望重新排队对账
		// 以便确保我们拥有资源的最新状态
		// 并帮助确保集群上的期望状态
		return ctrl.Result{Requeue: true}, nil
	}

	// 以下实现将更新状态
	meta.SetStatusCondition(&memcached.Status.Conditions,
		metav1.Condition{
			Type:    typeAvailableMemcached,
			Status:  metav1.ConditionTrue,
			Reason:  "Reconciling",
			Message: fmt.Sprintf("为自定义资源 (%s) 创建 %d 个副本的 Deployment 成功", memcached.Name, size),
		})

	if err := r.Status().Update(ctx, memcached); err != nil {
		log.Error(err, "更新 Memcached 状态失败")
		return ctrl.Result{}, err
	}

	return ctrl.Result{}, nil
}

观察集群上的变化

该控制器持续地观察与该类型相关的任何事件。因此,相关的变化会立即触发控制器的对账过程。值得注意的是,我们已经实现了 watches 特性。(更多信息)。这使我们能够监视与创建、更新或删除 Memcached 类型的自定义资源相关的事件,以及由其相应控制器编排和拥有的 Deployment。请注意以下代码:

// SetupWithManager 使用 Manager 设置控制器。
// 请注意,也将监视 Deployment 以确保其在集群中处于期望的状态
func (r *MemcachedReconciler) SetupWithManager(mgr ctrl.Manager) error {
    return ctrl.NewControllerManagedBy(mgr).
    For(&examplecomv1alpha1.Memcached{}). // 为 Memcached 类型创建监视
    Owns(&appsv1.Deployment{}). // 为其控制器拥有的 Deployment 创建监视
    Complete(r)
}

设置 RBAC 权限

RBAC 权限现在通过 RBAC markers 来配置,这些标记用于生成和更新 config/rbac/ 中的清单文件。这些标记可以(并且应该)定义在每个控制器的 Reconcile() 方法之上,请看我们示例中的实现方式:

//+kubebuilder:rbac:groups=cache.example.com,resources=memcacheds,verbs=get;list;watch;create;update;patch;delete
//+kubebuilder:rbac:groups=cache.example.com,resources=memcacheds/status,verbs=get;update;patch
//+kubebuilder:rbac:groups=cache.example.com,resources=memcacheds/finalizers,verbs=update
//+kubebuilder:rbac:groups=core,resources=events,verbs=create;patch
//+kubebuilder:rbac:groups=apps,resources=deployments,verbs=get;list;watch;create;update;patch;delete
//+kubebuilder:rbac:groups=core,resources=pods,verbs=get;list;watch

重要的是,如果您希望添加或修改 RBAC 规则,可以通过更新或添加控制器中的相应标记来实现。在进行必要的更改后,运行 make manifests 命令。这将促使 controller-gen 刷新位于 config/rbac 下的文件。

Manager(main.go)

Manager 在监督控制器方面扮演着至关重要的角色,这些控制器进而使集群端的操作成为可能。如果您检查 cmd/main.go 文件,您会看到以下内容:

...
    mgr, err := ctrl.NewManager(ctrl.GetConfigOrDie(), ctrl.Options{
        Scheme:                 scheme,
        Metrics:                metricsserver.Options{BindAddress: metricsAddr},
        HealthProbeBindAddress: probeAddr,
        LeaderElection:         enableLeaderElection,
        LeaderElectionID:       "1836d577.testproject.org",
        // LeaderElectionReleaseOnCancel 定义了领导者在 Manager 结束时是否应主动放弃领导权。
        // 这要求二进制在 Manager 停止时立即结束,否则此设置是不安全的。设置此选项显著加快主动领导者转换的速度,
        // 因为新领导者无需等待 LeaseDuration 时间。
        //
        // 在提供的默认脚手架中,程序在 Manager 停止后立即结束,因此启用此选项是可以的。但是,
        // 如果您正在进行任何操作,例如在 Manager 停止后执行清理操作,那么使用它可能是不安全的。
        // LeaderElectionReleaseOnCancel: true,
    })
    if err != nil {
        setupLog.Error(err, "无法启动 Manager")
        os.Exit(1)
    }

上面的代码片段概述了 Manager 的配置选项。虽然我们在当前示例中不会更改这些选项,但了解其位置以及初始化您的基于 Operator 的镜像的过程非常重要。Manager 负责监督为您的 Operator API 生成的控制器。

检查在集群中运行的项目

此时,您可以执行 快速入门 中突出显示的命令。通过执行 make docker-build IMG=myregistry/example:1.0.0,您将为项目构建镜像。出于测试目的,建议将此镜像发布到公共注册表。这样可以确保轻松访问,无需额外的配置。完成后,您可以使用 make deploy IMG=myregistry/example:1.0.0 命令将镜像部署到集群中。

下一步

  • 要深入了解开发解决方案,请考虑阅读提供的教程。
  • 要了解优化您的方法的见解,请参阅最佳实践文档。

教程:构建 CronJob

许多教程都以一些非常牵强的设置或一些用于传达基础知识的玩具应用程序开头,然后在更复杂的内容上停滞不前。相反,这个教程应该带您(几乎)完整地了解 Kubebuilder 的复杂性,从简单开始逐步构建到相当全面的内容。

我们假装(当然,这有点牵强)我们终于厌倦了在 Kubernetes 中使用非 Kubebuilder 实现的 CronJob 控制器的维护负担,我们想要使用 Kubebuilder 进行重写。

CronJob 控制器的任务(不是故意的双关语)是在 Kubernetes 集群上定期间隔运行一次性任务。它通过在 Job 控制器的基础上构建来完成这一点,Job 控制器的任务是运行一次性任务一次,并确保其完成。

我们不打算试图重写 Job 控制器,而是将其视为一个机会来了解如何与外部类型交互。

构建项目框架

快速入门中所述,我们需要构建一个新项目的框架。确保您已经安装了 Kubebuilder,然后构建一个新项目:

# 创建一个项目目录,然后运行初始化命令。
mkdir project
cd project
# 我们将使用 tutorial.kubebuilder.io 作为域,
# 因此所有 API 组将是 <group>.tutorial.kubebuilder.io。
kubebuilder init --domain tutorial.kubebuilder.io --repo tutorial.kubebuilder.io/project

现在我们已经有了一个项目框架,让我们来看看 Kubebuilder 到目前为止为我们生成了什么…

基本项目结构包含什么?

在构建新项目的框架时,Kubebuilder 为我们提供了一些基本的样板文件。

构建基础设施

首先是构建项目的基本基础设施:

go.mod:与我们的项目匹配的新 Go 模块,具有基本依赖项
module tutorial.kubebuilder.io/project

go 1.21

require (
	github.com/onsi/ginkgo/v2 v2.14.0
	github.com/onsi/gomega v1.30.0
	github.com/robfig/cron v1.2.0
	k8s.io/api v0.29.0
	k8s.io/apimachinery v0.29.0
	k8s.io/client-go v0.29.0
	sigs.k8s.io/controller-runtime v0.17.0
)

require (
	github.com/beorn7/perks v1.0.1 // indirect
	github.com/cespare/xxhash/v2 v2.2.0 // indirect
	github.com/davecgh/go-spew v1.1.1 // indirect
	github.com/emicklei/go-restful/v3 v3.11.0 // indirect
	github.com/evanphx/json-patch/v5 v5.8.0 // indirect
	github.com/fsnotify/fsnotify v1.7.0 // indirect
	github.com/go-logr/logr v1.4.1 // indirect
	github.com/go-logr/zapr v1.3.0 // indirect
	github.com/go-openapi/jsonpointer v0.19.6 // indirect
	github.com/go-openapi/jsonreference v0.20.2 // indirect
	github.com/go-openapi/swag v0.22.3 // indirect
	github.com/go-task/slim-sprig v0.0.0-20230315185526-52ccab3ef572 // indirect
	github.com/gogo/protobuf v1.3.2 // indirect
	github.com/golang/groupcache v0.0.0-20210331224755-41bb18bfe9da // indirect
	github.com/golang/protobuf v1.5.3 // indirect
	github.com/google/gnostic-models v0.6.8 // indirect
	github.com/google/go-cmp v0.6.0 // indirect
	github.com/google/gofuzz v1.2.0 // indirect
	github.com/google/pprof v0.0.0-20210720184732-4bb14d4b1be1 // indirect
	github.com/google/uuid v1.3.0 // indirect
	github.com/imdario/mergo v0.3.6 // indirect
	github.com/josharian/intern v1.0.0 // indirect
	github.com/json-iterator/go v1.1.12 // indirect
	github.com/mailru/easyjson v0.7.7 // indirect
	github.com/matttproud/golang_protobuf_extensions/v2 v2.0.0 // indirect
	github.com/modern-go/concurrent v0.0.0-20180306012644-bacd9c7ef1dd // indirect
	github.com/modern-go/reflect2 v1.0.2 // indirect
	github.com/munnerz/goautoneg v0.0.0-20191010083416-a7dc8b61c822 // indirect
	github.com/pkg/errors v0.9.1 // indirect
	github.com/prometheus/client_golang v1.18.0 // indirect
	github.com/prometheus/client_model v0.5.0 // indirect
	github.com/prometheus/common v0.45.0 // indirect
	github.com/prometheus/procfs v0.12.0 // indirect
	github.com/spf13/pflag v1.0.5 // indirect
	go.uber.org/multierr v1.11.0 // indirect
	go.uber.org/zap v1.26.0 // indirect
	golang.org/x/exp v0.0.0-20220722155223-a9213eeb770e // indirect
	golang.org/x/net v0.19.0 // indirect
	golang.org/x/oauth2 v0.12.0 // indirect
	golang.org/x/sys v0.16.0 // indirect
	golang.org/x/term v0.15.0 // indirect
	golang.org/x/text v0.14.0 // indirect
	golang.org/x/time v0.3.0 // indirect
	golang.org/x/tools v0.16.1 // indirect
	gomodules.xyz/jsonpatch/v2 v2.4.0 // indirect
	google.golang.org/appengine v1.6.7 // indirect
	google.golang.org/protobuf v1.31.0 // indirect
	gopkg.in/inf.v0 v0.9.1 // indirect
	gopkg.in/yaml.v2 v2.4.0 // indirect
	gopkg.in/yaml.v3 v3.0.1 // indirect
	k8s.io/apiextensions-apiserver v0.29.0 // indirect
	k8s.io/component-base v0.29.0 // indirect
	k8s.io/klog/v2 v2.110.1 // indirect
	k8s.io/kube-openapi v0.0.0-20231010175941-2dd684a91f00 // indirect
	k8s.io/utils v0.0.0-20230726121419-3b25d923346b // indirect
	sigs.k8s.io/json v0.0.0-20221116044647-bc3834ca7abd // indirect
	sigs.k8s.io/structured-merge-diff/v4 v4.4.1 // indirect
	sigs.k8s.io/yaml v1.4.0 // indirect
)
Makefile:用于构建和部署控制器的 Make 目标

# Image URL to use all building/pushing image targets
IMG ?= controller:latest
# ENVTEST_K8S_VERSION refers to the version of kubebuilder assets to be downloaded by envtest binary.
ENVTEST_K8S_VERSION = 1.29.0

# Get the currently used golang install path (in GOPATH/bin, unless GOBIN is set)
ifeq (,$(shell go env GOBIN))
GOBIN=$(shell go env GOPATH)/bin
else
GOBIN=$(shell go env GOBIN)
endif

# CONTAINER_TOOL defines the container tool to be used for building images.
# Be aware that the target commands are only tested with Docker which is
# scaffolded by default. However, you might want to replace it to use other
# tools. (i.e. podman)
CONTAINER_TOOL ?= docker

# Setting SHELL to bash allows bash commands to be executed by recipes.
# Options are set to exit when a recipe line exits non-zero or a piped command fails.
SHELL = /usr/bin/env bash -o pipefail
.SHELLFLAGS = -ec

.PHONY: all
all: build

##@ General

# The help target prints out all targets with their descriptions organized
# beneath their categories. The categories are represented by '##@' and the
# target descriptions by '##'. The awk command is responsible for reading the
# entire set of makefiles included in this invocation, looking for lines of the
# file as xyz: ## something, and then pretty-format the target and help. Then,
# if there's a line with ##@ something, that gets pretty-printed as a category.
# More info on the usage of ANSI control characters for terminal formatting:
# https://en.wikipedia.org/wiki/ANSI_escape_code#SGR_parameters
# More info on the awk command:
# http://linuxcommand.org/lc3_adv_awk.php

.PHONY: help
help: ## Display this help.
	@awk 'BEGIN {FS = ":.*##"; printf "\nUsage:\n  make \033[36m<target>\033[0m\n"} /^[a-zA-Z_0-9-]+:.*?##/ { printf "  \033[36m%-15s\033[0m %s\n", $$1, $$2 } /^##@/ { printf "\n\033[1m%s\033[0m\n", substr($$0, 5) } ' $(MAKEFILE_LIST)

##@ Development

.PHONY: manifests
manifests: controller-gen ## Generate WebhookConfiguration, ClusterRole and CustomResourceDefinition objects.
	$(CONTROLLER_GEN) rbac:roleName=manager-role crd webhook paths="./..." output:crd:artifacts:config=config/crd/bases

.PHONY: generate
generate: controller-gen ## Generate code containing DeepCopy, DeepCopyInto, and DeepCopyObject method implementations.
	$(CONTROLLER_GEN) object:headerFile="hack/boilerplate.go.txt" paths="./..."

.PHONY: fmt
fmt: ## Run go fmt against code.
	go fmt ./...

.PHONY: vet
vet: ## Run go vet against code.
	go vet ./...

.PHONY: test
test: manifests generate fmt vet envtest ## Run tests.
	KUBEBUILDER_ASSETS="$(shell $(ENVTEST) use $(ENVTEST_K8S_VERSION) --bin-dir $(LOCALBIN) -p path)" go test $$(go list ./... | grep -v /e2e) -coverprofile cover.out

# Utilize Kind or modify the e2e tests to load the image locally, enabling compatibility with other vendors.
.PHONY: test-e2e  # Run the e2e tests against a Kind k8s instance that is spun up.
test-e2e:
	go test ./test/e2e/ -v -ginkgo.v

.PHONY: lint
lint: golangci-lint ## Run golangci-lint linter & yamllint
	$(GOLANGCI_LINT) run

.PHONY: lint-fix
lint-fix: golangci-lint ## Run golangci-lint linter and perform fixes
	$(GOLANGCI_LINT) run --fix

##@ Build

.PHONY: build
build: manifests generate fmt vet ## Build manager binary.
	go build -o bin/manager cmd/main.go

.PHONY: run
run: manifests generate fmt vet ## Run a controller from your host.
	go run ./cmd/main.go

# If you wish to build the manager image targeting other platforms you can use the --platform flag.
# (i.e. docker build --platform linux/arm64). However, you must enable docker buildKit for it.
# More info: https://docs.docker.com/develop/develop-images/build_enhancements/
.PHONY: docker-build
docker-build: ## Build docker image with the manager.
	$(CONTAINER_TOOL) build -t ${IMG} .

.PHONY: docker-push
docker-push: ## Push docker image with the manager.
	$(CONTAINER_TOOL) push ${IMG}

# PLATFORMS defines the target platforms for the manager image be built to provide support to multiple
# architectures. (i.e. make docker-buildx IMG=myregistry/mypoperator:0.0.1). To use this option you need to:
# - be able to use docker buildx. More info: https://docs.docker.com/build/buildx/
# - have enabled BuildKit. More info: https://docs.docker.com/develop/develop-images/build_enhancements/
# - be able to push the image to your registry (i.e. if you do not set a valid value via IMG=<myregistry/image:<tag>> then the export will fail)
# To adequately provide solutions that are compatible with multiple platforms, you should consider using this option.
PLATFORMS ?= linux/arm64,linux/amd64,linux/s390x,linux/ppc64le
.PHONY: docker-buildx
docker-buildx: ## Build and push docker image for the manager for cross-platform support
	# copy existing Dockerfile and insert --platform=${BUILDPLATFORM} into Dockerfile.cross, and preserve the original Dockerfile
	sed -e '1 s/\(^FROM\)/FROM --platform=\$$\{BUILDPLATFORM\}/; t' -e ' 1,// s//FROM --platform=\$$\{BUILDPLATFORM\}/' Dockerfile > Dockerfile.cross
	- $(CONTAINER_TOOL) buildx create --name project-v3-builder
	$(CONTAINER_TOOL) buildx use project-v3-builder
	- $(CONTAINER_TOOL) buildx build --push --platform=$(PLATFORMS) --tag ${IMG} -f Dockerfile.cross .
	- $(CONTAINER_TOOL) buildx rm project-v3-builder
	rm Dockerfile.cross

.PHONY: build-installer
build-installer: manifests generate kustomize ## Generate a consolidated YAML with CRDs and deployment.
	mkdir -p dist
	echo "---" > dist/install.yaml # Clean previous content
	@if [ -d "config/crd" ]; then \
		$(KUSTOMIZE) build config/crd > dist/install.yaml; \
		echo "---" >> dist/install.yaml; \
	fi
	cd config/manager && $(KUSTOMIZE) edit set image controller=${IMG}
	$(KUSTOMIZE) build config/default >> dist/install.yaml

##@ Deployment

ifndef ignore-not-found
  ignore-not-found = false
endif

.PHONY: install
install: manifests kustomize ## Install CRDs into the K8s cluster specified in ~/.kube/config.
	$(KUSTOMIZE) build config/crd | $(KUBECTL) apply -f -

.PHONY: uninstall
uninstall: manifests kustomize ## Uninstall CRDs from the K8s cluster specified in ~/.kube/config. Call with ignore-not-found=true to ignore resource not found errors during deletion.
	$(KUSTOMIZE) build config/crd | $(KUBECTL) delete --ignore-not-found=$(ignore-not-found) -f -

.PHONY: deploy
deploy: manifests kustomize ## Deploy controller to the K8s cluster specified in ~/.kube/config.
	cd config/manager && $(KUSTOMIZE) edit set image controller=${IMG}
	$(KUSTOMIZE) build config/default | $(KUBECTL) apply -f -

.PHONY: undeploy
undeploy: kustomize ## Undeploy controller from the K8s cluster specified in ~/.kube/config. Call with ignore-not-found=true to ignore resource not found errors during deletion.
	$(KUSTOMIZE) build config/default | $(KUBECTL) delete --ignore-not-found=$(ignore-not-found) -f -

##@ Dependencies

## Location to install dependencies to
LOCALBIN ?= $(shell pwd)/bin
$(LOCALBIN):
	mkdir -p $(LOCALBIN)

## Tool Binaries
KUBECTL ?= kubectl
KUSTOMIZE ?= $(LOCALBIN)/kustomize-$(KUSTOMIZE_VERSION)
CONTROLLER_GEN ?= $(LOCALBIN)/controller-gen-$(CONTROLLER_TOOLS_VERSION)
ENVTEST ?= $(LOCALBIN)/setup-envtest-$(ENVTEST_VERSION)
GOLANGCI_LINT = $(LOCALBIN)/golangci-lint-$(GOLANGCI_LINT_VERSION)

## Tool Versions
KUSTOMIZE_VERSION ?= v5.3.0
CONTROLLER_TOOLS_VERSION ?= v0.14.0
ENVTEST_VERSION ?= latest
GOLANGCI_LINT_VERSION ?= v1.54.2

.PHONY: kustomize
kustomize: $(KUSTOMIZE) ## Download kustomize locally if necessary.
$(KUSTOMIZE): $(LOCALBIN)
	$(call go-install-tool,$(KUSTOMIZE),sigs.k8s.io/kustomize/kustomize/v5,$(KUSTOMIZE_VERSION))

.PHONY: controller-gen
controller-gen: $(CONTROLLER_GEN) ## Download controller-gen locally if necessary.
$(CONTROLLER_GEN): $(LOCALBIN)
	$(call go-install-tool,$(CONTROLLER_GEN),sigs.k8s.io/controller-tools/cmd/controller-gen,$(CONTROLLER_TOOLS_VERSION))

.PHONY: envtest
envtest: $(ENVTEST) ## Download setup-envtest locally if necessary.
$(ENVTEST): $(LOCALBIN)
	$(call go-install-tool,$(ENVTEST),sigs.k8s.io/controller-runtime/tools/setup-envtest,$(ENVTEST_VERSION))

.PHONY: golangci-lint
golangci-lint: $(GOLANGCI_LINT) ## Download golangci-lint locally if necessary.
$(GOLANGCI_LINT): $(LOCALBIN)
	$(call go-install-tool,$(GOLANGCI_LINT),github.com/golangci/golangci-lint/cmd/golangci-lint,${GOLANGCI_LINT_VERSION})

# go-install-tool will 'go install' any package with custom target and name of binary, if it doesn't exist
# $1 - target path with name of binary (ideally with version)
# $2 - package url which can be installed
# $3 - specific version of package
define go-install-tool
@[ -f $(1) ] || { \
set -e; \
package=$(2)@$(3) ;\
echo "Downloading $${package}" ;\
GOBIN=$(LOCALBIN) go install $${package} ;\
mv "$$(echo "$(1)" | sed "s/-$(3)$$//")" $(1) ;\
}
endef
PROJECT:用于构建新组件的 Kubebuilder 元数据
# Code generated by tool. DO NOT EDIT.
# This file is used to track the info used to scaffold your project
# and allow the plugins properly work.
# More info: https://book.kubebuilder.io/reference/project-config.html
domain: tutorial.kubebuilder.io
layout:
- go.kubebuilder.io/v4
projectName: project
repo: tutorial.kubebuilder.io/project
resources:
- api:
    crdVersion: v1
    namespaced: true
  controller: true
  domain: tutorial.kubebuilder.io
  group: batch
  kind: CronJob
  path: tutorial.kubebuilder.io/project/api/v1
  version: v1
  webhooks:
    defaulting: true
    validation: true
    webhookVersion: v1
version: "3"

启动配置

我们还在config/目录下获得了启动配置。目前,它只包含了Kustomize YAML 定义,用于在集群上启动我们的控制器,但一旦我们开始编写控制器,它还将包含我们的自定义资源定义、RBAC 配置和 Webhook 配置。

config/default 包含了一个Kustomize 基础配置,用于在标准配置中启动控制器。

每个其他目录都包含一个不同的配置部分,重构为自己的基础配置:

  • config/manager:在集群中将您的控制器作为 Pod 启动

  • config/rbac:在其自己的服务帐户下运行您的控制器所需的权限

入口点

最后,但肯定不是最不重要的,Kubebuilder 为我们的项目生成了基本的入口点:main.go。让我们接着看看…

每段旅程都需要一个起点,每个程序都需要一个主函数

emptymain.go
Apache License

版权所有 2022 年 Kubernetes 作者。

根据 Apache 许可,版本 2.0(“许可”)获得许可; 除非符合许可的规定,否则您不得使用此文件。 您可以在以下网址获取许可的副本:

http://www.apache.org/licenses/LICENSE-2.0

除非适用法律要求或书面同意,否则根据许可分发的软件将按“原样“分发, 不附带任何明示或暗示的担保或条件。 请参阅许可,了解特定语言下的权限和限制。

我们的包从一些基本的导入开始。特别是:

  • 核心的 controller-runtime
  • 默认的 controller-runtime 日志记录,Zap(稍后会详细介绍)
package main

import (
	"flag"
	"os"

	// 导入所有 Kubernetes 客户端认证插件(例如 Azure、GCP、OIDC 等)
	// 以确保 exec-entrypoint 和 run 可以利用它们。
	_ "k8s.io/client-go/plugin/pkg/client/auth"

	"k8s.io/apimachinery/pkg/runtime"
	utilruntime "k8s.io/apimachinery/pkg/util/runtime"
	clientgoscheme "k8s.io/client-go/kubernetes/scheme"
	_ "k8s.io/client-go/plugin/pkg/client/auth/gcp"
	ctrl "sigs.k8s.io/controller-runtime"
	"sigs.k8s.io/controller-runtime/pkg/cache"
	"sigs.k8s.io/controller-runtime/pkg/healthz"
	"sigs.k8s.io/controller-runtime/pkg/log/zap"
	"sigs.k8s.io/controller-runtime/pkg/metrics/server"
	"sigs.k8s.io/controller-runtime/pkg/webhook"
	// +kubebuilder:scaffold:imports
)

每组控制器都需要一个 Scheme, 它提供了 Kinds 与它们对应的 Go 类型之间的映射。稍后在编写 API 定义时,我们将更详细地讨论 Kinds,所以稍后再谈。

var (
	scheme   = runtime.NewScheme()
	setupLog = ctrl.Log.WithName("setup")
)

func init() {
	utilruntime.Must(clientgoscheme.AddToScheme(scheme))

	//+kubebuilder:scaffold:scheme
}

此时,我们的主函数相当简单:

  • 我们为指标设置了一些基本的标志。

  • 我们实例化了一个 manager, 它负责运行我们所有的控制器,并设置了共享缓存和客户端到 API 服务器的连接(请注意我们告诉 manager 关于我们的 Scheme)。

  • 我们运行我们的 manager,它反过来运行我们所有的控制器和 Webhooks。 manager 被设置为在接收到优雅关闭信号之前一直运行。 这样,当我们在 Kubernetes 上运行时,我们会在 Pod 优雅终止时表现良好。

虽然目前我们没有任何东西要运行,但记住+kubebuilder:scaffold:builder注释的位置——很快那里会变得有趣起来。

func main() {
	var metricsAddr string
	var enableLeaderElection bool
	var probeAddr string
	flag.StringVar(&metricsAddr, "metrics-bind-address", ":8080", "The address the metric endpoint binds to.")
	flag.StringVar(&probeAddr, "health-probe-bind-address", ":8081", "The address the probe endpoint binds to.")
	flag.BoolVar(&enableLeaderElection, "leader-elect", false,
		"Enable leader election for controller manager. "+
			"Enabling this will ensure there is only one active controller manager.")
	opts := zap.Options{
		Development: true,
	}
	opts.BindFlags(flag.CommandLine)
	flag.Parse()

	ctrl.SetLogger(zap.New(zap.UseFlagOptions(&opts)))

	mgr, err := ctrl.NewManager(ctrl.GetConfigOrDie(), ctrl.Options{
		Scheme: scheme,
		Metrics: server.Options{
			BindAddress: metricsAddr,
		},
		WebhookServer:          webhook.NewServer(webhook.Options{Port: 9443}),
		HealthProbeBindAddress: probeAddr,
		LeaderElection:         enableLeaderElection,
		LeaderElectionID:       "80807133.tutorial.kubebuilder.io",
	})
	if err != nil {
		setupLog.Error(err, "unable to start manager")
		os.Exit(1)
	}

注意,可以通过以下方式限制 Manager,让所有控制器只监视特定命名空间中的资源:

	mgr, err := ctrl.NewManager(ctrl.GetConfigOrDie(), ctrl.Options{
		Scheme: scheme,
		Cache: cache.Options{
			DefaultNamespaces: map[string]cache.Config{
				namespace: {},
			},
		},
		Metrics: server.Options{
			BindAddress: metricsAddr,
		},
		WebhookServer:          webhook.NewServer(webhook.Options{Port: 9443}),
		HealthProbeBindAddress: probeAddr,
		LeaderElection:         enableLeaderElection,
		LeaderElectionID:       "80807133.tutorial.kubebuilder.io",
	})

上面的示例会把项目的作用范围限定到单个 Namespace。在这种情况下,建议同时将授权限制到该命名空间,方法是将默认的 ClusterRole 和 ClusterRoleBinding 替换为 Role 和 RoleBinding。有关更多信息,请参阅 Kubernetes 关于使用 RBAC 授权的文档。

此外,还可以通过 cache.Options{} 中的 DefaultNamespaces 缓存特定一组命名空间中的对象:

	var namespaces []string // 名称空间列表
	defaultNamespaces := make(map[string]cache.Config)

	for _, ns := range namespaces {
		defaultNamespaces[ns] = cache.Config{}
	}

	mgr, err := ctrl.NewManager(ctrl.GetConfigOrDie(), ctrl.Options{
		Scheme: scheme,
		Cache: cache.Options{
			DefaultNamespaces: defaultNamespaces,
		},
		Metrics: server.Options{
			BindAddress: metricsAddr,
		},
		WebhookServer:          webhook.NewServer(webhook.Options{Port: 9443}),
		HealthProbeBindAddress: probeAddr,
		LeaderElection:         enableLeaderElection,
		LeaderElectionID:       "80807133.tutorial.kubebuilder.io",
	})

有关更多信息,请参阅 cache.Options{}

	// +kubebuilder:scaffold:builder

	if err := mgr.AddHealthzCheck("healthz", healthz.Ping); err != nil {
		setupLog.Error(err, "unable to set up health check")
		os.Exit(1)
	}
	if err := mgr.AddReadyzCheck("readyz", healthz.Ping); err != nil {
		setupLog.Error(err, "unable to set up ready check")
		os.Exit(1)
	}

	setupLog.Info("starting manager")
	if err := mgr.Start(ctrl.SetupSignalHandler()); err != nil {
		setupLog.Error(err, "problem running manager")
		os.Exit(1)
	}
}

有了这个,我们可以开始构建我们的 API 了!

组、版本和类型

实际上,在开始创建我们的 API 之前,我们应该稍微谈一下术语。

当我们在 Kubernetes 中讨论 API 时,我们经常使用 4 个术语:groups(组)、versions(版本)、kinds(类型)和resources(资源)。

组和版本

在 Kubernetes 中,API Group(API 组)简单地是相关功能的集合。每个组都有一个或多个versions(版本),正如其名称所示,允许我们随着时间的推移改变 API 的工作方式。

类型和资源

每个 API 组-版本包含一个或多个 API 类型,我们称之为 kinds(类型)。虽然一个类型在不同版本之间可能会改变形式,但每种形式都必须能够以某种方式存储其他形式的所有数据(我们可以将数据存储在字段中,或者在注释中)。这意味着使用较旧的 API 版本不会导致较新的数据丢失或损坏。您还会听到 resources(资源)的说法,资源只是 API 中对某个类型的一种使用。通常,类型和资源之间是一一对应的,例如 pods 资源对应于 Pod 类型。然而,有时同一类型可能由多个资源返回。例如,Scale 类型由所有规模子资源返回,比如 deployments/scale 或 replicasets/scale。这就是允许 Kubernetes HorizontalPodAutoscaler 与不同资源交互的原因。然而,对于自定义资源定义(CRD),每种类型将对应于单个资源。

请注意,资源始终以小写形式存在,并且按照惯例是类型的小写形式。

这如何对应到 Go 语言?

当我们提到特定组-版本中的一种类型时,我们将其称为 GroupVersionKind,简称 GVK;资源对应的则是 GroupVersionResource(GVR)。正如我们将很快看到的那样,每个 GVK 对应于包中的某个根 Go 类型。
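
下面用一个小示例展示 GVK 与 GVR 在 Go 中的表示(使用 k8s.io/apimachinery 的 schema 包,组名沿用本教程的 batch.tutorial.kubebuilder.io,仅作演示):

package main

import (
	"fmt"

	"k8s.io/apimachinery/pkg/runtime/schema"
)

func main() {
	// GVK:组-版本-类型,对应包中的某个根 Go 类型(例如 CronJob)
	gvk := schema.GroupVersionKind{
		Group:   "batch.tutorial.kubebuilder.io",
		Version: "v1",
		Kind:    "CronJob",
	}

	// GVR:组-版本-资源,资源名按惯例是类型名的小写复数形式
	gvr := schema.GroupVersionResource{
		Group:    "batch.tutorial.kubebuilder.io",
		Version:  "v1",
		Resource: "cronjobs",
	}

	fmt.Println(gvk) // batch.tutorial.kubebuilder.io/v1, Kind=CronJob
	fmt.Println(gvr) // batch.tutorial.kubebuilder.io/v1, Resource=cronjobs
}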

现在我们术语明晰了,我们可以实际地创建我们的 API!

那么,我们如何创建我们的 API?

在接下来的添加新 API部分中,我们将检查工具如何帮助我们使用命令kubebuilder create api创建我们自己的 API。

这个命令的目标是为我们的类型创建自定义资源(CR)和自定义资源定义(CRD)。要进一步了解,请参阅使用自定义资源定义扩展 Kubernetes API

但是,为什么要创建 API?

新的 API 是我们向 Kubernetes 介绍自定义对象的方式。Go 结构用于生成包括我们数据模式以及跟踪新类型名称等数据的 CRD。然后,我们可以创建我们自定义对象的实例,这些实例将由我们的controllers管理。

我们的 API 和资源代表着我们在集群中的解决方案。基本上,CRD 是我们定制对象的定义,而 CR 是它的一个实例。

啊,你有例子吗?

让我们想象一个经典的场景,目标是在 Kubernetes 平台上运行应用程序及其数据库。然后,一个 CRD 可以代表应用程序,另一个可以代表数据库。通过创建一个 CRD 描述应用程序,另一个描述数据库,我们不会伤害封装、单一责任原则和内聚等概念。损害这些概念可能会导致意想不到的副作用,比如扩展、重用或维护方面的困难,仅举几例。

这样,我们可以创建应用程序 CRD,它将拥有自己的控制器,并负责创建包含应用程序的部署以及创建访问它的服务等工作。类似地,我们可以创建一个代表数据库的 CRD,并部署一个负责管理数据库实例的控制器。

呃,那个 Scheme 是什么?

我们之前看到的Scheme只是一种跟踪给定 GVK 对应的 Go 类型的方式(不要被其godocs所压倒)。

例如,假设我们标记"tutorial.kubebuilder.io/api/v1".CronJob{}类型属于batch.tutorial.kubebuilder.io/v1 API 组(隐含地表示它具有类型CronJob)。

然后,我们可以根据来自 API 服务器的一些 JSON 构造一个新的&CronJob{},其中说

{
    "kind": "CronJob",
    "apiVersion": "batch.tutorial.kubebuilder.io/v1",
    ...
}

或者在我们提交一个&CronJob{}进行更新时,正确查找组-版本。
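
作为补充,下面的小示例演示如何用 Scheme 反查某个 Go 类型注册时对应的 GVK(假设已经像脚手架那样提供了 api/v1 的 AddToScheme,这一部分会在下一章生成;仅作示意):

import (
	"fmt"

	"k8s.io/apimachinery/pkg/runtime"

	batchv1 "tutorial.kubebuilder.io/project/api/v1"
)

func printCronJobGVK() error {
	scheme := runtime.NewScheme()
	if err := batchv1.AddToScheme(scheme); err != nil {
		return err
	}

	// ObjectKinds 根据 Go 类型返回它注册时对应的 GVK 列表
	gvks, _, err := scheme.ObjectKinds(&batchv1.CronJob{})
	if err != nil {
		return err
	}
	fmt.Println(gvks[0]) // batch.tutorial.kubebuilder.io/v1, Kind=CronJob
	return nil
}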

创建一个新的 API

要创建一个新的 Kind(你有关注上一章的内容吗?)以及相应的控制器,我们可以使用 kubebuilder create api 命令:

kubebuilder create api --group batch --version v1 --kind CronJob

按下 y 键来选择 “Create Resource” 和 “Create Controller”。

第一次针对每个 group-version 调用此命令时,它将为新的 group-version 创建一个目录。

在这种情况下,将创建一个名为 api/v1/ 的目录,对应于 batch.tutorial.kubebuilder.io/v1(还记得我们从一开始设置的 --domain 吗?)。

它还将添加一个用于我们的 CronJob Kind 的文件,即 api/v1/cronjob_types.go。每次使用不同的 Kind 调用该命令时,它都会添加一个相应的新文件。

让我们看看我们得到了什么,然后我们可以开始填写它。

emptyapi.go
Apache License

版权所有 2022。

根据 Apache 许可证 2.0 版(“许可证”)获得许可; 除非符合许可证的规定,否则您不得使用此文件。 您可以在下面的网址获取许可证的副本

http://www.apache.org/licenses/LICENSE-2.0

除非适用法律要求或书面同意,否则根据许可证分发的软件 以“原样“为基础分发,没有任何明示或暗示的保证或条件。 请参阅特定语言管理权限和限制的许可证。

我们从简单的开始:我们导入 meta/v1 API 组,它通常不是单独公开的,而是包含所有 Kubernetes Kind 的公共元数据。

package v1

import (
	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
)

接下来,我们为我们的 Kind 的 Spec 和 Status 定义类型。Kubernetes 通过协调期望状态(Spec)与实际的集群状态(其他对象的 Status)以及外部状态,然后把它观察到的内容记录下来(Status)来运行。因此,几乎每个功能性对象都包括 spec 和 status。少数类型(比如 ConfigMap)不遵循这种模式,因为它们不编码期望状态,但大多数类型都是这样。

// 编辑此文件!这是你拥有的脚手架!
// 注意:json 标记是必需的。您添加的任何新字段必须具有 json 标记,以便对字段进行序列化。

// CronJobSpec 定义了 CronJob 的期望状态
type CronJobSpec struct {
	// 插入其他的 Spec 字段 - 集群的期望状态
	// 重要提示:在修改此文件后运行 "make" 以重新生成代码
}

// CronJobStatus 定义了 CronJob 的观察状态
type CronJobStatus struct {
	// 插入其他的状态字段 - 定义集群的观察状态
	// 重要提示:在修改此文件后运行 "make" 以重新生成代码
}

接下来,我们定义与实际 Kinds 对应的类型,CronJobCronJobListCronJob 是我们的根类型,描述了 CronJob 类型。与所有 Kubernetes 对象一样,它包含 TypeMeta(描述 API 版本和 Kind), 还包含 ObjectMeta,其中包含名称、命名空间和标签等信息。

CronJobList 简单地是多个 CronJob 的容器。它是用于批量操作(如 LIST)的 Kind。

一般情况下,我们从不修改它们中的任何一个 – 所有的修改都在 Spec 或 Status 中进行。

这个小小的 +kubebuilder:object:root 注释称为标记。我们稍后会看到更多这样的标记,但要知道它们作为额外的元数据,告诉 controller-tools(我们的代码和 YAML 生成器)额外的信息。 这个特定的标记告诉 object 生成器,这个类型表示一个 Kind。然后,object 生成器为我们生成了 runtime.Object 接口的实现,这是所有表示 Kinds 的类型必须实现的标准接口。

//+kubebuilder:object:root=true
//+kubebuilder:subresource:status

// CronJob 是 cronjobs API 的架构
type CronJob struct {
	metav1.TypeMeta   `json:",inline"`
	metav1.ObjectMeta `json:"metadata,omitempty"`

	Spec   CronJobSpec   `json:"spec,omitempty"`
	Status CronJobStatus `json:"status,omitempty"`
}

//+kubebuilder:object:root=true

// CronJobList 包含 CronJob 的列表
type CronJobList struct {
	metav1.TypeMeta `json:",inline"`
	metav1.ListMeta `json:"metadata,omitempty"`
	Items           []CronJob `json:"items"`
}

最后,我们将 Go 类型添加到 API 组中。这使我们可以将此 API 组中的类型添加到任何 Scheme 中。

func init() {
	SchemeBuilder.Register(&CronJob{}, &CronJobList{})
}

现在我们已经了解了基本结构,让我们继续填写它!

设计 API

在 Kubernetes 中,我们有一些关于如何设计 API 的规则。特别是,所有序列化字段必须使用 camelCase,因此我们使用 JSON 结构标记来指定这一点。我们还可以使用 omitempty 结构标记,表示字段为空时在序列化时应当省略。

字段可以使用大多数基本类型。数字是个例外:出于 API 兼容性的目的,我们接受三种形式的数字:int32int64 用于整数,resource.Quantity 用于小数。

等等,什么是 Quantity?

Quantity 是一种特殊的表示小数的记法,它具有明确定义的固定表示,使其在不同机器上更易于移植。在 Kubernetes 中,当指定 pod 的资源请求和限制时,您可能已经注意到了它们。

它们在概念上类似于浮点数:它们有一个有效数字、基数和指数。它们的可序列化和人类可读格式使用整数和后缀来指定值,就像我们描述计算机存储的方式一样。

例如,值 2m 表示十进制记法中的 0.002;2Ki 表示十进制中的 2048,而 2K 表示十进制中的 2000。如果我们想指定分数,我们可以切换到另一个后缀,从而仍然使用整数:2.5 等价于 2500m。

有两种支持的基数:10 和 2(分别称为十进制和二进制)。十进制基数用“正常”的 SI 后缀表示(例如MK),而二进制基数则用“mebi”记法表示(例如MiKi)。可以参考兆字节和二进制兆字节

我们还使用另一种特殊类型:metav1.Time。它的功能与time.Time完全相同,只是它具有固定的、可移植的序列化格式。
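
下面用一个小例子演示这两种类型的行为(基于 k8s.io/apimachinery;输出值与上文的描述一致,仅作演示):

package main

import (
	"encoding/json"
	"fmt"
	"time"

	"k8s.io/apimachinery/pkg/api/resource"
	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
)

func main() {
	// resource.Quantity:带后缀的定点数表示
	fmt.Println(resource.MustParse("2Ki").Value())      // 2048
	fmt.Println(resource.MustParse("2K").Value())       // 2000
	fmt.Println(resource.MustParse("2m").MilliValue())  // 2,即 0.002
	fmt.Println(resource.MustParse("2.5").MilliValue()) // 2500,等价于 2500m

	// metav1.Time:与 time.Time 等价,但序列化为固定的 RFC 3339 格式
	t := metav1.NewTime(time.Date(2024, 1, 2, 3, 4, 5, 0, time.UTC))
	out, _ := json.Marshal(t)
	fmt.Println(string(out)) // "2024-01-02T03:04:05Z"
}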

现在,让我们来看看我们的 CronJob 对象是什么样子的!

project/api/v1/cronjob_types.go
Apache License

版权所有 2024 年 Kubernetes 作者。

根据 Apache 许可证 2.0 版(以下简称“许可证”)获得许可; 除非符合许可证的规定,否则您不得使用此文件。 您可以在以下网址获取许可证的副本

http://www.apache.org/licenses/LICENSE-2.0

除非适用法律要求或书面同意,根据许可证分发的软件是基于“按原样”分发的, 没有任何明示或暗示的担保或条件。请参阅许可证以获取有关特定语言管理权限和限制的详细信息。

package v1
Imports
import (
	batchv1 "k8s.io/api/batch/v1"
	corev1 "k8s.io/api/core/v1"
	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
)

// EDIT THIS FILE!  THIS IS SCAFFOLDING FOR YOU TO OWN!
// 注意:json 标记是必需的。您添加的任何新字段都必须具有字段的 json 标记以进行序列化。

首先,让我们看一下我们的规范。正如我们之前讨论过的,规范保存期望状态,因此我们控制器的任何“输入”都在这里。

从根本上讲,CronJob 需要以下几个部分:

  • 一个计划(CronJob 中的 cron
  • 一个要运行的作业的模板(CronJob 中的 job

我们还希望有一些额外的内容,这些将使我们的用户生活更轻松:

  • 启动作业的可选截止时间(如果错过此截止时间,我们将等到下一个预定的时间)
  • 如果多个作业同时运行,应该怎么办(我们等待吗?停止旧的作业?两者都运行?)
  • 暂停运行 CronJob 的方法,以防出现问题
  • 对旧作业历史记录的限制

请记住,由于我们从不读取自己的状态,我们需要有其他方法来跟踪作业是否已运行。我们可以使用至少一个旧作业来做到这一点。

我们将使用几个标记(// +comment)来指定额外的元数据。这些将在生成我们的 CRD 清单时由 controller-tools 使用。 正如我们将在稍后看到的,controller-tools 还将使用 GoDoc 来形成字段的描述。

// CronJobSpec 定义了 CronJob 的期望状态
type CronJobSpec struct {
	//+kubebuilder:validation:MinLength=0

	// Cron 格式的计划,请参阅 https://en.wikipedia.org/wiki/Cron。
	Schedule string `json:"schedule"`

	//+kubebuilder:validation:Minimum=0

	// 如果由于任何原因错过预定的时间,则作业启动的可选截止时间(以秒为单位)。错过的作业执行将被视为失败的作业。
	// +optional
	StartingDeadlineSeconds *int64 `json:"startingDeadlineSeconds,omitempty"`

	// 指定如何处理作业的并发执行。
	// 有效值包括:
	// - "Allow"(默认):允许 CronJob 并发运行;
	// - "Forbid":禁止并发运行,如果上一次运行尚未完成,则跳过下一次运行;
	// - "Replace":取消当前正在运行的作业,并用新作业替换它
	// +optional
	ConcurrencyPolicy ConcurrencyPolicy `json:"concurrencyPolicy,omitempty"`

	// 此标志告诉控制器暂停后续执行,它不适用于已经启动的执行。默认为 false。
	// +optional
	Suspend *bool `json:"suspend,omitempty"`

	// 指定执行 CronJob 时将创建的作业。
	JobTemplate batchv1.JobTemplateSpec `json:"jobTemplate"`

	//+kubebuilder:validation:Minimum=0

	// 要保留的成功完成作业的数量。
	// 这是一个指针,用于区分明确的零和未指定的情况。
	// +optional
	SuccessfulJobsHistoryLimit *int32 `json:"successfulJobsHistoryLimit,omitempty"`

	//+kubebuilder:validation:Minimum=0

	// 要保留的失败完成作业的数量。
	// 这是一个指针,用于区分明确的零和未指定的情况。
	// +optional
	FailedJobsHistoryLimit *int32 `json:"failedJobsHistoryLimit,omitempty"`
}

我们定义了一个自定义类型来保存我们的并发策略。实际上,它在内部只是一个字符串,但该类型提供了额外的文档,并允许我们在类型而不是字段上附加验证,使验证更容易重用。

// ConcurrencyPolicy 描述作业将如何被处理。
// 只能指定以下并发策略中的一种。
// 如果没有指定任何一种策略,则默认为 AllowConcurrent。
// +kubebuilder:validation:Enum=Allow;Forbid;Replace
type ConcurrencyPolicy string

const (
	// AllowConcurrent 允许 CronJob 并发运行。
	AllowConcurrent ConcurrencyPolicy = "Allow"

	// ForbidConcurrent 禁止并发运行,如果上一个作业尚未完成,则跳过下一个运行。
	ForbidConcurrent ConcurrencyPolicy = "Forbid"

	// ReplaceConcurrent 取消当前正在运行的作业,并用新作业替换它。
	ReplaceConcurrent ConcurrencyPolicy = "Replace"
)

接下来,让我们设计我们的状态,其中包含观察到的状态。它包含我们希望用户或其他控制器能够轻松获取的任何信息。

我们将保留一个正在运行的作业列表,以及我们成功运行作业的上次时间。请注意,我们使用 metav1.Time 而不是 time.Time 来获得稳定的序列化,如上文所述。

// CronJobStatus 定义了 CronJob 的观察状态
type CronJobStatus struct {
	// 插入额外的状态字段 - 定义集群的观察状态
	// 重要提示:在修改此文件后,请运行“make”以重新生成代码

	// 指向当前正在运行的作业的指针列表。
	// +optional
	Active []corev1.ObjectReference `json:"active,omitempty"`

	// 作业最后成功调度的时间。
	// +optional
	LastScheduleTime *metav1.Time `json:"lastScheduleTime,omitempty"`
}

最后,是我们已经讨论过的其余样板代码。如前所述,除了添加状态子资源的标记,让它表现得像内置的 Kubernetes 类型之外,我们不需要修改这部分。

//+kubebuilder:object:root=true
//+kubebuilder:subresource:status

// CronJob 是 cronjobs API 的模式
type CronJob struct {
	metav1.TypeMeta   `json:",inline"`
	metav1.ObjectMeta `json:"metadata,omitempty"`

	Spec   CronJobSpec   `json:"spec,omitempty"`
	Status CronJobStatus `json:"status,omitempty"`
}

//+kubebuilder:object:root=true

// CronJobList 包含 CronJob 的列表
type CronJobList struct {
	metav1.TypeMeta `json:",inline"`
	metav1.ListMeta `json:"metadata,omitempty"`
	Items           []CronJob `json:"items"`
}

func init() {
	SchemeBuilder.Register(&CronJob{}, &CronJobList{})
}

既然我们有了一个 API,我们需要编写一个控制器来实际实现功能。

简要说明:其他文件的内容是什么?

如果你浏览了 api/v1/ 目录中的其他文件,你可能会注意到除了 cronjob_types.go 外还有两个额外的文件:groupversion_info.gozz_generated.deepcopy.go

这两个文件都不需要进行编辑(前者保持不变,后者是自动生成的),但了解它们的内容是很有用的。

groupversion_info.go

groupversion_info.go 包含有关组版本的常见元数据:

project/api/v1/groupversion_info.go
Apache License

版权所有 2024 年 Kubernetes 作者。

根据 Apache 许可,版本 2.0 进行许可(“许可”); 除非遵守许可,否则您不得使用此文件。 您可以在以下网址获取许可的副本:

http://www.apache.org/licenses/LICENSE-2.0

除非适用法律要求或书面同意,根据许可分发的软件是基于“按原样“的基础分发的, 不附带任何明示或暗示的担保或条件。 请参阅许可以获取特定语言下的权限和限制。

首先,我们有一些 包级别 的标记,表示此包中有 Kubernetes 对象,并且此包表示组 batch.tutorial.kubebuilder.ioobject 生成器利用前者,而 CRD 生成器则利用后者从此包中生成正确的 CRD 元数据。

// Package v1 包含了 batch v1 API 组的 API Schema 定义
// +kubebuilder:object:generate=true
// +groupName=batch.tutorial.kubebuilder.io
package v1

import (
	"k8s.io/apimachinery/pkg/runtime/schema"
	"sigs.k8s.io/controller-runtime/pkg/scheme"
)

然后,我们有一些通常有用的变量,帮助我们设置 Scheme。 由于我们需要在我们的控制器中使用此包中的所有类型,有一个方便的方法将所有类型添加到某个 Scheme 中是很有帮助的(也是惯例)。SchemeBuilder 为我们简化了这一过程。

var (
	// GroupVersion 是用于注册这些对象的组版本
	GroupVersion = schema.GroupVersion{Group: "batch.tutorial.kubebuilder.io", Version: "v1"}

	// SchemeBuilder 用于将 go 类型添加到 GroupVersionKind scheme
	SchemeBuilder = &scheme.Builder{GroupVersion: GroupVersion}

	// AddToScheme 将此组版本中的类型添加到给定的 scheme 中。
	AddToScheme = SchemeBuilder.AddToScheme
)

zz_generated.deepcopy.go

zz_generated.deepcopy.go 包含了上述 runtime.Object 接口的自动生成实现,该接口标记了所有我们的根类型表示的 Kinds。

runtime.Object 接口的核心是一个深度复制方法 DeepCopyObject

controller-tools 中的 object 生成器还为每个根类型及其所有子类型生成了另外两个方便的方法:DeepCopyDeepCopyInto
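
以 CronJob 为例,生成出来的方法大致形如下面这样(这里只是手写的示意,实际内容以 controller-gen 生成的 zz_generated.deepcopy.go 为准):

// DeepCopyInto 把接收者深拷贝到 out 中
func (in *CronJob) DeepCopyInto(out *CronJob) {
	*out = *in
	out.TypeMeta = in.TypeMeta
	in.ObjectMeta.DeepCopyInto(&out.ObjectMeta)
	in.Spec.DeepCopyInto(&out.Spec)
	in.Status.DeepCopyInto(&out.Status)
}

// DeepCopy 返回接收者的深拷贝
func (in *CronJob) DeepCopy() *CronJob {
	if in == nil {
		return nil
	}
	out := new(CronJob)
	in.DeepCopyInto(out)
	return out
}

// DeepCopyObject 以 runtime.Object 的形式返回深拷贝,从而满足 runtime.Object 接口
func (in *CronJob) DeepCopyObject() runtime.Object {
	if c := in.DeepCopy(); c != nil {
		return c
	}
	return nil
}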

控制器的内容是什么?

控制器是 Kubernetes 和任何操作者的核心。

控制器的工作是确保对于任何给定的对象,世界的实际状态(集群状态,以及可能是 Kubelet 的运行容器或云提供商的负载均衡器等外部状态)与对象中的期望状态相匹配。每个控制器专注于一个 Kind,但可能会与其他 Kinds 交互。

我们称这个过程为调和

在 controller-runtime 中,实现特定 Kind 的调和逻辑称为Reconciler。调和器接受一个对象的名称,并返回我们是否需要再次尝试(例如在出现错误或周期性控制器(如 HorizontalPodAutoscaler)的情况下)。
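
controller-runtime 中对应的接口非常小,形状大致如下(reconcile.Func 是 controller-runtime 提供的函数适配器,便于用一个函数实现该接口;此处仅作示意):

import (
	"context"

	"sigs.k8s.io/controller-runtime/pkg/reconcile"
)

// Reconciler 只需要实现一个 Reconcile 方法:
// 输入是对象的名称(reconcile.Request 中的 NamespacedName),
// 输出是是否需要重新排队(reconcile.Result)以及可能的错误
var _ reconcile.Reconciler = reconcile.Func(
	func(ctx context.Context, req reconcile.Request) (reconcile.Result, error) {
		// 在这里读取对象的实际状态,并驱动它向期望状态收敛
		return reconcile.Result{}, nil
	},
)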

emptycontroller.go
Apache License

版权所有 2022。

根据 Apache 许可,版本 2.0 进行许可(“许可”); 除非遵守许可,否则您不得使用此文件。 您可以在以下网址获取许可的副本:

http://www.apache.org/licenses/LICENSE-2.0

除非适用法律要求或书面同意,根据许可分发的软件是基于“按原样“的基础分发的, 不附带任何明示或暗示的担保或条件。 请参阅许可以获取特定语言下的权限和限制。

首先,我们从一些标准的导入开始。 与之前一样,我们需要核心的 controller-runtime 库,以及 client 包和我们的 API 类型包。

package controllers

import (
	"context"

	"k8s.io/apimachinery/pkg/runtime"
	ctrl "sigs.k8s.io/controller-runtime"
	"sigs.k8s.io/controller-runtime/pkg/client"
	"sigs.k8s.io/controller-runtime/pkg/log"

	batchv1 "tutorial.kubebuilder.io/project/api/v1"
)

接下来,kubebuilder 为我们生成了一个基本的 reconciler 结构。 几乎每个 reconciler 都需要记录日志,并且需要能够获取对象,因此这些都是开箱即用的。

// CronJobReconciler reconciles a CronJob object
type CronJobReconciler struct {
	client.Client
	Scheme *runtime.Scheme
}

大多数控制器最终都会在集群上运行,因此它们需要 RBAC 权限,我们使用 controller-tools 的 RBAC markers 来指定这些权限。这些是运行所需的最低权限。 随着我们添加更多功能,我们将需要重新审视这些权限。

// +kubebuilder:rbac:groups=batch.tutorial.kubebuilder.io,resources=cronjobs,verbs=get;list;watch;create;update;patch;delete
// +kubebuilder:rbac:groups=batch.tutorial.kubebuilder.io,resources=cronjobs/status,verbs=get;update;patch

ClusterRole manifest 位于 config/rbac/role.yaml,通过以下命令使用 controller-gen 从上述标记生成:

make manifests

注意:如果收到错误,请运行错误中指定的命令,然后重新运行 make manifests

Reconcile 实际上执行单个命名对象的对账。 我们的 Request 只有一个名称,但我们可以使用 client 从缓存中获取该对象。

我们返回一个空结果且没有错误,这向 controller-runtime 表明我们已成功对账了此对象,在其发生变更之前不需要再次尝试。

大多数控制器需要一个记录句柄和一个上下文,因此我们在这里设置它们。

context 用于允许取消请求,以及可能的跟踪等功能。它是所有 client 方法的第一个参数。Background 上下文只是一个基本上没有任何额外数据或时间限制的上下文。

记录句柄让我们记录日志。controller-runtime 通过一个名为 logr 的库使用结构化日志。很快我们会看到,日志记录通过将键值对附加到静态消息上来实现。我们可以在我们的 reconciler 的顶部预先分配一些键值对,以便将它们附加到此 reconciler 中的所有日志行。

func (r *CronJobReconciler) Reconcile(ctx context.Context, req ctrl.Request) (ctrl.Result, error) {
	_ = log.FromContext(ctx)

	// your logic here

	return ctrl.Result{}, nil
}

最后,我们将此 reconciler 添加到 manager 中,以便在启动 manager 时启动它。

目前,我们只指出此 reconciler 作用于 CronJob。稍后,我们将使用这个来标记我们关心相关的对象。

func (r *CronJobReconciler) SetupWithManager(mgr ctrl.Manager) error {
	return ctrl.NewControllerManagedBy(mgr).
		For(&batchv1.CronJob{}).
		Complete(r)
}

现在我们已经看到了调和器的基本结构,让我们填写 CronJob 的逻辑。

实现一个控制器

我们的CronJob控制器的基本逻辑如下:

  1. 加载指定的CronJob

  2. 列出所有活动的作业,并更新状态

  3. 根据历史限制清理旧作业

  4. 检查我们是否被暂停(如果是,则不执行其他操作)

  5. 获取下一个预定运行时间

  6. 如果符合预定时间、未超过截止时间,并且不受并发策略阻塞,则运行一个新作业

  7. 当我们看到一个正在运行的作业(自动完成)或者到了下一个预定运行时间时,重新排队。

project/internal/controller/cronjob_controller.go
Apache License

版权所有 2024 Kubernetes 作者。

根据 Apache 许可证 2.0 版(“许可证”)获得许可; 除非符合许可证的规定,否则您不得使用此文件。 您可以在以下网址获取许可证的副本

http://www.apache.org/licenses/LICENSE-2.0

除非适用法律要求或书面同意,否则根据许可证分发的软件 将按“原样“分发,不附带任何明示或暗示的担保或条件。 请参阅许可证以了解特定语言下的权限和限制。

我们将从一些导入开始。您将看到我们需要比为我们自动生成的导入更多的导入。 我们将在使用每个导入时讨论它们。

package controller

import (
	"context"
	"fmt"
	"sort"
	"time"

	"github.com/robfig/cron"
	kbatch "k8s.io/api/batch/v1"
	corev1 "k8s.io/api/core/v1"
	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
	"k8s.io/apimachinery/pkg/runtime"
	ref "k8s.io/client-go/tools/reference"
	ctrl "sigs.k8s.io/controller-runtime"
	"sigs.k8s.io/controller-runtime/pkg/client"
	"sigs.k8s.io/controller-runtime/pkg/log"

	batchv1 "tutorial.kubebuilder.io/project/api/v1"
)

接下来,我们需要一个时钟,它将允许我们在测试中模拟时间。

// CronJobReconciler 调和 CronJob 对象
type CronJobReconciler struct {
	client.Client
	Scheme *runtime.Scheme
	Clock
}
Clock

我们将模拟时钟以便在测试中更容易地跳转时间,“真实”时钟只是调用 time.Now。

type realClock struct{}

func (_ realClock) Now() time.Time { return time.Now() }

// 时钟知道如何获取当前时间。
// 它可以用于测试中模拟时间。
type Clock interface {
	Now() time.Time
}
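
在测试中,可以注入一个返回固定时间的假时钟,让调度计算变得可预测。下面是一个简单的示意(fakeClock 是这里为了说明而起的名字,不属于脚手架生成的代码):

// fakeClock 总是返回构造时给定的时间
type fakeClock struct {
	now time.Time
}

func (f fakeClock) Now() time.Time { return f.now }

构造 reconciler 时把它赋给 Clock 字段即可,例如 CronJobReconciler{Client: c, Scheme: s, Clock: fakeClock{now: fixedTime}}(其中 c、s、fixedTime 是测试中已有的变量,这里仅作假设)。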

请注意,我们需要更多的 RBAC 权限 —— 因为我们现在正在创建和管理作业,所以我们需要为这些操作添加权限, 这意味着需要添加一些 标记

//+kubebuilder:rbac:groups=batch.tutorial.kubebuilder.io,resources=cronjobs,verbs=get;list;watch;create;update;patch;delete
//+kubebuilder:rbac:groups=batch.tutorial.kubebuilder.io,resources=cronjobs/status,verbs=get;update;patch
//+kubebuilder:rbac:groups=batch.tutorial.kubebuilder.io,resources=cronjobs/finalizers,verbs=update
//+kubebuilder:rbac:groups=batch,resources=jobs,verbs=get;list;watch;create;update;patch;delete
//+kubebuilder:rbac:groups=batch,resources=jobs/status,verbs=get

现在,我们进入控制器的核心——调和逻辑。

var (
	scheduledTimeAnnotation = "batch.tutorial.kubebuilder.io/scheduled-at"
)

// Reconcile 是主要的 Kubernetes 调和循环的一部分,旨在将集群的当前状态移动到期望的状态。
// TODO(用户):修改 Reconcile 函数以比较 CronJob 对象指定的状态与实际集群状态,然后执行操作以使集群状态反映用户指定的状态。
//
// 有关更多详细信息,请查看此处的 Reconcile 和其结果:
// - https://pkg.go.dev/sigs.k8s.io/controller-runtime@v0.17.0/pkg/reconcile
func (r *CronJobReconciler) Reconcile(ctx context.Context, req ctrl.Request) (ctrl.Result, error) {
	log := log.FromContext(ctx)

1: 通过名称加载 CronJob

我们将使用我们的客户端获取 CronJob。所有客户端方法都以上下文(以允许取消)作为它们的第一个参数, 并以对象本身作为它们的最后一个参数。Get 有点特殊,因为它以一个 NamespacedName 作为中间参数(大多数没有中间参数,正如我们将在下面看到的)。

许多客户端方法还在最后接受可变选项。

	var cronJob batchv1.CronJob
	if err := r.Get(ctx, req.NamespacedName, &cronJob); err != nil {
		log.Error(err, "无法获取 CronJob")
		// 我们将忽略未找到的错误,因为它们不能通过立即重新排队来修复(我们需要等待新的通知),并且我们可以在删除的请求中得到它们。
		return ctrl.Result{}, client.IgnoreNotFound(err)
	}

2: 列出所有活动作业,并更新状态

为了完全更新我们的状态,我们需要列出此命名空间中属于此 CronJob 的所有子作业。 类似于 Get,我们可以使用 List 方法列出子作业。请注意,我们使用可变选项设置命名空间和字段匹配(实际上是我们在下面设置的索引查找)。

	var childJobs kbatch.JobList
	if err := r.List(ctx, &childJobs, client.InNamespace(req.Namespace), client.MatchingFields{jobOwnerKey: req.Name}); err != nil {
		log.Error(err, "无法列出子作业")
		return ctrl.Result{}, err
	}

一旦我们获取了所有属于我们的作业,我们就将它们分为活动、成功和失败三类,并跟踪最近一次的运行时间,以便在状态中记录它。请记住,状态应该能够根据实际情况随时重建,因此通常不建议从根对象的状态中读取数据。相反,您应该在每次运行时重新构建它。这就是我们在这里要做的事情。

我们可以使用状态条件来检查作业是否“完成”,以及它是成功还是失败。我们将把这个逻辑放在一个辅助函数中,使我们的代码更清晰。

	// 找到活动作业列表
	var activeJobs []*kbatch.Job
	var successfulJobs []*kbatch.Job
	var failedJobs []*kbatch.Job
	var mostRecentTime *time.Time // 找到最近的运行时间,以便我们可以在状态中记录它
isJobFinished

如果作业具有状态为 true 的 “Complete” 或 “Failed” 条件,我们就认为它已经“完成”。状态条件允许我们向对象添加可扩展的状态信息,其他人和控制器都可以检查这些信息,以了解作业的完成情况和健康状况等。

	isJobFinished := func(job *kbatch.Job) (bool, kbatch.JobConditionType) {
		for _, c := range job.Status.Conditions {
			if (c.Type == kbatch.JobComplete || c.Type == kbatch.JobFailed) && c.Status == corev1.ConditionTrue {
				return true, c.Type
			}
		}

		return false, ""
	}
getScheduledTimeForJob

我们将使用一个辅助函数从我们在作业创建时添加的注释中提取预定时间。

	getScheduledTimeForJob := func(job *kbatch.Job) (*time.Time, error) {
		timeRaw := job.Annotations[scheduledTimeAnnotation]
		if len(timeRaw) == 0 {
			return nil, nil
		}

		timeParsed, err := time.Parse(time.RFC3339, timeRaw)
		if err != nil {
			return nil, err
		}
		return &timeParsed, nil
	}
	for i, job := range childJobs.Items {
		_, finishedType := isJobFinished(&job)
		switch finishedType {
		case "": // 进行中
			activeJobs = append(activeJobs, &childJobs.Items[i])
		case kbatch.JobFailed:
			failedJobs = append(failedJobs, &childJobs.Items[i])
		case kbatch.JobComplete:
			successfulJobs = append(successfulJobs, &childJobs.Items[i])
		}

		// 我们将在注释中存储启动时间,因此我们将从活动作业中重新构建它。
		scheduledTimeForJob, err := getScheduledTimeForJob(&job)
		if err != nil {
			log.Error(err, "无法解析子作业的计划时间", "job", &job)
			continue
		}
		if scheduledTimeForJob != nil {
			if mostRecentTime == nil || mostRecentTime.Before(*scheduledTimeForJob) {
				mostRecentTime = scheduledTimeForJob
			}
		}
	}

	if mostRecentTime != nil {
		cronJob.Status.LastScheduleTime = &metav1.Time{Time: *mostRecentTime}
	} else {
		cronJob.Status.LastScheduleTime = nil
	}
	cronJob.Status.Active = nil
	for _, activeJob := range activeJobs {
		jobRef, err := ref.GetReference(r.Scheme, activeJob)
		if err != nil {
			log.Error(err, "无法引用活动作业", "job", activeJob)
			continue
		}
		cronJob.Status.Active = append(cronJob.Status.Active, *jobRef)
	}

在这里,我们将记录我们观察到的作业数量,以便进行调试。请注意,我们不使用格式字符串,而是使用固定消息,并附加附加信息的键值对。这样可以更容易地过滤和查询日志行。

	log.V(1).Info("作业数量", "活动作业", len(activeJobs), "成功的作业", len(successfulJobs), "失败的作业", len(failedJobs))
使用我们收集的数据,我们将更新我们的 CRD 的状态。

就像之前一样,我们使用我们的客户端。为了专门更新状态子资源,我们将使用客户端的 Status 部分,以及 Update 方法。

状态子资源会忽略对 spec 的更改,因此不太可能与任何其他更新冲突,并且可以具有单独的权限。

	if err := r.Status().Update(ctx, &cronJob); err != nil {
		log.Error(err, "无法更新 CronJob 状态")
		return ctrl.Result{}, err
	}

一旦我们更新了我们的状态,我们可以继续确保世界的状态与我们在规范中想要的状态匹配。

3: 根据历史限制清理旧作业

首先,我们将尝试清理旧作业,以免留下太多作业。

	// 注意:删除这些是"尽力而为"的——如果我们在特定的作业上失败,我们不会重新排队只是为了完成删除。
	if cronJob.Spec.FailedJobsHistoryLimit != nil {
		sort.Slice(failedJobs, func(i, j int) bool {
			if failedJobs[i].Status.StartTime == nil {
				return failedJobs[j].Status.StartTime != nil
			}
			return failedJobs[i].Status.StartTime.Before(failedJobs[j].Status.StartTime)
		})
		for i, job := range failedJobs {
			if int32(i) >= int32(len(failedJobs))-*cronJob.Spec.FailedJobsHistoryLimit {
				break
			}
			if err := r.Delete(ctx, job, client.PropagationPolicy(metav1.DeletePropagationBackground)); client.IgnoreNotFound(err) != nil {
				log.Error(err, "无法删除旧的失败作业", "job", job)
			} else {
				log.V(0).Info("已删除旧的失败作业", "job", job)
			}
		}
	}

	if cronJob.Spec.SuccessfulJobsHistoryLimit != nil {
		sort.Slice(successfulJobs, func(i, j int) bool {
			if successfulJobs[i].Status.StartTime == nil {
				return successfulJobs[j].Status.StartTime != nil
			}
			return successfulJobs[i].Status.StartTime.Before(successfulJobs[j].Status.StartTime)
		})
		for i, job := range successfulJobs {
			if int32(i) >= int32(len(successfulJobs))-*cronJob.Spec.SuccessfulJobsHistoryLimit {
				break
			}
			if err := r.Delete(ctx, job, client.PropagationPolicy(metav1.DeletePropagationBackground)); err != nil {
				log.Error(err, "无法删除旧的成功作业", "job", job)
			} else {
				log.V(0).Info("已删除旧的成功作业", "job", job)
			}
		}
	}

4: 检查我们是否被暂停

如果此对象被暂停,我们不希望运行任何作业,所以我们将立即停止。 如果我们正在运行的作业出现问题,我们希望暂停运行以进行调查或对集群进行操作,而不删除对象,这是很有用的。

	if cronJob.Spec.Suspend != nil && *cronJob.Spec.Suspend {
		log.V(1).Info("CronJob 已暂停,跳过")
		return ctrl.Result{}, nil
	}

5: 获取下一个预定运行时间

如果我们没有暂停,我们将需要计算下一个预定运行时间,以及我们是否有一个尚未处理的运行。

我们将使用我们有用的 cron 库来计算下一个预定时间。 我们将从我们的最后一次运行时间开始计算适当的时间,或者如果我们找不到最后一次运行,则从 CronJob 的创建开始计算。

如果错过了太多的运行并且我们没有设置任何截止时间,那么我们将中止,以免在控制器重新启动或发生故障时引起问题。

否则,我们将返回错过的运行(我们将只使用最新的),以及下一个运行,以便我们知道何时再次进行调和。

	getNextSchedule := func(cronJob *batchv1.CronJob, now time.Time) (lastMissed time.Time, next time.Time, err error) {
		sched, err := cron.ParseStandard(cronJob.Spec.Schedule)
		if err != nil {
			return time.Time{}, time.Time{}, fmt.Errorf("不可解析的调度 %q:%v", cronJob.Spec.Schedule, err)
		}

		// 为了优化起见,稍微作弊一下,从我们最后观察到的运行时间开始
		// 我们可以在这里重建这个,但是没有什么意义,因为我们刚刚更新了它。
		var earliestTime time.Time
		if cronJob.Status.LastScheduleTime != nil {
			earliestTime = cronJob.Status.LastScheduleTime.Time
		} else {
			earliestTime = cronJob.ObjectMeta.CreationTimestamp.Time
		}
		if cronJob.Spec.StartingDeadlineSeconds != nil {
			// 控制器将不会在此点以下调度任何内容
			schedulingDeadline := now.Add(-time.Second * time.Duration(*cronJob.Spec.StartingDeadlineSeconds))

			if schedulingDeadline.After(earliestTime) {
				earliestTime = schedulingDeadline
			}
		}
		if earliestTime.After(now) {
			return time.Time{}, sched.Next(now), nil
		}

		starts := 0

		// 我们将从最后一次运行时间开始,找到下一个运行时间
		for t := sched.Next(earliestTime); !t.After(now); t = sched.Next(t) {
			starts++
			if starts > 100 {
				return time.Time{}, time.Time{}, fmt.Errorf("错过了太多的运行")
			}
			lastMissed = t
		}

		return lastMissed, sched.Next(now), nil
	}

	// 在这个简化的版本中我们只用到下一次运行时间,因此丢弃返回的 lastMissed。
	_, nextRun, err := getNextSchedule(&cronJob, r.Now())
	if err != nil {
		log.Error(err, "无法计算下一个运行时间")
		return ctrl.Result{}, err
	}

6: 创建下一个作业

最后,我们将创建下一个作业,以便在下一个运行时间触发。

	// 我们将创建一个新的作业对象,并设置它的所有者引用以确保我们在删除时正确清理。
	newJob := &kbatch.Job{
		ObjectMeta: metav1.ObjectMeta{
			GenerateName: cronJob.Name + "-",
			Namespace:    cronJob.Namespace,
			OwnerReferences: []metav1.OwnerReference{
				*metav1.NewControllerRef(&cronJob, batchv1.GroupVersion.WithKind("CronJob")),
			},
			Annotations: map[string]string{
				scheduledTimeAnnotation: nextRun.Format(time.RFC3339),
			},
		},
		Spec: cronJob.Spec.JobTemplate.Spec,
	}

	// 然后在集群上创建这个作业
	if err := r.Create(ctx, newJob); err != nil {
		log.Error(err, "无法创建作业")
		return ctrl.Result{}, err
	}

	log.V(0).Info("已创建新作业", "job", newJob)

	// 我们已经创建了一个新的作业,所以我们将在下一个运行时间重新排队。
	return ctrl.Result{RequeueAfter: nextRun.Sub(r.Now())}, nil
}

现在我们已经实现了 CronJobReconciler 的 Reconcile 方法,我们需要在 manager 中注册它。

我们将在 manager 中注册一个新的控制器,用于管理 CronJob 对象。

func (r *CronJobReconciler) SetupWithManager(mgr ctrl.Manager) error {
	return ctrl.NewControllerManagedBy(mgr).
		For(&batchv1.CronJob{}).
		Owns(&kbatch.Job{}).
		Complete(r)
}

这是一个复杂的任务,但现在我们有一个可工作的控制器。让我们对集群进行测试,如果没有任何问题,就部署它吧!

你之前提到过 main 吗?

但首先,记得我们说过我们会再次回到 main.go 吗?让我们来看看发生了什么变化,以及我们需要添加什么。

project/cmd/main.go
Apache 许可证

版权所有 2024 年 Kubernetes 作者。

根据 Apache 许可证 2.0 版(“许可证”)获得许可; 除非符合许可证的规定,否则您不得使用此文件。 您可以在以下网址获取许可证的副本:

http://www.apache.org/licenses/LICENSE-2.0

除非适用法律要求或书面同意,根据许可证分发的软件是基于“按原样”的基础分发的,没有任何明示或暗示的担保或条件。请查看许可证以了解其中关于权限和限制的具体规定。

Imports
package main

import (
	"crypto/tls"
	"flag"
	"os"

	// 导入所有 Kubernetes 客户端认证插件(例如 Azure、GCP、OIDC 等)
	// 以确保 exec-entrypoint 和 run 可以利用它们。
	_ "k8s.io/client-go/plugin/pkg/client/auth"

	"k8s.io/apimachinery/pkg/runtime"
	utilruntime "k8s.io/apimachinery/pkg/util/runtime"
	clientgoscheme "k8s.io/client-go/kubernetes/scheme"
	ctrl "sigs.k8s.io/controller-runtime"
	"sigs.k8s.io/controller-runtime/pkg/healthz"
	"sigs.k8s.io/controller-runtime/pkg/log/zap"
	metricsserver "sigs.k8s.io/controller-runtime/pkg/metrics/server"
	"sigs.k8s.io/controller-runtime/pkg/webhook"

	batchv1 "tutorial.kubebuilder.io/project/api/v1"
	"tutorial.kubebuilder.io/project/internal/controller"
	//+kubebuilder:scaffold:imports
)

要注意的第一个变化是,kubebuilder 已将新 API 组的包(batchv1)添加到我们的 scheme 中。 这意味着我们可以在我们的控制器中使用这些对象。

如果我们将使用任何其他 CRD,我们将不得不以相同的方式添加它们的 scheme。 诸如 Job 之类的内置类型通过 clientgoscheme 添加了它们的 scheme。

var (
	scheme   = runtime.NewScheme()
	setupLog = ctrl.Log.WithName("setup")
)

func init() {
	utilruntime.Must(clientgoscheme.AddToScheme(scheme))

	utilruntime.Must(batchv1.AddToScheme(scheme))
	//+kubebuilder:scaffold:scheme
}
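
例如(纯属示意,本教程并不需要),假设我们的控制器还要读写另一个项目定义的 CRD,就需要像下面这样把那个 API 组也注册到 scheme 中。这里展示的是修改后的 init 函数;shipv1 及其导入路径都是虚构的,实际使用时请替换为对应 CRD 的 Go API 模块:

import (
	// 虚构的第三方 API 包,仅用于示意。
	shipv1 "example.com/ship-operator/api/v1"
)

func init() {
	utilruntime.Must(clientgoscheme.AddToScheme(scheme))
	utilruntime.Must(batchv1.AddToScheme(scheme))

	// 新增:注册第三方 CRD 的 scheme,之后 manager 的 client 才能读写这些对象。
	utilruntime.Must(shipv1.AddToScheme(scheme))
	//+kubebuilder:scaffold:scheme
}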

另一个发生变化的地方是,kubebuilder 已添加了一个块,调用我们的 CronJob 控制器的 SetupWithManager 方法。

func main() {
old stuff
	var metricsAddr string
	var enableLeaderElection bool
	var probeAddr string
	var secureMetrics bool
	var enableHTTP2 bool
	flag.StringVar(&metricsAddr, "metrics-bind-address", ":8080", "The address the metric endpoint binds to.")
	flag.StringVar(&probeAddr, "health-probe-bind-address", ":8081", "The address the probe endpoint binds to.")
	flag.BoolVar(&enableLeaderElection, "leader-elect", false,
		"Enable leader election for controller manager. "+
			"Enabling this will ensure there is only one active controller manager.")
	flag.BoolVar(&secureMetrics, "metrics-secure", false,
		"If set the metrics endpoint is served securely")
	flag.BoolVar(&enableHTTP2, "enable-http2", false,
		"If set, HTTP/2 will be enabled for the metrics and webhook servers")
	opts := zap.Options{
		Development: true,
	}
	opts.BindFlags(flag.CommandLine)
	flag.Parse()

	ctrl.SetLogger(zap.New(zap.UseFlagOptions(&opts)))

	// 如果 enable-http2 标志为 false(默认值),则应禁用 http/2
	// 由于其漏洞。更具体地说,禁用 http/2 将防止受到 HTTP/2 流取消和
	// 快速重置 CVE 的影响。更多信息请参见:
	// - https://github.com/advisories/GHSA-qppj-fm5r-hxr3
	// - https://github.com/advisories/GHSA-4374-p667-p6c8
	disableHTTP2 := func(c *tls.Config) {
		setupLog.Info("disabling http/2")
		c.NextProtos = []string{"http/1.1"}
	}

	tlsOpts := []func(*tls.Config){}
	if !enableHTTP2 {
		tlsOpts = append(tlsOpts, disableHTTP2)
	}

	webhookServer := webhook.NewServer(webhook.Options{
		TLSOpts: tlsOpts,
	})

	mgr, err := ctrl.NewManager(ctrl.GetConfigOrDie(), ctrl.Options{
		Scheme: scheme,
		Metrics: metricsserver.Options{
			BindAddress:   metricsAddr,
			SecureServing: secureMetrics,
			TLSOpts:       tlsOpts,
		},
		WebhookServer:          webhookServer,
		HealthProbeBindAddress: probeAddr,
		LeaderElection:         enableLeaderElection,
		LeaderElectionID:       "80807133.tutorial.kubebuilder.io",
		// LeaderElectionReleaseOnCancel 定义了在 Manager 结束时领导者是否应主动下台。
		// 这需要二进制文件在 Manager 停止后立即结束,否则此设置是不安全的。启用它将显著
		// 加快自愿领导者过渡的速度,因为新领导者无需等待 LeaseDuration 时间。
		//
		// 在默认提供的脚手架中,程序在 Manager 停止后立即结束,因此可以启用此选项。
		// 但是,如果您正在执行或打算在 Manager 停止后执行任何操作,比如执行清理操作,
		// 那么它的使用可能是不安全的。
		// LeaderElectionReleaseOnCancel: true,
	})
	if err != nil {
		setupLog.Error(err, "unable to start manager")
		os.Exit(1)
	}
	if err = (&controller.CronJobReconciler{
		Client: mgr.GetClient(),
		Scheme: mgr.GetScheme(),
	}).SetupWithManager(mgr); err != nil {
		setupLog.Error(err, "unable to create controller", "controller", "CronJob")
		os.Exit(1)
	}
old stuff

我们还将为我们的类型设置 webhooks,接下来我们将讨论它们。 我们只需要将它们添加到 manager 中。由于我们可能希望单独运行 webhooks, 或者在本地测试控制器时不运行它们,我们将它们放在一个环境变量后面。

我们只需确保在本地运行时设置 ENABLE_WEBHOOKS=false

	if os.Getenv("ENABLE_WEBHOOKS") != "false" {
		if err = (&batchv1.CronJob{}).SetupWebhookWithManager(mgr); err != nil {
			setupLog.Error(err, "unable to create webhook", "webhook", "CronJob")
			os.Exit(1)
		}
	}
	//+kubebuilder:scaffold:builder

	if err := mgr.AddHealthzCheck("healthz", healthz.Ping); err != nil {
		setupLog.Error(err, "unable to set up health check")
		os.Exit(1)
	}
	if err := mgr.AddReadyzCheck("readyz", healthz.Ping); err != nil {
		setupLog.Error(err, "unable to set up ready check")
		os.Exit(1)
	}

	setupLog.Info("starting manager")
	if err := mgr.Start(ctrl.SetupSignalHandler()); err != nil {
		setupLog.Error(err, "problem running manager")
		os.Exit(1)
	}
}

至此,main.go 的改动就介绍完了。接下来,我们来为我们的类型实现 webhook。

实现默认值/验证 webhook

如果你想为你的 CRD 实现准入 webhook,你需要做的唯一事情就是实现 Defaulter 和(或)Validator 接口。

Kubebuilder 会为你处理其余工作,比如

  1. 创建 webhook 服务器。
  2. 确保服务器已添加到 manager 中。
  3. 为你的 webhook 创建处理程序。
  4. 在服务器中为每个处理程序注册一个路径。

首先,让我们为我们的 CRD(CronJob)生成 webhook 框架。我们需要运行以下命令,带有 --defaulting--programmatic-validation 标志(因为我们的测试项目将使用默认值和验证 webhook):

kubebuilder create webhook --group batch --version v1 --kind CronJob --defaulting --programmatic-validation

这将为你生成 webhook 函数,并在你的 main.go 中为你的 webhook 将其注册到 manager 中。

project/api/v1/cronjob_webhook.go
Apache 许可证

版权所有 2024 年 Kubernetes 作者。

根据 Apache 许可证 2.0 版进行许可; 除非符合许可证的规定,否则您不得使用此文件。 您可以在以下网址获取许可证副本:

http://www.apache.org/licenses/LICENSE-2.0

除非适用法律要求或书面同意,否则根据许可证分发的软件按“原样”分发,没有任何担保或条件,无论是明示的还是暗示的。请查看许可证以了解其中关于权限和限制的具体规定。

Go 导入
package v1

import (
	"github.com/robfig/cron"
	apierrors "k8s.io/apimachinery/pkg/api/errors"
	"k8s.io/apimachinery/pkg/runtime"
	"k8s.io/apimachinery/pkg/runtime/schema"
	validationutils "k8s.io/apimachinery/pkg/util/validation"
	"k8s.io/apimachinery/pkg/util/validation/field"
	ctrl "sigs.k8s.io/controller-runtime"
	logf "sigs.k8s.io/controller-runtime/pkg/log"
	"sigs.k8s.io/controller-runtime/pkg/webhook"
	"sigs.k8s.io/controller-runtime/pkg/webhook/admission"
)

接下来,我们为 Webhook 设置一个日志记录器。

var cronjoblog = logf.Log.WithName("cronjob-resource")

然后,我们使用管理器设置 Webhook。

// SetupWebhookWithManager 将设置管理器以管理 Webhook
func (r *CronJob) SetupWebhookWithManager(mgr ctrl.Manager) error {
	return ctrl.NewWebhookManagedBy(mgr).
		For(r).
		Complete()
}

请注意,我们使用 kubebuilder 标记生成 Webhook 清单。 此标记负责生成一个变更 Webhook 清单。

每个标记的含义可以在这里找到。

//+kubebuilder:webhook:path=/mutate-batch-tutorial-kubebuilder-io-v1-cronjob,mutating=true,failurePolicy=fail,groups=batch.tutorial.kubebuilder.io,resources=cronjobs,verbs=create;update,versions=v1,name=mcronjob.kb.io,sideEffects=None,admissionReviewVersions=v1

我们使用 webhook.Defaulter 接口为我们的 CRD 设置默认值。 将自动提供一个调用此默认值的 Webhook。

Default 方法应该改变接收器,设置默认值。

var _ webhook.Defaulter = &CronJob{}

// Default 实现了 webhook.Defaulter,因此将为该类型注册 Webhook
func (r *CronJob) Default() {
	cronjoblog.Info("默认值", "名称", r.Name)

	if r.Spec.ConcurrencyPolicy == "" {
		r.Spec.ConcurrencyPolicy = AllowConcurrent
	}
	if r.Spec.Suspend == nil {
		r.Spec.Suspend = new(bool)
	}
	if r.Spec.SuccessfulJobsHistoryLimit == nil {
		r.Spec.SuccessfulJobsHistoryLimit = new(int32)
		*r.Spec.SuccessfulJobsHistoryLimit = 3
	}
	if r.Spec.FailedJobsHistoryLimit == nil {
		r.Spec.FailedJobsHistoryLimit = new(int32)
		*r.Spec.FailedJobsHistoryLimit = 1
	}
}

此标记负责生成一个验证 Webhook 清单。

//+kubebuilder:webhook:verbs=create;update;delete,path=/validate-batch-tutorial-kubebuilder-io-v1-cronjob,mutating=false,failurePolicy=fail,groups=batch.tutorial.kubebuilder.io,resources=cronjobs,versions=v1,name=vcronjob.kb.io,sideEffects=None,admissionReviewVersions=v1

我们可以对我们的 CRD 进行超出声明性验证的验证。 通常,声明性验证应该足够了,但有时更复杂的用例需要复杂的验证。

例如,我们将在下面看到,我们使用此功能来验证格式良好的 cron 调度,而不是编写一个长正则表达式。

如果实现了 webhook.Validator 接口,将自动提供一个调用验证的 Webhook。

ValidateCreateValidateUpdateValidateDelete 方法预期在创建、更新和删除时验证其接收器。 我们将 ValidateCreateValidateUpdate 分开,以允许像使某些字段不可变这样的行为,这样它们只能在创建时设置。 我们还将 ValidateDeleteValidateUpdate 分开,以允许在删除时进行不同的验证行为。 在这里,我们只为 ValidateCreateValidateUpdate 使用相同的共享验证。在 ValidateDelete 中不执行任何操作,因为我们不需要在删除时验证任何内容。

var _ webhook.Validator = &CronJob{}

// ValidateCreate 实现了 webhook.Validator,因此将为该类型注册 Webhook
func (r *CronJob) ValidateCreate() (admission.Warnings, error) {
	cronjoblog.Info("验证创建", "名称", r.Name)

	return nil, r.validateCronJob()
}

// ValidateUpdate 实现了 webhook.Validator,因此将为该类型注册 Webhook
func (r *CronJob) ValidateUpdate(old runtime.Object) (admission.Warnings, error) {
	cronjoblog.Info("验证更新", "名称", r.Name)

	return nil, r.validateCronJob()
}
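
顺带一提,上面说到把 ValidateCreate 和 ValidateUpdate 分开可以实现“字段只能在创建时设置”之类的行为。下面是一个纯属示意的例子(本教程的 CronJob 实际上允许修改 schedule),展示如何在 ValidateUpdate 中拿旧对象和新对象做比较:

// validateImmutableSchedule 是一个虚构的校验示例,用来说明 ValidateUpdate
// 为什么会单独收到旧对象;本教程的 CronJob 并没有这条规则。
func (r *CronJob) validateImmutableSchedule(old runtime.Object) *field.Error {
	oldCronJob, ok := old.(*CronJob)
	if !ok {
		return nil
	}
	if oldCronJob.Spec.Schedule != r.Spec.Schedule {
		return field.Forbidden(
			field.NewPath("spec").Child("schedule"),
			"schedule 在创建后不可修改(仅为示例规则)")
	}
	return nil
}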

// ValidateDelete 实现了 webhook.Validator,因此将为该类型注册 Webhook
func (r *CronJob) ValidateDelete() (admission.Warnings, error) {
	cronjoblog.Info("验证删除", "名称", r.Name)

	// TODO(用户):在对象删除时填充您的验证逻辑。
	return nil, nil
}

我们验证 CronJob 的名称和规范。

func (r *CronJob) validateCronJob() error {
	var allErrs field.ErrorList
	if err := r.validateCronJobName(); err != nil {
		allErrs = append(allErrs, err)
	}
	if err := r.validateCronJobSpec(); err != nil {
		allErrs = append(allErrs, err)
	}
	if len(allErrs) == 0 {
		return nil
	}

	return apierrors.NewInvalid(
		schema.GroupKind{Group: "batch.tutorial.kubebuilder.io", Kind: "CronJob"},
		r.Name, allErrs)
}

一些字段通过 OpenAPI 模式进行声明式验证。 您可以在 API 设计部分找到 kubebuilder 验证标记(以 // +kubebuilder:validation 为前缀)。 您可以通过运行 controller-gen crd -w 来找到所有 kubebuilder 支持的用于声明式验证的标记,或者在这里找到它们。
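
下面是一个最小示意(ExampleSpec 是虚构的类型,并非本项目代码),展示这类标记直接写在字段上方的注释里,controller-gen 会把它们写进生成的 CRD 的 OpenAPI 模式:

// ExampleSpec 仅用于演示声明式验证标记的写法。
type ExampleSpec struct {
	// Cron 格式的调度表达式,不能为空字符串。
	// +kubebuilder:validation:MinLength=1
	Schedule string `json:"schedule"`

	// 保留的历史记录条数,限制在 0 到 100 之间。
	// +kubebuilder:validation:Minimum=0
	// +kubebuilder:validation:Maximum=100
	HistoryLimit int32 `json:"historyLimit,omitempty"`
}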

func (r *CronJob) validateCronJobSpec() *field.Error {
	// 来自 Kubernetes API 机制的字段助手帮助我们返回结构化良好的验证错误。
	return validateScheduleFormat(
		r.Spec.Schedule,
		field.NewPath("spec").Child("schedule"))
}

我们需要验证 cron 调度是否格式良好。

func validateScheduleFormat(schedule string, fldPath *field.Path) *field.Error {
	if _, err := cron.ParseStandard(schedule); err != nil {
		return field.Invalid(fldPath, schedule, err.Error())
	}
	return nil
}
验证对象名称

验证字符串字段的长度可以通过验证模式进行声明性验证。 但是,ObjectMeta.Name 字段是在 apimachinery 仓库的一个共享包中定义的,因此我们无法使用验证模式进行声明性验证。

func (r *CronJob) validateCronJobName() *field.Error {
	if len(r.ObjectMeta.Name) > validationutils.DNS1035LabelMaxLength-11 {
		// 与所有 Kubernetes 对象一样,作业名称的长度上限是 63 个字符(必须能放进一个 DNS 子域)。
		// cronjob 控制器在创建作业时会给 cronjob 名称追加一个 11 个字符的后缀(`-$TIMESTAMP`)。
		// 因此 cronjob 名称的长度必须不超过 63-11=52 个字符。
		// 如果不在这里校验,作业创建将在稍后失败。
		return field.Invalid(field.NewPath("metadata").Child("name"), r.Name, "必须不超过 52 个字符")
	}
	return nil
}

运行和部署控制器

可选步骤

如果选择对 API 定义进行任何更改,则在继续之前,可以使用以下命令生成清单,如自定义资源(CRs)或自定义资源定义(CRDs):

make manifests

要测试控制器,请在本地针对集群运行它。 在继续之前,我们需要安装我们的 CRDs,如快速入门中所述。这将自动使用 controller-tools 更新 YAML 清单(如果需要):

make install

现在我们已经安装了我们的 CRDs,我们可以针对集群运行控制器。这将使用我们连接到集群的任何凭据,因此我们暂时不需要担心 RBAC。

在另一个终端中运行

export ENABLE_WEBHOOKS=false
make run

您应该会看到有关控制器启动的日志,但它目前还不会执行任何操作。

此时,我们需要一个 CronJob 进行测试。让我们编写一个样本到 config/samples/batch_v1_cronjob.yaml,然后使用该样本:

apiVersion: batch.tutorial.kubebuilder.io/v1
kind: CronJob
metadata:
  labels:
    app.kubernetes.io/name: cronjob
    app.kubernetes.io/instance: cronjob-sample
    app.kubernetes.io/part-of: project
    app.kubernetes.io/managed-by: kustomize
    app.kubernetes.io/created-by: project
  name: cronjob-sample
spec:
  schedule: "*/1 * * * *"
  startingDeadlineSeconds: 60
  concurrencyPolicy: Allow # explicitly specify, but Allow is also default.
  jobTemplate:
    spec:
      template:
        spec:
          containers:
          - name: hello
            image: busybox
            args:
            - /bin/sh
            - -c
            - date; echo Hello from the Kubernetes cluster
          restartPolicy: OnFailure
  
kubectl create -f config/samples/batch_v1_cronjob.yaml

此时,您应该会看到大量活动。如果观察更改,您应该会看到您的 CronJob 正在运行,并更新状态:

kubectl get cronjob.batch.tutorial.kubebuilder.io -o yaml
kubectl get job

现在我们知道它正在运行,我们可以在集群中运行它。停止 make run 命令,并运行

make docker-build docker-push IMG=<some-registry>/<project-name>:tag
make deploy IMG=<some-registry>/<project-name>:tag

如果再次列出 CronJob,就像我们之前所做的那样,我们应该看到控制器再次正常运行!

部署 cert-manager

我们建议使用 cert-manager 为 Webhook 服务器提供证书。只要它们将证书放在所需的位置,其他解决方案也应该可以正常工作。

您可以按照 cert-manager 文档 进行安装。

cert-manager 还有一个名为 CA 注入器 的组件,负责将 CA bundle 注入到 MutatingWebhookConfiguration / ValidatingWebhookConfiguration 中。

为了实现这一点,您需要在 MutatingWebhookConfiguration / ValidatingWebhookConfiguration 对象中使用一个带有键 cert-manager.io/inject-ca-from 的注释。注释的值应该指向一个现有的 证书请求实例,格式为 <证书命名空间>/<证书名称>

这是我们用于给 MutatingWebhookConfiguration / ValidatingWebhookConfiguration 对象添加注释的 kustomize 补丁:

# 这个补丁会向准入 Webhook 配置添加注释
# CERTIFICATE_NAMESPACE 和 CERTIFICATE_NAME 将由 kustomize 替换
apiVersion: admissionregistration.k8s.io/v1
kind: MutatingWebhookConfiguration
metadata:
  labels:
    app.kubernetes.io/name: mutatingwebhookconfiguration
    app.kubernetes.io/instance: mutating-webhook-configuration
    app.kubernetes.io/component: webhook
    app.kubernetes.io/created-by: project
    app.kubernetes.io/part-of: project
    app.kubernetes.io/managed-by: kustomize
  name: mutating-webhook-configuration
  annotations:
    cert-manager.io/inject-ca-from: CERTIFICATE_NAMESPACE/CERTIFICATE_NAME
---
apiVersion: admissionregistration.k8s.io/v1
kind: ValidatingWebhookConfiguration
metadata:
  labels:
    app.kubernetes.io/name: validatingwebhookconfiguration
    app.kubernetes.io/instance: validating-webhook-configuration
    app.kubernetes.io/component: webhook
    app.kubernetes.io/created-by: project
    app.kubernetes.io/part-of: project
    app.kubernetes.io/managed-by: kustomize
  name: validating-webhook-configuration
  annotations:
    cert-manager.io/inject-ca-from: CERTIFICATE_NAMESPACE/CERTIFICATE_NAME

部署准入 Webhooks

Kind 集群

建议在 kind 集群中开发您的 Webhook,以便快速迭代。 为什么呢?

  • 您可以在本地不到 1 分钟内启动一个多节点集群。
  • 您可以在几秒钟内将其拆除。
  • 您不需要将镜像推送到远程仓库。

cert-manager

您需要按照 这里 的说明安装 cert-manager 捆绑包。

构建您的镜像

运行以下命令在本地构建您的镜像。

make docker-build docker-push IMG=<some-registry>/<project-name>:tag

如果您使用的是 kind 集群,您不需要将镜像推送到远程容器注册表。您可以直接将本地镜像加载到指定的 kind 集群中:

kind load docker-image <your-image-name>:tag --name <your-kind-cluster-name>

部署 Webhooks

您需要通过 kustomize 启用 Webhook 和 cert manager 配置。 config/default/kustomization.yaml 现在应该如下所示:

# Adds namespace to all resources.
namespace: project-system

# Value of this field is prepended to the
# names of all resources, e.g. a deployment named
# "wordpress" becomes "alices-wordpress".
# Note that it should also match with the prefix (text before '-') of the namespace
# field above.
namePrefix: project-

# Labels to add to all resources and selectors.
#labels:
#- includeSelectors: true
#  pairs:
#    someName: someValue

resources:
- ../crd
- ../rbac
- ../manager
# [WEBHOOK] To enable webhook, uncomment all the sections with [WEBHOOK] prefix including the one in
# crd/kustomization.yaml
- ../webhook
# [CERTMANAGER] To enable cert-manager, uncomment all sections with 'CERTMANAGER'. 'WEBHOOK' components are required.
- ../certmanager
# [PROMETHEUS] To enable prometheus monitor, uncomment all sections with 'PROMETHEUS'.
- ../prometheus

patches:
# Protect the /metrics endpoint by putting it behind auth.
# If you want your controller-manager to expose the /metrics
# endpoint w/o any authn/z, please comment the following line.
- path: manager_auth_proxy_patch.yaml

# [WEBHOOK] To enable webhook, uncomment all the sections with [WEBHOOK] prefix including the one in
# crd/kustomization.yaml
- path: manager_webhook_patch.yaml

# [CERTMANAGER] To enable cert-manager, uncomment all sections with 'CERTMANAGER'.
# Uncomment 'CERTMANAGER' sections in crd/kustomization.yaml to enable the CA injection in the admission webhooks.
# 'CERTMANAGER' needs to be enabled to use ca injection
- path: webhookcainjection_patch.yaml

# [CERTMANAGER] To enable cert-manager, uncomment all sections with 'CERTMANAGER' prefix.
# Uncomment the following replacements to add the cert-manager CA injection annotations
replacements:
  - source: # Add cert-manager annotation to ValidatingWebhookConfiguration, MutatingWebhookConfiguration and CRDs
      kind: Certificate
      group: cert-manager.io
      version: v1
      name: serving-cert # this name should match the one in certificate.yaml
      fieldPath: .metadata.namespace # namespace of the certificate CR
    targets:
      - select:
          kind: ValidatingWebhookConfiguration
        fieldPaths:
          - .metadata.annotations.[cert-manager.io/inject-ca-from]
        options:
          delimiter: '/'
          index: 0
          create: true
      - select:
          kind: MutatingWebhookConfiguration
        fieldPaths:
          - .metadata.annotations.[cert-manager.io/inject-ca-from]
        options:
          delimiter: '/'
          index: 0
          create: true
      - select:
          kind: CustomResourceDefinition
        fieldPaths:
          - .metadata.annotations.[cert-manager.io/inject-ca-from]
        options:
          delimiter: '/'
          index: 0
          create: true
  - source:
      kind: Certificate
      group: cert-manager.io
      version: v1
      name: serving-cert # this name should match the one in certificate.yaml
      fieldPath: .metadata.name
    targets:
      - select:
          kind: ValidatingWebhookConfiguration
        fieldPaths:
          - .metadata.annotations.[cert-manager.io/inject-ca-from]
        options:
          delimiter: '/'
          index: 1
          create: true
      - select:
          kind: MutatingWebhookConfiguration
        fieldPaths:
          - .metadata.annotations.[cert-manager.io/inject-ca-from]
        options:
          delimiter: '/'
          index: 1
          create: true
      - select:
          kind: CustomResourceDefinition
        fieldPaths:
          - .metadata.annotations.[cert-manager.io/inject-ca-from]
        options:
          delimiter: '/'
          index: 1
          create: true
  - source: # Add cert-manager annotation to the webhook Service
      kind: Service
      version: v1
      name: webhook-service
      fieldPath: .metadata.name # namespace of the service
    targets:
      - select:
          kind: Certificate
          group: cert-manager.io
          version: v1
        fieldPaths:
          - .spec.dnsNames.0
          - .spec.dnsNames.1
        options:
          delimiter: '.'
          index: 0
          create: true
  - source:
      kind: Service
      version: v1
      name: webhook-service
      fieldPath: .metadata.namespace # namespace of the service
    targets:
      - select:
          kind: Certificate
          group: cert-manager.io
          version: v1
        fieldPaths:
          - .spec.dnsNames.0
          - .spec.dnsNames.1
        options:
          delimiter: '.'
          index: 1
          create: true

config/crd/kustomization.yaml 现在应该如下所示:

# This kustomization.yaml is not intended to be run by itself,
# since it depends on service name and namespace that are out of this kustomize package.
# It should be run by config/default
resources:
- bases/batch.tutorial.kubebuilder.io_cronjobs.yaml
#+kubebuilder:scaffold:crdkustomizeresource

patches:
# [WEBHOOK] To enable webhook, uncomment all the sections with [WEBHOOK] prefix.
# patches here are for enabling the conversion webhook for each CRD
- path: patches/webhook_in_cronjobs.yaml
#+kubebuilder:scaffold:crdkustomizewebhookpatch

# [CERTMANAGER] To enable cert-manager, uncomment all the sections with [CERTMANAGER] prefix.
# patches here are for enabling the CA injection for each CRD
- path: patches/cainjection_in_cronjobs.yaml
#+kubebuilder:scaffold:crdkustomizecainjectionpatch

# [WEBHOOK] To enable webhook, uncomment the following section
# the following config is for teaching kustomize how to do kustomization for CRDs.

configurations:
- kustomizeconfig.yaml

现在您可以通过以下命令将其部署到集群中:

make deploy IMG=<some-registry>/<project-name>:tag

等待一段时间,直到 Webhook Pod 启动并证书被提供。通常在 1 分钟内完成。

现在您可以创建一个有效的 CronJob 来测试您的 Webhooks。创建应该成功通过。

kubectl create -f config/samples/batch_v1_cronjob.yaml

您还可以尝试创建一个无效的 CronJob(例如,使用格式不正确的 schedule 字段)。您应该看到创建失败并带有验证错误。

编写控制器测试

测试 Kubernetes 控制器是一个庞大的主题,而 kubebuilder 为您生成的样板测试文件相对较少。

为了引导您了解 Kubebuilder 生成的控制器的集成测试模式,我们将回顾我们在第一个教程中构建的 CronJob,并为其编写一个简单的测试。

基本方法是,在生成的 suite_test.go 文件中,您将使用 envtest 创建一个本地 Kubernetes API 服务器,实例化和运行您的控制器,然后编写额外的 *_test.go 文件使用 Ginkgo 进行测试。

如果您想调整您的 envtest 集群的配置,请参阅 为集成测试配置 envtest 部分以及 envtest 文档

测试环境设置

../../cronjob-tutorial/testdata/project/internal/controller/suite_test.go
Apache License

版权所有 2024 年 Kubernetes 作者。

根据 Apache 许可证 2.0 版(“许可证”)许可; 除非符合许可证的规定,否则您不得使用此文件。 您可以在以下网址获取许可证的副本:

http://www.apache.org/licenses/LICENSE-2.0

除非适用法律要求或经书面同意,否则根据许可证分发的软件按“原样”提供,不附带任何担保或条件,无论是明示的还是暗示的。请查看许可证以了解其中关于权限和限制的具体规定。

Imports

当我们在上一章中使用 kubebuilder create api 创建 CronJob API 时,Kubebuilder 已经为您做了一些测试工作。 Kubebuilder 生成了一个 internal/controller/suite_test.go 文件,其中包含了设置测试环境的基本内容。

首先,它将包含必要的导入项。

package controller

// 这些测试使用 Ginkgo(BDD 风格的 Go 测试框架)。请参考
// http://onsi.github.io/ginkgo/ 了解更多关于 Ginkgo 的信息。

现在,让我们来看一下生成的代码。

var (
    cfg       *rest.Config
    k8sClient client.Client // 您将在测试中使用此客户端。
    testEnv   *envtest.Environment
    ctx       context.Context
    cancel    context.CancelFunc
)

func TestControllers(t *testing.T) {
    RegisterFailHandler(Fail)

    RunSpecs(t, "Controller Suite")
}

var _ = BeforeSuite(func() {
    // 省略了一些设置代码
})
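
被省略的设置代码大致会做这些事:启动 envtest(本地的 etcd + kube-apiserver)、把我们的 API 注册到 scheme、创建测试客户端,并在后台启动 manager。下面是一个删节后的示意,仅供参考;具体细节(路径、导入的 filepath、envtest、logf、zap 等)以你项目中实际生成的 suite_test.go 为准,可能随 Kubebuilder 版本不同而变化:

var _ = BeforeSuite(func() {
    logf.SetLogger(zap.New(zap.WriteTo(GinkgoWriter), zap.UseDevMode(true)))

    ctx, cancel = context.WithCancel(context.TODO())

    // 启动 envtest,并让它加载我们生成的 CRD。
    testEnv = &envtest.Environment{
        CRDDirectoryPaths:     []string{filepath.Join("..", "..", "config", "crd", "bases")},
        ErrorIfCRDPathMissing: true,
    }

    var err error
    cfg, err = testEnv.Start()
    Expect(err).NotTo(HaveOccurred())

    // 注册我们的 API 类型,这样 client 才能识别 CronJob。
    Expect(batchv1.AddToScheme(scheme.Scheme)).To(Succeed())

    // 创建测试中使用的客户端。
    k8sClient, err = client.New(cfg, client.Options{Scheme: scheme.Scheme})
    Expect(err).NotTo(HaveOccurred())

    // 创建 manager、注册控制器,并在后台 goroutine 中运行它。
    k8sManager, err := ctrl.NewManager(cfg, ctrl.Options{Scheme: scheme.Scheme})
    Expect(err).NotTo(HaveOccurred())

    Expect((&CronJobReconciler{
        Client: k8sManager.GetClient(),
        Scheme: k8sManager.GetScheme(),
    }).SetupWithManager(k8sManager)).To(Succeed())

    go func() {
        defer GinkgoRecover()
        Expect(k8sManager.Start(ctx)).To(Succeed())
    }()
})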

Kubebuilder 还生成了用于清理 envtest 并在控制器目录中实际运行测试文件的样板函数。 您不需要修改这些函数。

var _ = AfterSuite(func() {
    // 省略了一些清理代码
})

现在,您的控制器在测试集群上运行,并且已准备好在您的 CronJob 上执行操作的客户端,我们可以开始编写集成测试了!

测试控制器行为

../../cronjob-tutorial/testdata/project/internal/controller/cronjob_controller_test.go
Apache License

根据 Apache 许可证 2.0 版(“许可证”)许可; 除非符合许可证的规定,否则您不得使用此文件。 您可以在以下网址获取许可证的副本:

http://www.apache.org/licenses/LICENSE-2.0

除非适用法律要求或经书面同意,根据许可证分发的软件按“原样”提供,不附带任何担保或条件,无论是明示的还是暗示的。请查看许可证以了解其中关于权限和限制的具体规定。

理想情况下,对于每个在 suite_test.go 中调用的控制器,我们应该有一个 <kind>_controller_test.go。 因此,让我们为 CronJob 控制器编写示例测试(cronjob_controller_test.go)。

Imports

和往常一样,我们从必要的导入项开始。我们还定义了一些实用变量。

package controller

import (
	"context"
	"reflect"
	"time"

	batchv1 "k8s.io/api/batch/v1"
	v1 "k8s.io/api/core/v1"
	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
	"k8s.io/apimachinery/pkg/types"

	cronjobv1 "tutorial.kubebuilder.io/project/api/v1"
)

编写简单集成测试的第一步是实际创建一个 CronJob 实例,以便对其运行测试。 请注意,要创建 CronJob,您需要创建一个包含您的 CronJob 规范的存根 CronJob 结构。

请注意,当我们创建存根 CronJob 时,CronJob 还需要其所需的下游对象的存根。 如果没有下游的存根 Job 模板规范和下游的 Pod 模板规范,Kubernetes API 将无法创建 CronJob。

var _ = Describe("CronJob controller", func() {

    // 为对象名称和测试超时/持续时间和间隔定义实用常量。
    const (
        CronjobName      = "test-cronjob"
        CronjobNamespace = "default"
        JobName          = "test-job"

        timeout  = time.Second * 10
        duration = time.Second * 10
        interval = time.Millisecond * 250
    )

    Context("当更新 CronJob 状态时", func() {
        It("当创建新的 Job 时,应增加 CronJob 的 Status.Active 计数", func() {
            By("创建一个新的 CronJob")
            ctx := context.Background()
            cronJob := &cronjobv1.CronJob{
                TypeMeta: metav1.TypeMeta{
                    APIVersion: "batch.tutorial.kubebuilder.io/v1",
                    Kind:       "CronJob",
                },
                ObjectMeta: metav1.ObjectMeta{
                    Name:      CronjobName,
                    Namespace: CronjobNamespace,
                },
                Spec: cronjobv1.CronJobSpec{
                    Schedule: "1 * * * *",
                    JobTemplate: batchv1.JobTemplateSpec{
                        Spec: batchv1.JobSpec{
                            // 为简单起见,我们只填写了必填字段。
                            Template: v1.PodTemplateSpec{
                                Spec: v1.PodSpec{
                                    // 为简单起见,我们只填写了必填字段。
                                    Containers: []v1.Container{
                                        {
                                            Name:  "test-container",
                                            Image: "test-image",
                                        },
                                    },
                                    RestartPolicy: v1.RestartPolicyOnFailure,
                                },
                            },
                        },
                    },
                },
            }
            Expect(k8sClient.Create(ctx, cronJob)).Should(Succeed())

           

创建完这个 CronJob 后,让我们检查 CronJob 的 Spec 字段是否与我们传入的值匹配。 请注意,由于 k8s apiserver 在我们之前的 Create() 调用后可能尚未完成创建 CronJob,我们将使用 Gomega 的 Eventually() 测试函数,而不是 Expect(),以便让 apiserver 有机会完成创建我们的 CronJob。

Eventually() 将重复运行作为参数提供的函数,直到 (a) 函数的输出与随后的 Should() 调用中的预期值匹配,或者 (b) 尝试次数 * 间隔时间超过提供的超时值。

在下面的示例中,timeout 和 interval 是我们选择的 Go Duration 值。

            cronjobLookupKey := types.NamespacedName{Name: CronjobName, Namespace: CronjobNamespace}
            createdCronjob := &cronjobv1.CronJob{}

            // 我们需要重试获取这个新创建的 CronJob,因为创建可能不会立即发生。
            Eventually(func() bool {
                err := k8sClient.Get(ctx, cronjobLookupKey, createdCronjob)
                return err == nil
            }, timeout, interval).Should(BeTrue())
            // 让我们确保我们的 Schedule 字符串值被正确转换/处理。
            Expect(createdCronjob.Spec.Schedule).Should(Equal("1 * * * *"))
           

现在我们在测试集群中创建了一个 CronJob,下一步是编写一个测试,实际测试我们的 CronJob 控制器的行为。 让我们测试负责更新 CronJob.Status.Active 以包含正在运行的 Job 的 CronJob 控制器逻辑。 我们将验证当 CronJob 有一个活动的下游 Job 时,其 CronJob.Status.Active 字段包含对该 Job 的引用。

首先,我们应该获取之前创建的测试 CronJob,并验证它当前是否没有任何活动的 Job。 我们在这里使用 Gomega 的 Consistently() 检查,以确保在一段时间内活动的 Job 计数保持为 0。

            By("检查 CronJob 是否没有活动的 Jobs")
            Consistently(func() (int, error) {
                err := k8sClient.Get(ctx, cronjobLookupKey, createdCronjob)
                if err != nil {
                    return -1, err
                }
                return len(createdCronjob.Status.Active), nil
            }, duration, interval).Should(Equal(0))
           
接下来,我们实际创建一个属于我们的 CronJob 的存根 Job,以及其下游模板规范。
我们将 Job 状态中的 "Active" 计数设置为 2,以模拟该 Job 正在运行两个 Pod,也就是说该 Job 处于活动运行状态。

然后,我们获取存根 Job,并将其所有者引用设置为指向我们的测试 CronJob。
这确保测试 Job 属于我们的测试 CronJob,并由其跟踪。

完成后,我们创建我们的新 Job 实例。

            By("创建一个新的 Job")
            testJob := &batchv1.Job{
                ObjectMeta: metav1.ObjectMeta{
                    Name:      JobName,
                    Namespace: CronjobNamespace,
                },
                Spec: batchv1.JobSpec{
                    Template: v1.PodTemplateSpec{
                        Spec: v1.PodSpec{
                            // 为简单起见,我们只填写了必填字段。
                            Containers: []v1.Container{
                                {
                                    Name:  "test-container",
                                    Image: "test-image",
                                },
                            },
                            RestartPolicy: v1.RestartPolicyOnFailure,
                        },
                    },
                },
                Status: batchv1.JobStatus{
                    Active: 2,
                },
            }

            // 请注意,设置此所有者引用需要您的 CronJob 的 GroupVersionKind。
            kind := reflect.TypeOf(cronjobv1.CronJob{}).Name()
            gvk := cronjobv1.GroupVersion.WithKind(kind)

            controllerRef := metav1.NewControllerRef(createdCronjob, gvk)
            testJob.SetOwnerReferences([]metav1.OwnerReference{*controllerRef})
            Expect(k8sClient.Create(ctx, testJob)).Should(Succeed())
           
将此 Job 添加到我们的测试 CronJob 应该触发我们控制器的协调逻辑。

之后,我们可以编写一个测试,评估我们的控制器是否最终按预期更新我们的 CronJob 的 Status 字段!

            By("检查 CronJob 是否有一个活动的 Job")
            Eventually(func() ([]string, error) {
                err := k8sClient.Get(ctx, cronjobLookupKey, createdCronjob)
                if err != nil {
                    return nil, err
                }

                names := []string{}
                for _, job := range createdCronjob.Status.Active {
                    names = append(names, job.Name)
                }
                return names, nil
            }, timeout, interval).Should(ConsistOf(JobName), "应在状态的活动作业列表中列出我们的活动作业 %s", JobName)
        })
    })

})

编写完所有这些代码后,您可以再次在您的 controllers/ 目录中运行 go test ./... 来运行您的新测试!

上面的状态更新示例演示了一种针对带有下游对象的自定义 Kind 的通用测试策略。希望到目前为止,您已经学会了以下测试控制器行为的方法:

  • 设置您的控制器在 envtest 集群上运行
  • 编写用于创建测试对象的存根
  • 隔离对象的更改以测试特定的控制器行为

高级示例

有更复杂的示例使用 envtest 严格测试控制器行为。示例包括:

  • Azure Databricks Operator:可以查看他们完整成熟的 suite_test.go,以及同一目录下的各个 *_test.go 文件(例如这个)。

到目前为止,我们已经实现了一个相当全面的 CronJob 控制器,充分利用了 Kubebuilder 的大多数功能,并使用 envtest 为控制器编写了测试。

如果您想了解更多内容,请前往多版本教程,了解如何向项目添加新的 API 版本。

此外,您还可以自行尝试以下步骤(我们很快会在教程中介绍这些内容):

  • 为自定义资源添加额外的打印列,以改善 kubectl get 的输出显示。


Tutorial: Multi-Version API

Most projects start out with an alpha API that changes release to release. However, eventually, most projects will need to move to a more stable API. Once your API is stable though, you can’t make breaking changes to it. That’s where API versions come into play.

Let’s make some changes to the CronJob API spec and make sure all the different versions are supported by our CronJob project.

If you haven’t already, make sure you’ve gone through the base CronJob Tutorial.

Next, let’s figure out what changes we want to make…

Changing things up

A fairly common change in a Kubernetes API is to take some data that used to be unstructured or stored in some special string format, and change it to structured data. Our schedule field fits the bill quite nicely for this – right now, in v1, our schedules look like

schedule: "*/1 * * * *"

That’s a pretty textbook example of a special string format (it’s also pretty unreadable unless you’re a Unix sysadmin).

Let’s make it a bit more structured. According to our CronJob code, we support “standard” Cron format.

In Kubernetes, all versions must be safely round-tripable through each other. This means that if we convert from version 1 to version 2, and then back to version 1, we must not lose information. Thus, any change we make to our API must be compatible with whatever we supported in v1, and also need to make sure anything we add in v2 is supported in v1. In some cases, this means we need to add new fields to v1, but in our case, we won’t have to, since we’re not adding new functionality.

Keeping all that in mind, let’s convert our example above to be slightly more structured:

schedule:
  minute: */1

Now, at least, we’ve got labels for each of our fields, but we can still easily support all the different syntax for each field.

We’ll need a new API version for this change. Let’s call it v2:

kubebuilder create api --group batch --version v2 --kind CronJob

Press y for “Create Resource” and n for “Create Controller”.

Now, let’s copy over our existing types, and make the change:

project/api/v2/cronjob_types.go
Apache License

Copyright 2023 The Kubernetes authors.

Licensed under the Apache License, Version 2.0 (the “License”); you may not use this file except in compliance with the License. You may obtain a copy of the License at

http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an “AS IS” BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License.

Since we’re in a v2 package, controller-gen will assume this is for the v2 version automatically. We could override that with the +versionName marker.

package v2
Imports
import (
	batchv1 "k8s.io/api/batch/v1"
	corev1 "k8s.io/api/core/v1"
	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
)

// EDIT THIS FILE!  THIS IS SCAFFOLDING FOR YOU TO OWN!
// NOTE: json tags are required.  Any new fields you add must have json tags for the fields to be serialized.

We’ll leave our spec largely unchanged, except to change the schedule field to a new type.

// CronJobSpec defines the desired state of CronJob
type CronJobSpec struct {
	// The schedule in Cron format, see https://en.wikipedia.org/wiki/Cron.
	Schedule CronSchedule `json:"schedule"`
The rest of Spec
	// +kubebuilder:validation:Minimum=0

	// Optional deadline in seconds for starting the job if it misses scheduled
	// time for any reason.  Missed jobs executions will be counted as failed ones.
	// +optional
	StartingDeadlineSeconds *int64 `json:"startingDeadlineSeconds,omitempty"`

	// Specifies how to treat concurrent executions of a Job.
	// Valid values are:
	// - "Allow" (default): allows CronJobs to run concurrently;
	// - "Forbid": forbids concurrent runs, skipping next run if previous run hasn't finished yet;
	// - "Replace": cancels currently running job and replaces it with a new one
	// +optional
	ConcurrencyPolicy ConcurrencyPolicy `json:"concurrencyPolicy,omitempty"`

	// This flag tells the controller to suspend subsequent executions, it does
	// not apply to already started executions.  Defaults to false.
	// +optional
	Suspend *bool `json:"suspend,omitempty"`

	// Specifies the job that will be created when executing a CronJob.
	JobTemplate batchv1.JobTemplateSpec `json:"jobTemplate"`

	// +kubebuilder:validation:Minimum=0

	// The number of successful finished jobs to retain.
	// This is a pointer to distinguish between explicit zero and not specified.
	// +optional
	SuccessfulJobsHistoryLimit *int32 `json:"successfulJobsHistoryLimit,omitempty"`

	// +kubebuilder:validation:Minimum=0

	// The number of failed finished jobs to retain.
	// This is a pointer to distinguish between explicit zero and not specified.
	// +optional
	FailedJobsHistoryLimit *int32 `json:"failedJobsHistoryLimit,omitempty"`
}

Next, we’ll need to define a type to hold our schedule. Based on our proposed YAML above, it’ll have a field for each corresponding Cron “field”.

// describes a Cron schedule.
type CronSchedule struct {
	// specifies the minute during which the job executes.
	// +optional
	Minute *CronField `json:"minute,omitempty"`
	// specifies the hour during which the job executes.
	// +optional
	Hour *CronField `json:"hour,omitempty"`
	// specifies the day of the month during which the job executes.
	// +optional
	DayOfMonth *CronField `json:"dayOfMonth,omitempty"`
	// specifies the month during which the job executes.
	// +optional
	Month *CronField `json:"month,omitempty"`
	// specifies the day of the week during which the job executes.
	// +optional
	DayOfWeek *CronField `json:"dayOfWeek,omitempty"`
}

Finally, we’ll define a wrapper type to represent a field. We could attach additional validation to this field, but for now we’ll just use it for documentation purposes.

// represents a Cron field specifier.
type CronField string
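
If we did want to attach validation later, a declarative marker on a field type would be enough. As a purely illustrative sketch (this type is not part of the tutorial), a pattern-restricted variant could look like:

// ValidatedCronField is a hypothetical variant of CronField that only accepts
// characters commonly found in standard Cron field specifiers.
// +kubebuilder:validation:Pattern=`^[0-9A-Za-z*,/?\-]+$`
type ValidatedCronField string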
Other Types

All the other types will stay the same as before.

// ConcurrencyPolicy describes how the job will be handled.
// Only one of the following concurrent policies may be specified.
// If none of the following policies is specified, the default one
// is AllowConcurrent.
// +kubebuilder:validation:Enum=Allow;Forbid;Replace
type ConcurrencyPolicy string

const (
	// AllowConcurrent allows CronJobs to run concurrently.
	AllowConcurrent ConcurrencyPolicy = "Allow"

	// ForbidConcurrent forbids concurrent runs, skipping next run if previous
	// hasn't finished yet.
	ForbidConcurrent ConcurrencyPolicy = "Forbid"

	// ReplaceConcurrent cancels currently running job and replaces it with a new one.
	ReplaceConcurrent ConcurrencyPolicy = "Replace"
)

// CronJobStatus defines the observed state of CronJob
type CronJobStatus struct {
	// INSERT ADDITIONAL STATUS FIELD - define observed state of cluster
	// Important: Run "make" to regenerate code after modifying this file

	// A list of pointers to currently running jobs.
	// +optional
	Active []corev1.ObjectReference `json:"active,omitempty"`

	// Information when was the last time the job was successfully scheduled.
	// +optional
	LastScheduleTime *metav1.Time `json:"lastScheduleTime,omitempty"`
}

//+kubebuilder:object:root=true
//+kubebuilder:subresource:status

// CronJob is the Schema for the cronjobs API
type CronJob struct {
	metav1.TypeMeta   `json:",inline"`
	metav1.ObjectMeta `json:"metadata,omitempty"`

	Spec   CronJobSpec   `json:"spec,omitempty"`
	Status CronJobStatus `json:"status,omitempty"`
}

//+kubebuilder:object:root=true

// CronJobList contains a list of CronJob
type CronJobList struct {
	metav1.TypeMeta `json:",inline"`
	metav1.ListMeta `json:"metadata,omitempty"`
	Items           []CronJob `json:"items"`
}

func init() {
	SchemeBuilder.Register(&CronJob{}, &CronJobList{})
}

Storage Versions

project/api/v1/cronjob_types.go
Apache License

Copyright 2023 The Kubernetes authors.

Licensed under the Apache License, Version 2.0 (the “License”); you may not use this file except in compliance with the License. You may obtain a copy of the License at

http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an “AS IS” BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License.

package v1
Imports
import (
	batchv1 "k8s.io/api/batch/v1"
	corev1 "k8s.io/api/core/v1"
	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
)

// EDIT THIS FILE!  THIS IS SCAFFOLDING FOR YOU TO OWN!
// NOTE: json tags are required.  Any new fields you add must have json tags for the fields to be serialized.
old stuff
// CronJobSpec defines the desired state of CronJob
type CronJobSpec struct {
	// +kubebuilder:validation:MinLength=0

	// The schedule in Cron format, see https://en.wikipedia.org/wiki/Cron.
	Schedule string `json:"schedule"`

	// +kubebuilder:validation:Minimum=0

	// Optional deadline in seconds for starting the job if it misses scheduled
	// time for any reason.  Missed jobs executions will be counted as failed ones.
	// +optional
	StartingDeadlineSeconds *int64 `json:"startingDeadlineSeconds,omitempty"`

	// Specifies how to treat concurrent executions of a Job.
	// Valid values are:
	// - "Allow" (default): allows CronJobs to run concurrently;
	// - "Forbid": forbids concurrent runs, skipping next run if previous run hasn't finished yet;
	// - "Replace": cancels currently running job and replaces it with a new one
	// +optional
	ConcurrencyPolicy ConcurrencyPolicy `json:"concurrencyPolicy,omitempty"`

	// This flag tells the controller to suspend subsequent executions, it does
	// not apply to already started executions.  Defaults to false.
	// +optional
	Suspend *bool `json:"suspend,omitempty"`

	// Specifies the job that will be created when executing a CronJob.
	JobTemplate batchv1.JobTemplateSpec `json:"jobTemplate"`

	// +kubebuilder:validation:Minimum=0

	// The number of successful finished jobs to retain.
	// This is a pointer to distinguish between explicit zero and not specified.
	// +optional
	SuccessfulJobsHistoryLimit *int32 `json:"successfulJobsHistoryLimit,omitempty"`

	// +kubebuilder:validation:Minimum=0

	// The number of failed finished jobs to retain.
	// This is a pointer to distinguish between explicit zero and not specified.
	// +optional
	FailedJobsHistoryLimit *int32 `json:"failedJobsHistoryLimit,omitempty"`
}

// ConcurrencyPolicy describes how the job will be handled.
// Only one of the following concurrent policies may be specified.
// If none of the following policies is specified, the default one
// is AllowConcurrent.
// +kubebuilder:validation:Enum=Allow;Forbid;Replace
type ConcurrencyPolicy string

const (
	// AllowConcurrent allows CronJobs to run concurrently.
	AllowConcurrent ConcurrencyPolicy = "Allow"

	// ForbidConcurrent forbids concurrent runs, skipping next run if previous
	// hasn't finished yet.
	ForbidConcurrent ConcurrencyPolicy = "Forbid"

	// ReplaceConcurrent cancels currently running job and replaces it with a new one.
	ReplaceConcurrent ConcurrencyPolicy = "Replace"
)

// CronJobStatus defines the observed state of CronJob
type CronJobStatus struct {
	// INSERT ADDITIONAL STATUS FIELD - define observed state of cluster
	// Important: Run "make" to regenerate code after modifying this file

	// A list of pointers to currently running jobs.
	// +optional
	Active []corev1.ObjectReference `json:"active,omitempty"`

	// Information when was the last time the job was successfully scheduled.
	// +optional
	LastScheduleTime *metav1.Time `json:"lastScheduleTime,omitempty"`
}

Since we’ll have more than one version, we’ll need to mark a storage version. This is the version that the Kubernetes API server uses to store our data. We’ll choose the v1 version for our project.

We’ll use the +kubebuilder:storageversion to do this.

Note that multiple versions may exist in storage if they were written before the storage version changes – changing the storage version only affects how objects are created/updated after the change.

//+kubebuilder:object:root=true
//+kubebuilder:subresource:status
//+kubebuilder:storageversion

// CronJob is the Schema for the cronjobs API
type CronJob struct {
	metav1.TypeMeta   `json:",inline"`
	metav1.ObjectMeta `json:"metadata,omitempty"`

	Spec   CronJobSpec   `json:"spec,omitempty"`
	Status CronJobStatus `json:"status,omitempty"`
}
old stuff
//+kubebuilder:object:root=true

// CronJobList contains a list of CronJob
type CronJobList struct {
	metav1.TypeMeta `json:",inline"`
	metav1.ListMeta `json:"metadata,omitempty"`
	Items           []CronJob `json:"items"`
}

func init() {
	SchemeBuilder.Register(&CronJob{}, &CronJobList{})
}

Now that we’ve got our types in place, we’ll need to set up conversion…

Hubs, spokes, and other wheel metaphors

Since we now have two different versions, and users can request either version, we’ll have to define a way to convert between our version. For CRDs, this is done using a webhook, similar to the defaulting and validating webhooks we defined in the base tutorial. Like before, controller-runtime will help us wire together the nitty-gritty bits, we just have to implement the actual conversion.

Before we do that, though, we’ll need to understand how controller-runtime thinks about versions. Namely:

Complete graphs are insufficiently nautical

A simple approach to defining conversion might be to define conversion functions to convert between each of our versions. Then, whenever we need to convert, we’d look up the appropriate function, and call it to run the conversion.

This works fine when we just have two versions, but what if we had 4 types? 8 types? That’d be a lot of conversion functions.

Instead, controller-runtime models conversion in terms of a “hub and spoke” model – we mark one version as the “hub”, and all other versions just define conversion to and from the hub:

(Diagram: a fully connected graph of pairwise conversions becomes a hub-and-spoke graph.)

Then, if we have to convert between two non-hub versions, we first convert to the hub version, and then to our desired version:

This cuts down on the number of conversion functions that we have to define, and is modeled off of what Kubernetes does internally.

What does that have to do with Webhooks?

When API clients, like kubectl or your controller, request a particular version of your resource, the Kubernetes API server needs to return a result that’s of that version. However, that version might not match the version stored by the API server.

In that case, the API server needs to know how to convert between the desired version and the stored version. Since the conversions aren’t built in for CRDs, the Kubernetes API server calls out to a webhook to do the conversion instead. For Kubebuilder, this webhook is implemented by controller-runtime, and performs the hub-and-spoke conversions that we discussed above.

Now that we have the model for conversion down pat, we can actually implement our conversions.

Implementing conversion

With our model for conversion in place, it’s time to actually implement the conversion functions. We’ll put them in a file called cronjob_conversion.go next to our cronjob_types.go file, to avoid cluttering up our main types file with extra functions.

Hub…

First, we’ll implement the hub. We’ll choose the v1 version as the hub:

project/api/v1/cronjob_conversion.go
Apache License

Licensed under the Apache License, Version 2.0 (the “License”); you may not use this file except in compliance with the License. You may obtain a copy of the License at

http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an “AS IS” BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License.

package v1

Implementing the hub method is pretty easy – we just have to add an empty method called Hub() to serve as a marker. We could also just put this inline in our cronjob_types.go file.

// Hub marks this type as a conversion hub.
func (*CronJob) Hub() {}

… and Spokes

Then, we’ll implement our spoke, the v2 version:

project/api/v2/cronjob_conversion.go
Apache License

Licensed under the Apache License, Version 2.0 (the “License”); you may not use this file except in compliance with the License. You may obtain a copy of the License at

http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an “AS IS” BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License.

package v2
Imports

For imports, we’ll need the controller-runtime conversion package, plus the API version for our hub type (v1), and finally some of the standard packages.

import (
	"fmt"
	"strings"

	"sigs.k8s.io/controller-runtime/pkg/conversion"

	"tutorial.kubebuilder.io/project/api/v1"
)

Our “spoke” versions need to implement the Convertible interface. Namely, they’ll need ConvertTo and ConvertFrom methods to convert to/from the hub version.

ConvertTo is expected to modify its argument to contain the converted object. Most of the conversion is straightforward copying, except for converting our changed field.

// ConvertTo converts this CronJob to the Hub version (v1).
func (src *CronJob) ConvertTo(dstRaw conversion.Hub) error {
	dst := dstRaw.(*v1.CronJob)

	sched := src.Spec.Schedule
	scheduleParts := []string{"*", "*", "*", "*", "*"}
	if sched.Minute != nil {
		scheduleParts[0] = string(*sched.Minute)
	}
	if sched.Hour != nil {
		scheduleParts[1] = string(*sched.Hour)
	}
	if sched.DayOfMonth != nil {
		scheduleParts[2] = string(*sched.DayOfMonth)
	}
	if sched.Month != nil {
		scheduleParts[3] = string(*sched.Month)
	}
	if sched.DayOfWeek != nil {
		scheduleParts[4] = string(*sched.DayOfWeek)
	}
	dst.Spec.Schedule = strings.Join(scheduleParts, " ")
rote conversion

The rest of the conversion is pretty rote.

	// ObjectMeta
	dst.ObjectMeta = src.ObjectMeta

	// Spec
	dst.Spec.StartingDeadlineSeconds = src.Spec.StartingDeadlineSeconds
	dst.Spec.ConcurrencyPolicy = v1.ConcurrencyPolicy(src.Spec.ConcurrencyPolicy)
	dst.Spec.Suspend = src.Spec.Suspend
	dst.Spec.JobTemplate = src.Spec.JobTemplate
	dst.Spec.SuccessfulJobsHistoryLimit = src.Spec.SuccessfulJobsHistoryLimit
	dst.Spec.FailedJobsHistoryLimit = src.Spec.FailedJobsHistoryLimit

	// Status
	dst.Status.Active = src.Status.Active
	dst.Status.LastScheduleTime = src.Status.LastScheduleTime
	return nil
}

ConvertFrom is expected to modify its receiver to contain the converted object. Most of the conversion is straightforward copying, except for converting our changed field.

// ConvertFrom converts from the Hub version (v1) to this version.
func (dst *CronJob) ConvertFrom(srcRaw conversion.Hub) error {
	src := srcRaw.(*v1.CronJob)

	schedParts := strings.Split(src.Spec.Schedule, " ")
	if len(schedParts) != 5 {
		return fmt.Errorf("invalid schedule: not a standard 5-field schedule")
	}
	partIfNeeded := func(raw string) *CronField {
		if raw == "*" {
			return nil
		}
		part := CronField(raw)
		return &part
	}
	dst.Spec.Schedule.Minute = partIfNeeded(schedParts[0])
	dst.Spec.Schedule.Hour = partIfNeeded(schedParts[1])
	dst.Spec.Schedule.DayOfMonth = partIfNeeded(schedParts[2])
	dst.Spec.Schedule.Month = partIfNeeded(schedParts[3])
	dst.Spec.Schedule.DayOfWeek = partIfNeeded(schedParts[4])
rote conversion

The rest of the conversion is pretty rote.

	// ObjectMeta
	dst.ObjectMeta = src.ObjectMeta

	// Spec
	dst.Spec.StartingDeadlineSeconds = src.Spec.StartingDeadlineSeconds
	dst.Spec.ConcurrencyPolicy = ConcurrencyPolicy(src.Spec.ConcurrencyPolicy)
	dst.Spec.Suspend = src.Spec.Suspend
	dst.Spec.JobTemplate = src.Spec.JobTemplate
	dst.Spec.SuccessfulJobsHistoryLimit = src.Spec.SuccessfulJobsHistoryLimit
	dst.Spec.FailedJobsHistoryLimit = src.Spec.FailedJobsHistoryLimit

	// Status
	dst.Status.Active = src.Status.Active
	dst.Status.LastScheduleTime = src.Status.LastScheduleTime
	return nil
}
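
To make the earlier round-trip requirement concrete, here is a small sanity check (not part of the scaffold) that exercises the two methods above from within package v2; it relies only on the types and the fmt and v1 imports already shown in this file:

// roundTripCheck verifies that a v2 schedule survives conversion to the v1 hub
// and back. It is illustrative only and not part of the generated project.
func roundTripCheck() error {
	minute := CronField("*/5")
	src := &CronJob{Spec: CronJobSpec{Schedule: CronSchedule{Minute: &minute}}}

	var hub v1.CronJob
	if err := src.ConvertTo(&hub); err != nil {
		return err
	}
	// hub.Spec.Schedule is now the flat string "*/5 * * * *".

	var dst CronJob
	if err := dst.ConvertFrom(&hub); err != nil {
		return err
	}
	if dst.Spec.Schedule.Minute == nil || *dst.Spec.Schedule.Minute != minute {
		return fmt.Errorf("round trip lost the minute field")
	}
	return nil
}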

Now that we’ve got our conversions in place, all that we need to do is wire up our main to serve the webhook!

Setting up the webhooks

Our conversion is in place, so all that’s left is to tell controller-runtime about our conversion.

Normally, we’d run

kubebuilder create webhook --group batch --version v1 --kind CronJob --conversion

to scaffold out the webhook setup. However, we’ve already got webhook setup, from when we built our defaulting and validating webhooks!

Webhook setup…

project/api/v1/cronjob_webhook.go
Apache License

Copyright 2023 The Kubernetes authors.

Licensed under the Apache License, Version 2.0 (the “License”); you may not use this file except in compliance with the License. You may obtain a copy of the License at

http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an “AS IS” BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License.

Go imports
package v1

import (
	"github.com/robfig/cron"
	apierrors "k8s.io/apimachinery/pkg/api/errors"
	"k8s.io/apimachinery/pkg/runtime"
	"k8s.io/apimachinery/pkg/runtime/schema"
	validationutils "k8s.io/apimachinery/pkg/util/validation"
	"k8s.io/apimachinery/pkg/util/validation/field"
	ctrl "sigs.k8s.io/controller-runtime"
	logf "sigs.k8s.io/controller-runtime/pkg/log"
	"sigs.k8s.io/controller-runtime/pkg/webhook"
)
var cronjoblog = logf.Log.WithName("cronjob-resource")

This setup doubles as setup for our conversion webhooks: as long as our types implement the Hub and Convertible interfaces, a conversion webhook will be registered.

func (r *CronJob) SetupWebhookWithManager(mgr ctrl.Manager) error {
	return ctrl.NewWebhookManagedBy(mgr).
		For(r).
		Complete()
}
Existing Defaulting and Validation
// +kubebuilder:webhook:path=/mutate-batch-tutorial-kubebuilder-io-v1-cronjob,mutating=true,failurePolicy=fail,groups=batch.tutorial.kubebuilder.io,resources=cronjobs,verbs=create;update,versions=v1,name=mcronjob.kb.io,sideEffects=None,admissionReviewVersions=v1

var _ webhook.Defaulter = &CronJob{}

// Default implements webhook.Defaulter so a webhook will be registered for the type
func (r *CronJob) Default() {
	cronjoblog.Info("default", "name", r.Name)

	if r.Spec.ConcurrencyPolicy == "" {
		r.Spec.ConcurrencyPolicy = AllowConcurrent
	}
	if r.Spec.Suspend == nil {
		r.Spec.Suspend = new(bool)
	}
	if r.Spec.SuccessfulJobsHistoryLimit == nil {
		r.Spec.SuccessfulJobsHistoryLimit = new(int32)
		*r.Spec.SuccessfulJobsHistoryLimit = 3
	}
	if r.Spec.FailedJobsHistoryLimit == nil {
		r.Spec.FailedJobsHistoryLimit = new(int32)
		*r.Spec.FailedJobsHistoryLimit = 1
	}
}

// +kubebuilder:webhook:verbs=create;update;delete,path=/validate-batch-tutorial-kubebuilder-io-v1-cronjob,mutating=false,failurePolicy=fail,groups=batch.tutorial.kubebuilder.io,resources=cronjobs,versions=v1,name=vcronjob.kb.io,sideEffects=None,admissionReviewVersions=v1

var _ webhook.Validator = &CronJob{}

// ValidateCreate implements webhook.Validator so a webhook will be registered for the type
func (r *CronJob) ValidateCreate() error {
	cronjoblog.Info("validate create", "name", r.Name)

	return r.validateCronJob()
}

// ValidateUpdate implements webhook.Validator so a webhook will be registered for the type
func (r *CronJob) ValidateUpdate(old runtime.Object) error {
	cronjoblog.Info("validate update", "name", r.Name)

	return r.validateCronJob()
}

// ValidateDelete implements webhook.Validator so a webhook will be registered for the type
func (r *CronJob) ValidateDelete() error {
	cronjoblog.Info("validate delete", "name", r.Name)

	// TODO(user): fill in your validation logic upon object deletion.
	return nil
}

func (r *CronJob) validateCronJob() error {
	var allErrs field.ErrorList
	if err := r.validateCronJobName(); err != nil {
		allErrs = append(allErrs, err)
	}
	if err := r.validateCronJobSpec(); err != nil {
		allErrs = append(allErrs, err)
	}
	if len(allErrs) == 0 {
		return nil
	}

	return apierrors.NewInvalid(
		schema.GroupKind{Group: "batch.tutorial.kubebuilder.io", Kind: "CronJob"},
		r.Name, allErrs)
}

func (r *CronJob) validateCronJobSpec() *field.Error {
	// The field helpers from the kubernetes API machinery help us return nicely
	// structured validation errors.
	return validateScheduleFormat(
		r.Spec.Schedule,
		field.NewPath("spec").Child("schedule"))
}

func validateScheduleFormat(schedule string, fldPath *field.Path) *field.Error {
	if _, err := cron.ParseStandard(schedule); err != nil {
		return field.Invalid(fldPath, schedule, err.Error())
	}
	return nil
}

func (r *CronJob) validateCronJobName() *field.Error {
	if len(r.ObjectMeta.Name) > validationutils.DNS1035LabelMaxLength-11 {
		// The job name length is 63 character like all Kubernetes objects
		// (which must fit in a DNS subdomain). The cronjob controller appends
		// a 11-character suffix to the cronjob (`-$TIMESTAMP`) when creating
		// a job. The job name length limit is 63 characters. Therefore cronjob
		// names must have length <= 63-11=52. If we don't validate this here,
		// then job creation will fail later.
		return field.Invalid(field.NewPath("metadata").Child("name"), r.Name, "must be no more than 52 characters")
	}
	return nil
}

…and main.go

Similarly, our existing main file is sufficient:

project/cmd/main.go
Apache License

Copyright 2023 The Kubernetes authors.

Licensed under the Apache License, Version 2.0 (the “License”); you may not use this file except in compliance with the License. You may obtain a copy of the License at

http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an “AS IS” BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License.

Imports
package main

import (
	"flag"
	"os"

	// Import all Kubernetes client auth plugins (e.g. Azure, GCP, OIDC, etc.)
	// to ensure that exec-entrypoint and run can make use of them.
	_ "k8s.io/client-go/plugin/pkg/client/auth"

	kbatchv1 "k8s.io/api/batch/v1"
	"k8s.io/apimachinery/pkg/runtime"
	utilruntime "k8s.io/apimachinery/pkg/util/runtime"
	clientgoscheme "k8s.io/client-go/kubernetes/scheme"
	ctrl "sigs.k8s.io/controller-runtime"
	"sigs.k8s.io/controller-runtime/pkg/healthz"
	"sigs.k8s.io/controller-runtime/pkg/log/zap"

	batchv1 "tutorial.kubebuilder.io/project/api/v1"
	batchv2 "tutorial.kubebuilder.io/project/api/v2"
	"tutorial.kubebuilder.io/project/internal/controller"
	//+kubebuilder:scaffold:imports
)
existing setup
var (
	scheme   = runtime.NewScheme()
	setupLog = ctrl.Log.WithName("setup")
)

func init() {
	utilruntime.Must(clientgoscheme.AddToScheme(scheme))

	utilruntime.Must(kbatchv1.AddToScheme(scheme)) // we've added this ourselves
	utilruntime.Must(batchv1.AddToScheme(scheme))
	utilruntime.Must(batchv2.AddToScheme(scheme))
	//+kubebuilder:scaffold:scheme
}
func main() {
existing setup
	var metricsAddr string
	var enableLeaderElection bool
	var probeAddr string
	flag.StringVar(&metricsAddr, "metrics-bind-address", ":8080", "The address the metric endpoint binds to.")
	flag.StringVar(&probeAddr, "health-probe-bind-address", ":8081", "The address the probe endpoint binds to.")
	flag.BoolVar(&enableLeaderElection, "leader-elect", false,
		"Enable leader election for controller manager. "+
			"Enabling this will ensure there is only one active controller manager.")
	opts := zap.Options{
		Development: true,
	}
	opts.BindFlags(flag.CommandLine)
	flag.Parse()

	ctrl.SetLogger(zap.New(zap.UseFlagOptions(&opts)))

	mgr, err := ctrl.NewManager(ctrl.GetConfigOrDie(), ctrl.Options{
		Scheme:                 scheme,
		MetricsBindAddress:     metricsAddr,
		Port:                   9443,
		HealthProbeBindAddress: probeAddr,
		LeaderElection:         enableLeaderElection,
		LeaderElectionID:       "80807133.tutorial.kubebuilder.io",
		// LeaderElectionReleaseOnCancel defines if the leader should step down voluntarily
		// when the Manager ends. This requires the binary to immediately end when the
		// Manager is stopped, otherwise this setting is unsafe. Setting this significantly
		// speeds up voluntary leader transitions as the new leader doesn't have to wait
		// the LeaseDuration time first.
		//
		// In the default scaffold provided, the program ends immediately after
		// the manager stops, so it would be fine to enable this option. However,
		// if you are doing, or intend to do, any operation such as performing cleanups
		// after the manager stops, then its usage might be unsafe.
		// LeaderElectionReleaseOnCancel: true,
	})
	if err != nil {
		setupLog.Error(err, "unable to start manager")
		os.Exit(1)
	}

	if err = (&controller.CronJobReconciler{
		Client: mgr.GetClient(),
		Scheme: mgr.GetScheme(),
	}).SetupWithManager(mgr); err != nil {
		setupLog.Error(err, "unable to create controller", "controller", "CronJob")
		os.Exit(1)
	}

Our existing call to SetupWebhookWithManager registers our conversion webhooks with the manager, too.

	if os.Getenv("ENABLE_WEBHOOKS") != "false" {
		if err = (&batchv1.CronJob{}).SetupWebhookWithManager(mgr); err != nil {
			setupLog.Error(err, "unable to create webhook", "webhook", "CronJob")
			os.Exit(1)
		}
		if err = (&batchv2.CronJob{}).SetupWebhookWithManager(mgr); err != nil {
			setupLog.Error(err, "unable to create webhook", "webhook", "CronJob")
			os.Exit(1)
		}
	}
	//+kubebuilder:scaffold:builder
existing setup
	if err := mgr.AddHealthzCheck("healthz", healthz.Ping); err != nil {
		setupLog.Error(err, "unable to set up health check")
		os.Exit(1)
	}
	if err := mgr.AddReadyzCheck("readyz", healthz.Ping); err != nil {
		setupLog.Error(err, "unable to set up ready check")
		os.Exit(1)
	}

	setupLog.Info("starting manager")
	if err := mgr.Start(ctrl.SetupSignalHandler()); err != nil {
		setupLog.Error(err, "problem running manager")
		os.Exit(1)
	}
}

Everything’s set up and ready to go! All that’s left now is to test out our webhooks.

Deployment and Testing

Before we can test out our conversion, we’ll need to enable it in our CRD:

Kubebuilder generates Kubernetes manifests under the config directory with webhook bits disabled. To enable them, we need to:

  • Enable patches/webhook_in_<kind>.yaml and patches/cainjection_in_<kind>.yaml in config/crd/kustomization.yaml file.

  • Enable ../certmanager and ../webhook directories under the bases section in config/default/kustomization.yaml file.

  • Enable manager_webhook_patch.yaml and webhookcainjection_patch.yaml under the patches section in config/default/kustomization.yaml file.

  • Enable all the vars under the CERTMANAGER section in config/default/kustomization.yaml file.

Additionally, if present in our Makefile, we’ll need to set the CRD_OPTIONS variable to just "crd", removing the trivialVersions option (this ensures that we actually generate validation for each version, instead of telling Kubernetes that they’re the same):

CRD_OPTIONS ?= "crd"

Now we have all our code changes and manifests in place, so let’s deploy it to the cluster and test it out.

You’ll need cert-manager installed (version 0.9.0+) unless you’ve got some other certificate management solution. The Kubebuilder team has tested the instructions in this tutorial with the 0.9.0-alpha.0 release.

Once all our ducks are in a row with certificates, we can run make install deploy (as normal) to deploy all the bits (CRD, controller-manager deployment) onto the cluster.

Testing

Once all of the bits are up and running on the cluster with conversion enabled, we can test out our conversion by requesting different versions.

We’ll make a v2 version based on our v1 version (put it under config/samples)

apiVersion: batch.tutorial.kubebuilder.io/v2
kind: CronJob
metadata:
  labels:
    app.kubernetes.io/name: cronjob
    app.kubernetes.io/instance: cronjob-sample
    app.kubernetes.io/part-of: project
    app.kubernetes.io/managed-by: kustomize
    app.kubernetes.io/created-by: project
  name: cronjob-sample
spec:
  schedule:
    minute: "*/1"
  startingDeadlineSeconds: 60
  concurrencyPolicy: Allow # explicitly specify, but Allow is also default.
  jobTemplate:
    spec:
      template:
        spec:
          containers:
          - name: hello
            image: busybox
            args:
            - /bin/sh
            - -c
            - date; echo Hello from the Kubernetes cluster
          restartPolicy: OnFailure

Then, we can create it on the cluster:

kubectl apply -f config/samples/batch_v2_cronjob.yaml

If we’ve done everything correctly, it should create successfully, and we should be able to fetch it using both the v2 resource

kubectl get cronjobs.v2.batch.tutorial.kubebuilder.io -o yaml
apiVersion: batch.tutorial.kubebuilder.io/v2
kind: CronJob
metadata:
  labels:
    app.kubernetes.io/name: cronjob
    app.kubernetes.io/instance: cronjob-sample
    app.kubernetes.io/part-of: project
    app.kubernetes.io/managed-by: kustomize
    app.kubernetes.io/created-by: project
  name: cronjob-sample
spec:
  schedule:
    minute: "*/1"
  startingDeadlineSeconds: 60
  concurrencyPolicy: Allow # explicitly specify, but Allow is also default.
  jobTemplate:
    spec:
      template:
        spec:
          containers:
          - name: hello
            image: busybox
            args:
            - /bin/sh
            - -c
            - date; echo Hello from the Kubernetes cluster
          restartPolicy: OnFailure

and the v1 resource

kubectl get cronjobs.v1.batch.tutorial.kubebuilder.io -o yaml
apiVersion: batch.tutorial.kubebuilder.io/v1
kind: CronJob
metadata:
  labels:
    app.kubernetes.io/name: cronjob
    app.kubernetes.io/instance: cronjob-sample
    app.kubernetes.io/part-of: project
    app.kubernetes.io/managed-by: kustomize
    app.kubernetes.io/created-by: project
  name: cronjob-sample
spec:
  schedule: "*/1 * * * *"
  startingDeadlineSeconds: 60
  concurrencyPolicy: Allow # explicitly specify, but Allow is also default.
  jobTemplate:
    spec:
      template:
        spec:
          containers:
          - name: hello
            image: busybox
            args:
            - /bin/sh
            - -c
            - date; echo Hello from the Kubernetes cluster
          restartPolicy: OnFailure

Both should be filled out, and look equivalent to our v2 and v1 samples, respectively. Notice that each has a different API version.

Finally, if we wait a bit, we should notice that our CronJob continues to reconcile, even though our controller is written against our v1 API version.

Troubleshooting

steps for troubleshooting

Tutorial: ComponentConfig

Nearly every project that is built for Kubernetes will eventually need to support passing additional configuration into the controller. This could be to enable better logging, turn specific feature gates on or off, set the sync period, or a myriad of other controls. Previously this was commonly done using CLI flags that your main.go would parse to make them accessible within your program. While this works, it’s not a forward-looking design, and the Kubernetes community has been migrating the core components away from flags and toward versioned config files, referred to as “component configs”.

The rest of this tutorial will show you how to configure your kubebuilder project with the component config type, and then move on to implementing a custom type so that you can extend this capability.

Resources

Changing things up

This tutorial will show you how to create a custom configuration file for your project by modifying a project generated with the --component-config flag passed to the init command. The full tutorial’s source can be found here. Make sure you’ve gone through the installation steps before continuing.

New project:

# we'll use a domain of tutorial.kubebuilder.io,
# so all API groups will be <group>.tutorial.kubebuilder.io.
kubebuilder init --domain tutorial.kubebuilder.io --component-config

Setting up an existing project

If you’ve previously generated a project we can add support for parsing the config file by making the following changes to main.go.

First, add a new flag to specify the path that the component config file should be loaded from.

var configFile string
flag.StringVar(&configFile, "config", "",
    "The controller will load its initial configuration from this file. "+
        "Omit this flag to use the default configuration values. "+
            "Command-line flags override configuration from this file.")

Now, we can set up the Options struct and check whether configFile is set (this preserves backwards compatibility). If it is set, we use the AndFrom function on Options to parse the config file and populate the Options from it.

var err error
options := ctrl.Options{Scheme: scheme}
if configFile != "" {
    options, err = options.AndFrom(ctrl.ConfigFile().AtPath(configFile))
    if err != nil {
        setupLog.Error(err, "unable to load the config file")
        os.Exit(1)
    }
}

Lastly, we’ll change the NewManager call to use the options variable we defined above.

mgr, err := ctrl.NewManager(ctrl.GetConfigOrDie(), options)

With that out of the way, we can get on to defining our new config!

Create the file /config/manager/controller_manager_config.yaml with the following content:

apiVersion: controller-runtime.sigs.k8s.io/v1alpha1
kind: ControllerManagerConfig
health:
  healthProbeBindAddress: :8081
metrics:
  bindAddress: 127.0.0.1:8080
webhook:
  port: 9443
leaderElection:
  leaderElect: true
  resourceName: ecaf1259.tutorial.kubebuilder.io
# leaderElectionReleaseOnCancel defines if the leader should step down voluntarily
# when the Manager ends. This requires the binary to immediately end when the
# Manager is stopped, otherwise this setting is unsafe. Setting this significantly
# speeds up voluntary leader transitions as the new leader doesn't have to wait
# the LeaseDuration time first.
# In the default scaffold provided, the program ends immediately after
# the manager stops, so it would be fine to enable this option. However,
# if you are doing, or intend to do, any operation such as performing cleanups
# after the manager stops, then its usage might be unsafe.
# leaderElectionReleaseOnCancel: true

Update the file /config/manager/kustomization.yaml by adding at the bottom the following content:

generatorOptions:
  disableNameSuffixHash: true

configMapGenerator:
- name: manager-config
  files:
  - controller_manager_config.yaml

Update the file default/kustomization.yaml by adding under the patchesStrategicMerge: key the following patch:

patchesStrategicMerge:
# Mount the controller config file for loading manager configurations
# through a ComponentConfig type
- manager_config_patch.yaml

Update the file default/manager_config_patch.yaml by adding under the spec: key the following patch:

spec:
  template:
    spec:
      containers:
      - name: manager
        args:
        - "--config=controller_manager_config.yaml"
        volumeMounts:
        - name: manager-config
          mountPath: /controller_manager_config.yaml
          subPath: controller_manager_config.yaml
      volumes:
      - name: manager-config
        configMap:
          name: manager-config

Defining your Config

Now that you have a component-config-based project, we need to customize the values that are passed into the controller. To do this, we can take a look at config/manager/controller_manager_config.yaml.

controller_manager_config.yaml
apiVersion: controller-runtime.sigs.k8s.io/v1alpha1
kind: ControllerManagerConfig
metrics:
  bindAddress: 127.0.0.1:8080
webhook:
  port: 9443
leaderElection:
  leaderElect: true
  resourceName: 80807133.tutorial.kubebuilder.io

To see all the available fields, you can look at the v1alpha1 controller-runtime config type, ControllerManagerConfiguration.

Using a Custom Type

If your project needs to accept additional configurations that aren’t controller-runtime specific, e.g. ClusterName, Region, or anything else serializable into yaml, you can do this by using kubebuilder to create a new type and then updating your main.go to set the new type up for parsing.

The rest of this tutorial will walk through implementing a custom component config type.

Adding a new Config Type

To scaffold out a new config Kind, we can use kubebuilder create api.

kubebuilder create api --group config --version v2 --kind ProjectConfig --resource --controller=false --make=false

Then, run make build, which will generate the file zz_generated.deepcopy.go and thereby implement the runtime.Object interface for your API type.

This will create a new type file in api/config/v2/ for the ProjectConfig kind. We’ll need to change this file to embed the v1alpha1.ControllerManagerConfigurationSpec.

projectconfig_types.go
Apache License

Copyright 2020 The Kubernetes authors.

Licensed under the Apache License, Version 2.0 (the “License”); you may not use this file except in compliance with the License. You may obtain a copy of the License at

http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an “AS IS” BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License.

We start out simply enough: we import the config/v1alpha1 API group, which is exposed through ControllerRuntime.

package v2

import (
	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
	cfg "sigs.k8s.io/controller-runtime/pkg/config/v1alpha1"
)

// +kubebuilder:object:root=true

Next, we’ll remove the default ProjectConfigSpec and ProjectConfigList then we’ll embed cfg.ControllerManagerConfigurationSpec in ProjectConfig.

// ProjectConfig is the Schema for the projectconfigs API
type ProjectConfig struct {
	metav1.TypeMeta `json:",inline"`

	// ControllerManagerConfigurationSpec returns the configurations for controllers
	cfg.ControllerManagerConfigurationSpec `json:",inline"`

	ClusterName string `json:"clusterName,omitempty"`
}

If you haven’t, you’ll also need to remove the ProjectConfigList from the SchemeBuilder.Register.

func init() {
	SchemeBuilder.Register(&ProjectConfig{})
}

Lastly, we’ll change the main.go to reference this type for parsing the file.

Updating main

Once you have defined your new custom component config type, we need to make sure the new config type is imported and its types are registered with the scheme. If you used kubebuilder create api, this should have been automated.

import (
    // ... other imports
    configv2 "tutorial.kubebuilder.io/project/apis/config/v2"
    // +kubebuilder:scaffold:imports
)

With the package imported we can confirm the types have been added.

func init() {
	// ... other scheme registrations
	utilruntime.Must(configv2.AddToScheme(scheme))
	// +kubebuilder:scaffold:scheme
}

Lastly, we need to change the options parsing in main.go to use this new type. To do this we’ll chain OfKind onto ctrl.ConfigFile() and pass in a pointer to the config kind.

var err error
ctrlConfig := configv2.ProjectConfig{}
options := ctrl.Options{Scheme: scheme}
if configFile != "" {
    options, err = options.AndFrom(ctrl.ConfigFile().AtPath(configFile).OfKind(&ctrlConfig))
    if err != nil {
        setupLog.Error(err, "unable to load the config file")
        os.Exit(1)
    }
}

Now, if you need to use the .clusterName field we defined in our custom kind, you can read ctrlConfig.ClusterName, which will be populated from the supplied config file.
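
One way to plumb that value into your controllers is to pass it along when wiring up the reconciler in main.go. This is only a sketch: the ClusterName field on CronJobReconciler below is a hypothetical addition of our own, not something the scaffold generates.

	// Hypothetical: CronJobReconciler has been extended with a ClusterName string field.
	if err = (&controller.CronJobReconciler{
		Client:      mgr.GetClient(),
		Scheme:      mgr.GetScheme(),
		ClusterName: ctrlConfig.ClusterName, // populated from the supplied config file
	}).SetupWithManager(mgr); err != nil {
		setupLog.Error(err, "unable to create controller", "controller", "CronJob")
		os.Exit(1)
	}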

Defining your Custom Config

Now that you have a custom component config, change config/manager/controller_manager_config.yaml to use the new GVK you defined.

project/config/manager/controller_manager_config.yaml
apiVersion: config.tutorial.kubebuilder.io/v2
kind: ProjectConfig
metadata:
  labels:
    app.kubernetes.io/name: controllermanagerconfig
    app.kubernetes.io/instance: controller-manager-configuration
    app.kubernetes.io/component: manager
    app.kubernetes.io/created-by: project
    app.kubernetes.io/part-of: project
    app.kubernetes.io/managed-by: kustomize
health:
  healthProbeBindAddress: :8081
metrics:
  bindAddress: 127.0.0.1:8080
webhook:
  port: 9443
leaderElection:
  leaderElect: true
  resourceName: 80807133.tutorial.kubebuilder.io
clusterName: example-test

This file now uses the new ProjectConfig kind under the GVK config.tutorial.kubebuilder.io/v2. With these custom configs, we can add any yaml-serializable fields that your controller needs and begin to reduce the reliance on flags to configure your project.
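
As a sketch of how such an extension might look (the Region field below is a hypothetical example, not part of the tutorial), any extra yaml-serializable field can be added to the kind and then set in the config file alongside clusterName:

// ProjectConfig is the Schema for the projectconfigs API
type ProjectConfig struct {
	metav1.TypeMeta `json:",inline"`

	// ControllerManagerConfigurationSpec returns the configurations for controllers
	cfg.ControllerManagerConfigurationSpec `json:",inline"`

	ClusterName string `json:"clusterName,omitempty"`

	// Region is a hypothetical extra setting; any yaml-serializable field works.
	Region string `json:"region,omitempty"`
}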

Migrations

Migrating between project structures in Kubebuilder generally involves a bit of manual work.

This section details what’s required to migrate, between different versions of Kubebuilder scaffolding, as well as to more complex project layout structures.

Migration guides from Legacy versions < 3.0.0

Follow the migration guides from the legacy Kubebuilder versions up to the latest required v3.x version. Note that from v3, a new plugin-based ecosystem is introduced for better maintainability, reusability, and user experience.

For more info, see the design docs of:

Also, you can check the Plugins section.

Kubebuilder v1 vs v2 (Legacy v1.0.0+ to v2.0.0 Kubebuilder CLI versions)

This document covers all breaking changes when migrating from v1 to v2.

The details of all changes (breaking or otherwise) can be found in controller-runtime, controller-tools and kubebuilder release notes.

Common changes

V2 projects use Go modules, but kubebuilder will continue to support dep until Go 1.13 is out.

controller-runtime

  • Client.List now uses functional options (List(ctx, list, ...option)) instead of List(ctx, ListOptions, list); see the sketch after this list.

  • Client.DeleteAllOf was added to the Client interface.

  • Metrics are on by default now.

  • A number of packages under pkg/runtime have been moved, with their old locations deprecated. The old locations will be removed before controller-runtime v1.0.0. See the godocs for more information.

  • Automatic certificate generation for webhooks has been removed, and webhooks will no longer self-register. Use controller-tools to generate a webhook configuration. If you need certificate generation, we recommend using cert-manager. Kubebuilder v2 will scaffold out cert manager configs for you to use – see the Webhook Tutorial for more details.

  • The builder package now has separate builders for controllers and webhooks, which facilitates choosing which to run.
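
To illustrate the Client.List change in the first item above, here is a minimal sketch of the new functional-options style, assuming c is a client.Client (from sigs.k8s.io/controller-runtime/pkg/client), ctx is a context.Context, and corev1 is k8s.io/api/core/v1; the namespace and label selector are just examples:

	var pods corev1.PodList
	if err := c.List(ctx, &pods,
		client.InNamespace("default"),
		client.MatchingLabels{"app": "sample"},
	); err != nil {
		// handle the error
	}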

controller-tools

The generator framework has been rewritten in v2. It still works the same as before in many cases, but be aware that there are some breaking changes. Please check marker documentation for more details.

Kubebuilder

  • Kubebuilder v2 introduces a simplified project layout. You can find the design doc here.

  • In v1, the manager is deployed as a StatefulSet, while it’s deployed as a Deployment in v2.

  • The kubebuilder create webhook command was added to scaffold mutating/validating/conversion webhooks. It replaces the kubebuilder alpha webhook command.

  • v2 uses distroless/static instead of Ubuntu as base image. This reduces image size and attack surface.

  • v2 requires kustomize v3.1.0+.

Migration from v1 to v2

Make sure you understand the differences between Kubebuilder v1 and v2 before continuing

Please ensure you have followed the installation guide to install the required components.

The recommended way to migrate a v1 project is to create a new v2 project and copy over the API and the reconciliation code. The conversion will end up with a project that looks like a native v2 project. However, in some cases, it’s possible to do an in-place upgrade (i.e. reuse the v1 project layout, upgrading controller-runtime and controller-tools).

Let’s take a v1 project as an example and migrate it to Kubebuilder v2. At the end, we should have something that looks like the example v2 project.

Preparation

We’ll need to figure out what the group, version, kind and domain are.

Let’s take a look at our current v1 project structure:

pkg/
├── apis
│   ├── addtoscheme_batch_v1.go
│   ├── apis.go
│   └── batch
│       ├── group.go
│       └── v1
│           ├── cronjob_types.go
│           ├── cronjob_types_test.go
│           ├── doc.go
│           ├── register.go
│           ├── v1_suite_test.go
│           └── zz_generated.deepcopy.go
├── controller
└── webhook

All of our API information is stored in pkg/apis/batch, so we can look there to find what we need to know.

In cronjob_types.go, we can find

type CronJob struct {...}

In register.go, we can find

SchemeGroupVersion = schema.GroupVersion{Group: "batch.tutorial.kubebuilder.io", Version: "v1"}

Putting that together, we get CronJob as the kind, and batch.tutorial.kubebuilder.io/v1 as the group-version.

Initialize a v2 Project

Now, we need to initialize a v2 project. Before we do that, though, we’ll need to initialize a new go module if we’re not on the gopath:

go mod init tutorial.kubebuilder.io/project

Then, we can finish initializing the project with kubebuilder:

kubebuilder init --domain tutorial.kubebuilder.io

Migrate APIs and Controllers

Next, we’ll re-scaffold out the API types and controllers. Since we want both, we’ll say yes to both the API and controller prompts when asked what parts we want to scaffold:

kubebuilder create api --group batch --version v1 --kind CronJob

If you’re using multiple groups, some manual work is required to migrate. Please follow this for more details.

Migrate the APIs

Now, let’s copy the API definition from pkg/apis/batch/v1/cronjob_types.go to api/v1/cronjob_types.go. We only need to copy the implementation of the Spec and Status fields.

We can replace the +k8s:deepcopy-gen:interfaces=... marker (which is deprecated in kubebuilder) with +kubebuilder:object:root=true.

We don’t need the following markers any more (they’re not used anymore, and are relics from much older versions of Kubebuilder):

// +genclient
// +k8s:openapi-gen=true

Our API types should look like the following:

// +kubebuilder:object:root=true
// +kubebuilder:subresource:status
// CronJob is the Schema for the cronjobs API
type CronJob struct {...}

// +kubebuilder:object:root=true

// CronJobList contains a list of CronJob
type CronJobList struct {...}

Migrate the Controllers

Now, let’s migrate the controller reconciler code from pkg/controller/cronjob/cronjob_controller.go to controllers/cronjob_controller.go.

We’ll need to copy

  • the fields from the ReconcileCronJob struct to CronJobReconciler
  • the contents of the Reconcile function
  • the rbac related markers to the new file.
  • the code under func add(mgr manager.Manager, r reconcile.Reconciler) error to func SetupWithManager (see the sketch after this list)
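
For reference, a minimal sketch of what the migrated SetupWithManager might look like, assuming the old add() function only watched the CronJob type (add Owns(...) or Watches(...) calls to mirror any other watches it registered):

func (r *CronJobReconciler) SetupWithManager(mgr ctrl.Manager) error {
	return ctrl.NewControllerManagedBy(mgr).
		For(&batchv1.CronJob{}).
		Complete(r)
}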

Migrate the Webhooks

If you don’t have a webhook, you can skip this section.

Webhooks for Core Types and External CRDs

If you are using webhooks for Kubernetes core types (e.g. Pods), or for an external CRD that is not owned by you, you can refer to the controller-runtime example for builtin types and do something similar. Kubebuilder doesn’t scaffold much for these cases, but you can use the library in controller-runtime.

Scaffold Webhooks for our CRDs

Now let’s scaffold the webhooks for our CRD (CronJob). We’ll need to run the following command with the --defaulting and --programmatic-validation flags (since our test project uses defaulting and validating webhooks):

kubebuilder create webhook --group batch --version v1 --kind CronJob --defaulting --programmatic-validation

Depending on how many CRDs need webhooks, we may need to run the above command multiple times with different Group-Version-Kinds.

Now, we’ll need to copy the logic for each webhook. For validating webhooks, we can copy the contents from func validatingCronJobFn in pkg/default_server/cronjob/validating/cronjob_create_handler.go to func ValidateCreate in api/v1/cronjob_webhook.go and then the same for update.

Similarly, we’ll copy from func mutatingCronJobFn to func Default.
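
For orientation, the destination methods in api/v1/cronjob_webhook.go have the following shapes in v2 (the bodies are where the copied logic goes); this mirrors the Default and ValidateCreate methods shown earlier in the book:

func (r *CronJob) Default() {
	// logic copied from mutatingCronJobFn goes here
}

func (r *CronJob) ValidateCreate() error {
	// logic copied from validatingCronJobFn goes here
	return nil
}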

Webhook Markers

When scaffolding webhooks, Kubebuilder v2 adds the following markers:

// These are v2 markers

// This is for the mutating webhook
// +kubebuilder:webhook:path=/mutate-batch-tutorial-kubebuilder-io-v1-cronjob,mutating=true,failurePolicy=fail,groups=batch.tutorial.kubebuilder.io,resources=cronjobs,verbs=create;update,versions=v1,name=mcronjob.kb.io

...

// This is for the validating webhook
// +kubebuilder:webhook:path=/validate-batch-tutorial-kubebuilder-io-v1-cronjob,mutating=false,failurePolicy=fail,groups=batch.tutorial.kubebuilder.io,resources=cronjobs,verbs=create;update,versions=v1,name=vcronjob.kb.io

The default verbs are verbs=create;update. We need to ensure verbs matches what we need. For example, if we only want to validate creation, then we would change it to verbs=create.

We also need to ensure failure-policy is still the same.

Markers like the following are no longer needed (since they deal with self-deploying certificate configuration, which was removed in v2):

// v1 markers
// +kubebuilder:webhook:port=9876,cert-dir=/tmp/cert
// +kubebuilder:webhook:service=test-system:webhook-service,selector=app:webhook-server
// +kubebuilder:webhook:secret=test-system:webhook-server-secret
// +kubebuilder:webhook:mutating-webhook-config-name=test-mutating-webhook-cfg
// +kubebuilder:webhook:validating-webhook-config-name=test-validating-webhook-cfg

In v1, a single webhook marker may be split into multiple ones in the same paragraph. In v2, each webhook must be represented by a single marker.

Others

If there are any manual updates in main.go in v1, we need to port the changes to the new main.go. We’ll also need to ensure all of the needed schemes have been registered.

If there are additional manifests added under config directory, port them as well.

Change the image name in the Makefile if needed.

Verification

Finally, we can run make and make docker-build to ensure things are working fine.

Kubebuilder v2 vs v3 (Legacy Kubebuilder v2.0.0+ layout to 3.0.0+)

This document covers all breaking changes when migrating from v2 to v3.

The details of all changes (breaking or otherwise) can be found in controller-runtime, controller-tools and kb-releases release notes.

Common changes

v3 projects use Go modules and request Go 1.18+. Dep is no longer supported for dependency management.

Kubebuilder

  • Preliminary support for plugins was added. For more info see the Extensible CLI and Scaffolding Plugins: phase 1, the Extensible CLI and Scaffolding Plugins: phase 1.5 and the Extensible CLI and Scaffolding Plugins - Phase 2 design docs. Also, you can check the Plugins section.

  • The PROJECT file now has a new layout. It stores more information about what resources are in use, to better enable plugins to make useful decisions when scaffolding.

    Furthermore, the PROJECT file itself is now versioned: the version field corresponds to the version of the PROJECT file itself, while the layout field indicates the scaffolding & primary plugin version in use.

  • The version of the image gcr.io/kubebuilder/kube-rbac-proxy, which is an optional component enabled by default to secure the request made against the manager, was updated from 0.5.0 to 0.11.0 to address security concerns. The details of all changes can be found in kube-rbac-proxy.

TL;DR of the New go/v3 Plugin

More details on this can be found here, but the highlights are summarized below.

  • Scaffolded/Generated API version changes:

    • Use apiextensions/v1 for generated CRDs (apiextensions/v1beta1 was deprecated in Kubernetes 1.16)
    • Use admissionregistration.k8s.io/v1 for generated webhooks (admissionregistration.k8s.io/v1beta1 was deprecated in Kubernetes 1.16)
    • Use cert-manager.io/v1 for the certificate manager when webhooks are used (cert-manager.io/v1alpha2 was deprecated in Cert-Manager 0.14. More info: CertManager v1.0 docs)
  • Code changes:

    • The manager flags --metrics-addr and enable-leader-election now are named --metrics-bind-address and --leader-elect to be more aligned with core Kubernetes Components. More info: #1839
    • Liveness and Readiness probes are now added by default using healthz.Ping.
    • A new option to create the projects using ComponentConfig is introduced. For more info see its enhancement proposal and the Component config tutorial
    • Manager manifests now use SecurityContext to address security concerns. More info: #1637
  • Misc:

    • Support for controller-tools v0.9.0 (for go/v2 it is v0.3.0 and previously it was v0.2.5)
    • Support for controller-runtime v0.12.1 (for go/v2 it is v0.6.4 and previously it was v0.5.0)
    • Support for kustomize v3.8.7 (for go/v2 it is v3.5.4 and previously it was v3.1.0)
    • Required Envtest binaries are automatically downloaded
    • The minimum Go version is now 1.18 (previously it was 1.13).

Migrating to Kubebuilder v3

If you want to upgrade your scaffolding to use the latest and greatest features, follow the guide below, which covers the steps in the most straightforward way to upgrade your project and pick up all the latest changes and improvements.

By updating the files manually

If you want to use the latest version of the Kubebuilder CLI without changing your scaffolding, check the following guide, which describes the manual steps required to upgrade only your PROJECT version and start using the plugin versions.

This way is more complex, susceptible to errors, and success cannot be assured. Also, by following these steps you will not get the improvements and bug fixes in the default generated project files.

You will see that you can still use the previous layout by using the go/v2 plugin, which will not upgrade controller-runtime and controller-tools to the latest versions used with go/v3 because of their breaking changes. This guide also shows how to manually change the files to use the go/v3 plugin and its dependency versions.

Migration from v2 to v3

Make sure you understand the differences between Kubebuilder v2 and v3 before continuing.

Please ensure you have followed the installation guide to install the required components.

The recommended way to migrate a v2 project is to create a new v3 project and copy over the API and the reconciliation code. The conversion will end up with a project that looks like a native v3 project. However, in some cases, it’s possible to do an in-place upgrade (i.e. reuse the v2 project layout, upgrading controller-runtime and controller-tools).

Initialize a v3 Project

Create a new directory with the name of your project. Note that this name is used in the scaffolds to create the name of your manager Pod and of the Namespace where the Manager is deployed by default.

$ mkdir migration-project-name
$ cd migration-project-name

Now, we need to initialize a v3 project. Before we do that, though, we’ll need to initialize a new go module if we’re not on the GOPATH. While technically this is not needed inside GOPATH, it is still recommended.

go mod init tutorial.kubebuilder.io/migration-project

Then, we can finish initializing the project with kubebuilder.

kubebuilder init --domain tutorial.kubebuilder.io

Migrate APIs and Controllers

Next, we’ll re-scaffold out the API types and controllers.

kubebuilder create api --group batch --version v1 --kind CronJob

Migrate the APIs

Now, let’s copy the API definition from api/v1/<kind>_types.go in our old project to the new one.

These files have not been modified by the new plugin, so you should be able to replace your freshly scaffolded files with your old ones. There may be some cosmetic changes, so you can choose to copy only the types themselves.

Migrate the Controllers

Now, let’s migrate the controller code from controllers/cronjob_controller.go in our old project to the new one. There is a breaking change and there may be some cosmetic changes.

The new Reconcile method receives the context as an argument now, instead of having to create it with context.Background(). You can copy the rest of the code in your old controller to the scaffolded methods replacing:

func (r *CronJobReconciler) Reconcile(req ctrl.Request) (ctrl.Result, error) {
    ctx := context.Background() 
    log := r.Log.WithValues("cronjob", req.NamespacedName)

With:

func (r *CronJobReconciler) Reconcile(ctx context.Context, req ctrl.Request) (ctrl.Result, error) {
	log := r.Log.WithValues("cronjob", req.NamespacedName)

Migrate the Webhooks

Now let’s scaffold the webhooks for our CRD (CronJob). We’ll need to run the following command with the --defaulting and --programmatic-validation flags (since our test project uses defaulting and validating webhooks):

kubebuilder create webhook --group batch --version v1 --kind CronJob --defaulting --programmatic-validation

Now, let’s copy the webhook definition from api/v1/<kind>_webhook.go from our old project to the new one.

Others

If there are any manual updates in main.go in v2, we need to port the changes to the new main.go. We’ll also need to ensure all of the needed schemes have been registered.

If there are additional manifests added under config directory, port them as well.

Change the image name in the Makefile if needed.

Verification

Finally, we can run make and make docker-build to ensure things are working fine.

Migration from v2 to v3 by updating the files manually

Make sure you understand the differences between Kubebuilder v2 and v3 before continuing

Please ensure you have followed the installation guide to install the required components.

The following guide describes the manual steps required to upgrade your config version and start using the plugin-enabled version.

This way is more complex, susceptible to errors, and success cannot be assured. Also, by following these steps you will not get the improvements and bug fixes in the default generated project files.

Usually you will only try to do it manually if you customized your project and deviated too much from the proposed scaffold. Before continuing, ensure that you understand the note about project customizations. Note that doing this process manually might take more effort than organizing your project customizations to follow the proposed layout, which keeps your project maintainable and upgradable with less effort in the future.

The recommended upgrade approach is to follow the Migration Guide v2 to V3 instead.

Migration from project config version “2” to “3”

Migrating between project configuration versions involves additions, removals, and/or changes to fields in your project’s PROJECT file, which is created by running the init command.

The PROJECT file now has a new layout. It stores more information about what resources are in use, to better enable plugins to make useful decisions when scaffolding.

Furthermore, the PROJECT file itself is now versioned. The version field corresponds to the version of the PROJECT file itself, while the layout field indicates the scaffolding and the primary plugin version in use.

Steps to migrate

The following steps describe the manual changes required to bring the project configuration file (PROJECT) up to date. These changes will add the information that Kubebuilder would add when generating the file. This file can be found in the root directory.

Add the projectName

The project name is the name of the project directory in lowercase:

...
projectName: example
...

Add the layout

The default plugin layout which is equivalent to the previous version is go.kubebuilder.io/v2:

...
layout:
- go.kubebuilder.io/v2
...

Update the version

The version field represents the version of the project configuration layout. Update it to "3":

...
version: "3"
...

Add the resource data

The attribute resources represents the list of resources scaffolded in your project.

You will need to add the following data for each resource added to the project.

Add the Kubernetes API version by adding resources[entry].api.crdVersion: v1beta1:
...
resources:
- api:
    ...
    crdVersion: v1beta1
  domain: my.domain
  group: webapp
  kind: Guestbook
  ...
Add the scope used to scaffold the CRDs by adding resources[entry].api.namespaced: true, unless they were cluster-scoped:
...
resources:
- api:
    ...
    namespaced: true
  group: webapp
  kind: Guestbook
  ...
If you have a controller scaffolded for the API, add resources[entry].controller: true:
...
resources:
- api:
    ...
  controller: true
  group: webapp
  kind: Guestbook
Add the resource domain, such as resources[entry].domain: testproject.org, which will usually be the project domain unless the API scaffolded is a core type and/or an external type:
...
resources:
- api:
    ...
  domain: testproject.org
  group: webapp
  kind: Guestbook

Note that you will only need to add the domain if your project has a scaffold for a core type API whose Domain value is not empty in the Kubernetes API group qualified scheme definition. (For example, Kinds from the apps API have no domain, while Kinds from the authentication API have the domain k8s.io.)

Check the following list to see the supported core types and their domains:

Core Type                Domain
admission                “k8s.io”
admissionregistration    “k8s.io”
apps                     empty
auditregistration        “k8s.io”
apiextensions            “k8s.io”
authentication           “k8s.io”
authorization            “k8s.io”
autoscaling              empty
batch                    empty
certificates             “k8s.io”
coordination             “k8s.io”
core                     empty
events                   “k8s.io”
extensions               empty
imagepolicy              “k8s.io”
networking               “k8s.io”
node                     “k8s.io”
metrics                  “k8s.io”
policy                   empty
rbac.authorization       “k8s.io”
scheduling               “k8s.io”
setting                  “k8s.io”
storage                  “k8s.io”

Following is an example where a controller was scaffolded for the core type Kind Deployment via the command create api --group apps --version v1 --kind Deployment --controller=true --resource=false --make=false:

- controller: true
  group: apps
  kind: Deployment
  path: k8s.io/api/apps/v1
  version: v1
Add resources[entry].path with the import path for the API:
...
resources:
- api:
    ...
  ...
  group: webapp
  kind: Guestbook
  path: example/api/v1
If your project is using webhooks, add resources[entry].webhooks.[type]: true for each type generated, and then add resources[entry].webhooks.webhookVersion: v1beta1:
resources:
- api:
    ...
  ...
  group: webapp
  kind: Guestbook
  webhooks:
    defaulting: true
    validation: true
    webhookVersion: v1beta1

Check your PROJECT file

Now ensure that your PROJECT file has the same information that would be generated by the Kubebuilder v3 CLI.

For the QuickStart example, the PROJECT file manually updated to use go.kubebuilder.io/v2 would look like:

domain: my.domain
layout:
- go.kubebuilder.io/v2
projectName: example
repo: example
resources:
- api:
    crdVersion: v1
    namespaced: true
  controller: true
  domain: my.domain
  group: webapp
  kind: Guestbook
  path: example/api/v1
  version: v1
version: "3"

You can check the differences between the previous layout (version "2") and the current format (version "3") with go.kubebuilder.io/v2 by comparing an example scenario that involves more than one API and webhook; see:

Example (Project version 2)

domain: testproject.org
repo: sigs.k8s.io/kubebuilder/example
resources:
- group: crew
  kind: Captain
  version: v1
- group: crew
  kind: FirstMate
  version: v1
- group: crew
  kind: Admiral
  version: v1
version: "2"

Example (Project version 3)

domain: testproject.org
layout:
- go.kubebuilder.io/v2
projectName: example
repo: sigs.k8s.io/kubebuilder/example
resources:
- api:
    crdVersion: v1
    namespaced: true
  controller: true
  domain: testproject.org
  group: crew
  kind: Captain
  path: example/api/v1
  version: v1
  webhooks:
    defaulting: true
    validation: true
    webhookVersion: v1
- api:
    crdVersion: v1
    namespaced: true
  controller: true
  domain: testproject.org
  group: crew
  kind: FirstMate
  path: example/api/v1
  version: v1
  webhooks:
    conversion: true
    webhookVersion: v1
- api:
    crdVersion: v1
  controller: true
  domain: testproject.org
  group: crew
  kind: Admiral
  path: example/api/v1
  plural: admirales
  version: v1
  webhooks:
    defaulting: true
    webhookVersion: v1
version: "3"

Verification

In the steps above, you updated only the PROJECT file which represents the project configuration. This configuration is useful only for the CLI tool. It should not affect how your project behaves.

There is no option to verify that you properly updated the configuration file. The best way to ensure the configuration file has the correct V3+ fields is to initialize a project with the same API(s), controller(s), and webhook(s) in order to compare generated configuration with the manually changed configuration.

If you made mistakes in the above process, you will likely face issues using the CLI.

Update your project to use go/v3 plugin

Migrating between project plugins involves additions, removals, and/or changes to files created by any plugin-supported command, e.g. init and create. A plugin supports one or more project config versions; make sure you upgrade your project’s config version to the latest supported by your target plugin version before upgrading plugin versions.

The following steps describe the manual changes required to modify the project’s layout enabling your project to use the go/v3 plugin. These steps will not help you address all the bug fixes of the already generated scaffolds.

Steps to migrate

Update your plugin version into the PROJECT file

Before updating the layout, please ensure you have followed the above steps to upgrade your Project version to 3. Once you have upgraded the project version, update the layout to the new plugin version go.kubebuilder.io/v3 as follows:

domain: my.domain
layout:
- go.kubebuilder.io/v3
...

Upgrade the Go version and its dependencies:

Ensure that your go.mod is using Go version 1.18 and the following dependency versions:

module example

go 1.18

require (
    github.com/onsi/ginkgo/v2 v2.1.4
    github.com/onsi/gomega v1.19.0
    k8s.io/api v0.24.0
    k8s.io/apimachinery v0.24.0
    k8s.io/client-go v0.24.0
    sigs.k8s.io/controller-runtime v0.12.1
)

Update the golang image

In the Dockerfile, replace:

# Build the manager binary
FROM golang:1.13 as builder

With:

# Build the manager binary
FROM golang:1.16 as builder

Update your Makefile

To allow controller-gen to scaffold the new Kubernetes APIs

To allow controller-gen and the scaffolding tool to use the new API versions, replace:

CRD_OPTIONS ?= "crd:trivialVersions=true"

With:

CRD_OPTIONS ?= "crd"
To allow automatic downloads

To allow downloading the newer versions of the Kubernetes binaries required by Envtest into the testbin/ directory of your project instead of the global setup, replace:

# Run tests
test: generate fmt vet manifests
	go test ./... -coverprofile cover.out

With:

# Setting SHELL to bash allows bash commands to be executed by recipes.
# Options are set to exit when a recipe line exits non-zero or a piped command fails.
SHELL = /usr/bin/env bash -o pipefail
.SHELLFLAGS = -ec

ENVTEST_ASSETS_DIR=$(shell pwd)/testbin
test: manifests generate fmt vet ## Run tests.
	mkdir -p ${ENVTEST_ASSETS_DIR}
	test -f ${ENVTEST_ASSETS_DIR}/setup-envtest.sh || curl -sSLo ${ENVTEST_ASSETS_DIR}/setup-envtest.sh https://raw.githubusercontent.com/kubernetes-sigs/controller-runtime/v0.8.3/hack/setup-envtest.sh
	source ${ENVTEST_ASSETS_DIR}/setup-envtest.sh; fetch_envtest_tools $(ENVTEST_ASSETS_DIR); setup_envtest_env $(ENVTEST_ASSETS_DIR); go test ./... -coverprofile cover.out
To upgrade controller-gen and kustomize dependencies versions used

To upgrade the controller-gen and kustomize version used to generate the manifests replace:

# find or download controller-gen
# download controller-gen if necessary
controller-gen:
ifeq (, $(shell which controller-gen))
	@{ \
	set -e ;\
	CONTROLLER_GEN_TMP_DIR=$$(mktemp -d) ;\
	cd $$CONTROLLER_GEN_TMP_DIR ;\
	go mod init tmp ;\
	go get sigs.k8s.io/controller-tools/cmd/controller-gen@v0.2.5 ;\
	rm -rf $$CONTROLLER_GEN_TMP_DIR ;\
	}
CONTROLLER_GEN=$(GOBIN)/controller-gen
else
CONTROLLER_GEN=$(shell which controller-gen)
endif

With:

##@ Build Dependencies

## Location to install dependencies to
LOCALBIN ?= $(shell pwd)/bin
$(LOCALBIN):
	mkdir -p $(LOCALBIN)

## Tool Binaries
KUSTOMIZE ?= $(LOCALBIN)/kustomize
CONTROLLER_GEN ?= $(LOCALBIN)/controller-gen
ENVTEST ?= $(LOCALBIN)/setup-envtest

## Tool Versions
KUSTOMIZE_VERSION ?= v3.8.7
CONTROLLER_TOOLS_VERSION ?= v0.9.0

KUSTOMIZE_INSTALL_SCRIPT ?= "https://raw.githubusercontent.com/kubernetes-sigs/kustomize/master/hack/install_kustomize.sh"
.PHONY: kustomize
kustomize: $(KUSTOMIZE) ## Download kustomize locally if necessary.
$(KUSTOMIZE): $(LOCALBIN)
	test -s $(LOCALBIN)/kustomize || { curl -Ss $(KUSTOMIZE_INSTALL_SCRIPT) | bash -s -- $(subst v,,$(KUSTOMIZE_VERSION)) $(LOCALBIN); }

.PHONY: controller-gen
controller-gen: $(CONTROLLER_GEN) ## Download controller-gen locally if necessary.
$(CONTROLLER_GEN): $(LOCALBIN)
	test -s $(LOCALBIN)/controller-gen || GOBIN=$(LOCALBIN) go install sigs.k8s.io/controller-tools/cmd/controller-gen@$(CONTROLLER_TOOLS_VERSION)

.PHONY: envtest
envtest: $(ENVTEST) ## Download envtest-setup locally if necessary.
$(ENVTEST): $(LOCALBIN)
	test -s $(LOCALBIN)/setup-envtest || GOBIN=$(LOCALBIN) go install sigs.k8s.io/controller-runtime/tools/setup-envtest@latest

And then, to make your project use the kustomize version defined in the Makefile, replace all usages of kustomize with $(KUSTOMIZE).

Update your controllers

Replace:

func (r *<MyKind>Reconciler) Reconcile(req ctrl.Request) (ctrl.Result, error) {
    ctx := context.Background()
    log := r.Log.WithValues("cronjob", req.NamespacedName)

With:

func (r *<MyKind>Reconciler) Reconcile(ctx context.Context, req ctrl.Request) (ctrl.Result, error) {
    log := r.Log.WithValues("cronjob", req.NamespacedName)

Update your controller and webhook test suite

Replace:

	. "github.com/onsi/ginkgo"

With:

	. "github.com/onsi/ginkgo/v2"

Also, adjust your test suite.

For Controller Suite:

	RunSpecsWithDefaultAndCustomReporters(t,
		"Controller Suite",
		[]Reporter{printer.NewlineReporter{}})

With:

	RunSpecs(t, "Controller Suite")

For Webhook Suite:

	RunSpecsWithDefaultAndCustomReporters(t,
		"Webhook Suite",
		[]Reporter{printer.NewlineReporter{}})

With:

	RunSpecs(t, "Webhook Suite")

Last but not least, remove the timeout variable from the BeforeSuite blocks:

Replace:

var _ = BeforeSuite(func(done Done) {
	....
}, 60)

With

var _ = BeforeSuite(func(done Done) {
	....
})

Change Logger to use flag options

In the main.go file replace:

flag.Parse()

ctrl.SetLogger(zap.New(zap.UseDevMode(true)))

With:

opts := zap.Options{
	Development: true,
}
opts.BindFlags(flag.CommandLine)
flag.Parse()

ctrl.SetLogger(zap.New(zap.UseFlagOptions(&opts)))

Rename the manager flags

The manager flags --metrics-addr and enable-leader-election were renamed to --metrics-bind-address and --leader-elect to be more aligned with core Kubernetes Components. More info: #1839.

In your main.go file replace:

func main() {
	var metricsAddr string
	var enableLeaderElection bool
	flag.StringVar(&metricsAddr, "metrics-addr", ":8080", "The address the metric endpoint binds to.")
	flag.BoolVar(&enableLeaderElection, "enable-leader-election", false,
		"Enable leader election for controller manager. "+
			"Enabling this will ensure there is only one active controller manager.")

With:

func main() {
	var metricsAddr string
	var enableLeaderElection bool
	flag.StringVar(&metricsAddr, "metrics-bind-address", ":8080", "The address the metric endpoint binds to.")
	flag.BoolVar(&enableLeaderElection, "leader-elect", false,
		"Enable leader election for controller manager. "+
			"Enabling this will ensure there is only one active controller manager.")

And then, rename the flags in the config/default/manager_auth_proxy_patch.yaml and config/default/manager.yaml:

- name: manager
args:
- "--health-probe-bind-address=:8081"
- "--metrics-bind-address=127.0.0.1:8080"
- "--leader-elect"

Verification

Finally, we can run make and make docker-build to ensure things are working fine.

Change your project to remove the Kubernetes deprecated API versions usage

The following steps describe a workflow to upgrade your project to remove the deprecated Kubernetes APIs: apiextensions.k8s.io/v1beta1, admissionregistration.k8s.io/v1beta1, cert-manager.io/v1alpha2.

The Kubebuilder CLI tool does not support scaffolding resources for both Kubernetes API versions at once, e.g. an API/CRD with apiextensions.k8s.io/v1beta1 and another one with apiextensions.k8s.io/v1.

The first step is to update your PROJECT file by replacing api.crdVersion: v1beta1 and webhooks.webhookVersion: v1beta1 with api.crdVersion: v1 and webhooks.webhookVersion: v1, which would look like:

domain: my.domain
layout: go.kubebuilder.io/v3
projectName: example
repo: example
resources:
- api:
    crdVersion: v1
    namespaced: true
  group: webapp
  kind: Guestbook
  version: v1
  webhooks:
    defaulting: true
    webhookVersion: v1
version: "3"

Now, re-create the APIs (CRDs) and webhook manifests by running the kubebuilder create api and kubebuilder create webhook commands again for the same group, kind, and versions, passing the --force flag to overwrite the existing scaffolds.

V3 - Plugins Layout Migration Guides

The following are the migration guides for the plugin versions. Note that the plugin ecosystem was introduced with the Kubebuilder v3.0.0 release, and go/v3 has been the default layout since 28 Apr 2021.

Therefore, you can check here how to migrate projects built with Kubebuilder 3.x and the go/v3 plugin to the latest layout.

go/v3 vs go/v4

This document covers all breaking changes when migrating from projects built using the plugin go/v3 (default for any scaffold done since 28 Apr 2021) to the next alpha version of the Golang plugin go/v4.

The details of all changes (breaking or otherwise) can be found in:

Common changes

  • go/v4 projects use Kustomize v5.x (instead of v3.x)
  • note that some manifests under the config/ directory have been changed so that they no longer use deprecated Kustomize features such as env vars.
  • A kustomization.yaml is scaffolded under config/samples. This helps you simply and flexibly generate sample manifests: kustomize build config/samples.
  • adds support for Apple Silicon M1 (darwin/arm64)
  • removes support for the CRD/Webhook Kubernetes API v1beta1 versions, which are no longer supported since k8s 1.22
  • no longer scaffolds webhook test files with "k8s.io/api/admission/v1beta1", which is no longer served since k8s 1.25. By default, webhook test files are scaffolded using "k8s.io/api/admission/v1", which is supported since k8s 1.20
  • no longer provides backwards-compatible support for k8s versions < 1.16
  • changes the layout to accommodate the community request to follow the Standard Go Project Layout: the api(s) move under a new directory called api, the controller(s) under a new directory called internal, and main.go under a new directory named cmd

TL;DR of the New go/v4 Plugin

More details on this can be found here; the highlights are the common changes listed above.

Migrating to Kubebuilder go/v4

If you want to upgrade your scaffolding to use the latest and greatest features, follow the guide below, which covers the steps in the most straightforward way to upgrade your project and pick up all the latest changes and improvements.

By updating the files manually

If you want to use the latest version of the Kubebuilder CLI without changing your scaffolding, check the following guide, which describes the manual steps required to upgrade only your PROJECT version and start using the plugin versions.

This way is more complex, susceptible to errors, and success cannot be assured. Also, by following these steps you will not get the improvements and bug fixes in the default generated project files.

Migration from go/v3 to go/v4

Make sure you understand the differences between Kubebuilder go/v3 and go/v4 before continuing.

Please ensure you have followed the installation guide to install the required components.

The recommended way to migrate a go/v3 project is to create a new go/v4 project and copy over the API and the reconciliation code. The conversion will end up with a project that looks like a native go/v4 project layout (latest version).

However, in some cases, it’s possible to do an in-place upgrade (i.e. reuse the go/v3 project layout, upgrading the PROJECT file, and scaffolds manually). For further information see Migration from go/v3 to go/v4 by updating the files manually

Initialize a go/v4 Project

Create a new directory with the name of your project. Note that this name is used in the scaffolds to create the name of your manager Pod and of the Namespace where the Manager is deployed by default.

$ mkdir migration-project-name
$ cd migration-project-name

Now, we need to initialize a go/v4 project. Before we do that, we’ll need to initialize a new go module if we’re not on the GOPATH. While technically this is not needed inside GOPATH, it is still recommended.

go mod init tutorial.kubebuilder.io/migration-project

Now, we can finish initializing the project with kubebuilder.

kubebuilder init --domain tutorial.kubebuilder.io --plugins=go/v4

Migrate APIs and Controllers

Next, we’ll re-scaffold out the API types and controllers.

kubebuilder create api --group batch --version v1 --kind CronJob

Migrate the APIs

Now, let’s copy the API definition from api/v1/<kind>_types.go in our old project to the new one.

These files have not been modified by the new plugin, so you should be able to replace your freshly scaffolded files with your old ones. There may be some cosmetic changes, so you can choose to copy only the types themselves.

Migrate the Controllers

Now, let’s migrate the controller code from controllers/cronjob_controller.go in our old project to the new one.
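
Keep in mind that in the go/v4 layout the controller lives under internal/controller and its package is named controller (singular), so the copied code needs its package clause adjusted. A minimal sketch, assuming the standard scaffold:

// internal/controller/cronjob_controller.go (was controllers/cronjob_controller.go)
package controller // was: package controllers

import (
	"context"

	"k8s.io/apimachinery/pkg/runtime"
	ctrl "sigs.k8s.io/controller-runtime"
	"sigs.k8s.io/controller-runtime/pkg/client"
)

// CronJobReconciler reconciles a CronJob object.
type CronJobReconciler struct {
	client.Client
	Scheme *runtime.Scheme
}

// Reconcile receives the reconciliation logic copied from the go/v3 project.
func (r *CronJobReconciler) Reconcile(ctx context.Context, req ctrl.Request) (ctrl.Result, error) {
	// ... reconciliation logic copied over unchanged ...
	return ctrl.Result{}, nil
}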

Migrate the Webhooks

Now let’s scaffold the webhooks for our CRD (CronJob). We’ll need to run the following command with the --defaulting and --programmatic-validation flags (since our test project uses defaulting and validating webhooks):

kubebuilder create webhook --group batch --version v1 --kind CronJob --defaulting --programmatic-validation

Now, let’s copy the webhook definition from api/v1/<kind>_webhook.go from our old project to the new one.
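
The webhook methods themselves are copied as-is; only the surrounding scaffold (markers and SetupWebhookWithManager) is regenerated for you. A minimal sketch with the bodies elided (exact method signatures depend on your controller-runtime version):

// api/v1/cronjob_webhook.go (excerpt)
package v1

import (
	ctrl "sigs.k8s.io/controller-runtime"
)

// SetupWebhookWithManager registers the webhook with the manager
// (re-scaffolded by `kubebuilder create webhook`).
func (r *CronJob) SetupWebhookWithManager(mgr ctrl.Manager) error {
	return ctrl.NewWebhookManagedBy(mgr).
		For(r).
		Complete()
}

// Default contains the defaulting logic copied from the go/v3 project.
func (r *CronJob) Default() {
	// ... defaulting logic copied over unchanged ...
}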

Others

If there are any manual updates in main.go in v3, we need to port the changes to the new main.go. We’ll also need to ensure that all of the needed controller-runtime schemes have been registered.
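
Scheme registration in the scaffolded cmd/main.go typically looks like the excerpt below; make sure every API group your controllers use is added there (the module path matches the go mod init command above and may differ in your project):

// excerpt from cmd/main.go (func main omitted)
package main

import (
	"k8s.io/apimachinery/pkg/runtime"
	utilruntime "k8s.io/apimachinery/pkg/util/runtime"
	clientgoscheme "k8s.io/client-go/kubernetes/scheme"

	batchv1 "tutorial.kubebuilder.io/migration-project/api/v1"
	// +kubebuilder:scaffold:imports
)

var scheme = runtime.NewScheme()

func init() {
	// Built-in Kubernetes types (Pods, Deployments, ...).
	utilruntime.Must(clientgoscheme.AddToScheme(scheme))
	// Your own API group(s); add one line per group your controllers need.
	utilruntime.Must(batchv1.AddToScheme(scheme))
	// +kubebuilder:scaffold:scheme
}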

If there are additional manifests added under the config directory, port them as well. Please be aware that go/v4 uses Kustomize v5 and no longer Kustomize v4. Therefore, if you added customized implementations under config, you need to ensure that they work with Kustomize v5 and, if not, update them to address any breaking changes that you might face.

In v4, the installation of Kustomize has been changed from a bash script to go install. Change the kustomize dependency in the Makefile to:

.PHONY: kustomize
kustomize: $(KUSTOMIZE) ## Download kustomize locally if necessary. If wrong version is installed, it will be removed before downloading.
$(KUSTOMIZE): $(LOCALBIN)
	@if test -x $(LOCALBIN)/kustomize && ! $(LOCALBIN)/kustomize version | grep -q $(KUSTOMIZE_VERSION); then \
		echo "$(LOCALBIN)/kustomize version is not expected $(KUSTOMIZE_VERSION). Removing it before installing."; \
		rm -rf $(LOCALBIN)/kustomize; \
	fi
	test -s $(LOCALBIN)/kustomize || GOBIN=$(LOCALBIN) GO111MODULE=on go install sigs.k8s.io/kustomize/kustomize/v5@$(KUSTOMIZE_VERSION)

Change the image name in the Makefile if needed.

Verification

Finally, we can run make and make docker-build to ensure things are working fine.

Migration from go/v3 to go/v4 by updating the files manually

Make sure you understand the differences between Kubebuilder go/v3 and go/v4 before continuing.

Please ensure you have followed the installation guide to install the required components.

The following guide describes the manual steps required to upgrade your PROJECT config file to begin using go/v4.

This approach is more complex and error-prone, and success cannot be assured. Also, by following these steps you will not get the improvements and bug fixes in the default generated project files.

Usually it is suggested to do it manually if you have customized your project and deviated too much from the proposed scaffold. Before continuing, ensure that you understand the note about project customizations. Note that you might need to spend more effort to do this process manually than to organize your project customizations. The proposed layout will keep your project maintainable and upgradable with less effort in the future.

The recommended upgrade approach is to follow the Migration Guide go/v3 to go/v4 instead.

Migration from project config version “go/v3” to “go/v4”

Update the PROJECT file layout, which stores information about the resources and is used by plugins to make useful decisions while scaffolding. The layout field indicates the scaffolding and the primary plugin version in use.

Steps to migrate

Migrate the layout version into the PROJECT file

The following steps describe the manual changes required to bring the project configuration file (PROJECT) up to date. These changes will add the information that Kubebuilder would add when generating the file. This file can be found in the root directory.

Update the PROJECT file by replacing:

layout:
- go.kubebuilder.io/v3

With:

layout:
- go.kubebuilder.io/v4

Changes to the layout

New layout:
  • The directory apis was renamed to api to follow the standard
  • The controller(s) directory has been moved under a new directory called internal and renamed to the singular controller
  • The main.go previously scaffolded in the root directory has been moved under a new directory called cmd

Therefore, the changes in the layout result in:

...
├── cmd
│ └── main.go
├── internal
│ └── controller
└── api

Migrating to the new layout:
  • Create a new directory cmd and move the main.go under it.
  • If your project supports multi-group, the APIs are scaffolded under a directory called apis. Rename this directory to api.
  • Move the controllers directory under internal and rename it to controller.
  • Now ensure that the imports are updated accordingly:
    • Update the main.go imports to look for the new path of your controllers under the internal/controller directory (see the sketch below).
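
For example, the changed import line in cmd/main.go would look roughly like this (the module path below is a placeholder for your own; note that the package name also changes from controllers to controller, so references such as controllers.CronJobReconciler become controller.CronJobReconciler):

// Before (go/v3 layout):
//   "tutorial.kubebuilder.io/migration-project/controllers"
// After (go/v4 layout):
"tutorial.kubebuilder.io/migration-project/internal/controller"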

Then, let’s update the scaffold paths

  • Update the Dockerfile to ensure that you will have:
COPY cmd/main.go cmd/main.go
COPY api/ api/
COPY internal/controller/ internal/controller/

Then, replace:

RUN CGO_ENABLED=0 GOOS=${TARGETOS:-linux} GOARCH=${TARGETARCH} go build -a -o manager main.go

With:

RUN CGO_ENABLED=0 GOOS=${TARGETOS:-linux} GOARCH=${TARGETARCH} go build -a -o manager cmd/main.go
  • Update the Makefile targets to build and run the manager by replacing:
.PHONY: build
build: manifests generate fmt vet ## Build manager binary.
	go build -o bin/manager main.go

.PHONY: run
run: manifests generate fmt vet ## Run a controller from your host.
	go run ./main.go

With:

.PHONY: build
build: manifests generate fmt vet ## Build manager binary.
	go build -o bin/manager cmd/main.go

.PHONY: run
run: manifests generate fmt vet ## Run a controller from your host.
	go run ./cmd/main.go
  • Update the internal/controller/suite_test.go to set the path for the CRDDirectoryPaths:

Replace:

CRDDirectoryPaths:     []string{filepath.Join("..", "config", "crd", "bases")},

With:

CRDDirectoryPaths:     []string{filepath.Join("..", "..", "config", "crd", "bases")},

Note that if your project has multiple groups (multigroup: true), then the above update should use "..", "..", ".." instead of "..", "..".
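In other words, for a multi-group layout the line in internal/controller/<group>/suite_test.go would typically look like the following (the extra ".." accounts for the additional group directory level):

CRDDirectoryPaths:     []string{filepath.Join("..", "..", "..", "config", "crd", "bases")},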

Now, let’s update the path entries in the PROJECT file accordingly

The PROJECT tracks the paths of all APIs used in your project. Ensure that they now point to api/... as the following example:

Before update:

  group: crew
  kind: Captain
  path: sigs.k8s.io/kubebuilder/testdata/project-v4/apis/crew/v1

After Update:


  group: crew
  kind: Captain
  path: sigs.k8s.io/kubebuilder/testdata/project-v4/api/crew/v1

Update kustomize manifests with the changes made so far

  • Update the manifests under the config/ directory with all changes performed in the default scaffold done with the go/v4 plugin (see, for example, testdata/project-v4/config/) so that all changes in the default scaffolds are applied to your project
  • Create config/samples/kustomization.yaml listing all the Custom Resource samples under config/samples (see, for example, testdata/project-v4/config/samples/kustomization.yaml)

If you have webhooks:

Replace the import admissionv1beta1 "k8s.io/api/admission/v1beta1" with admissionv1 "k8s.io/api/admission/v1" in the webhook test files.

Makefile updates

Update the Makefile with the changes which can be found in the samples under testdata for the release tag used (see, for example, testdata/project-v4/Makefile).

Update the dependencies

Update the go.mod with the changes which can be found in the samples under testdata for the release tag used (see, for example, testdata/project-v4/go.mod). Then, run go mod tidy to ensure that you get the latest dependencies and that your Go code has no breaking changes.

Verification

In the steps above, you updated your project manually with the goal of ensuring that it follows the changes in the layout introduced with the go/v4 plugin, which updates the scaffolds.

There is no automated way to verify that you properly updated the PROJECT file of your project. The best way to ensure that everything is updated correctly is to initialize a project using the go/v4 plugin, i.e. using kubebuilder init --domain tutorial.kubebuilder.io --plugins=go/v4, and to generate the same API(s), controller(s), and webhook(s) in order to compare the generated configuration with the manually changed configuration.

Also, after all updates, run the following commands:

  • make manifests (to re-generate the files using the latest version of controller-gen after you update the Makefile)
  • make all (to ensure that you are able to build and perform all operations)

Single Group to Multi-Group

Let’s migrate the CronJob example.

To change the layout of your project to support Multi-Group, run the command kubebuilder edit --multigroup=true. Once you switch to a multi-group layout, the new Kinds will be generated in the new layout, but additional manual work is needed to move the old API groups to the new layout.

Generally, we use the prefix for the API group as the directory name. We can check api/v1/groupversion_info.go to find that out:

// +groupName=batch.tutorial.kubebuilder.io
package v1

Then, we’ll move our existing APIs into a new subdirectory, “batch”:

mkdir api/batch
mv api/* api/batch

After moving the APIs to a new directory, the same needs to be applied to the controllers. For go/v4:

mkdir internal/controller/batch
mv internal/controller/* internal/controller/batch/
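
Since the controllers now sit one directory deeper, their import path in cmd/main.go has to follow the new location as well; a rough sketch of the change, assuming the CronJob tutorial’s module path:

// cmd/main.go
// Before the move:
//   "tutorial.kubebuilder.io/project/internal/controller"
// After the move:
//   "tutorial.kubebuilder.io/project/internal/controller/batch"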