Skip to content

Commit

Permalink
KEP-2170: Expose the TrainingRuntime and ClusterTrainingRuntime Kind
Browse files Browse the repository at this point in the history
Signed-off-by: Yuki Iwai <[email protected]>
  • Loading branch information
tenzen-y committed Oct 14, 2024
1 parent a0cae9a commit a527f86
Show file tree
Hide file tree
Showing 8 changed files with 19 additions and 11 deletions.
7 changes: 7 additions & 0 deletions pkg/apis/kubeflow.org/v2alpha1/trainingruntime_types.go
Original file line number Diff line number Diff line change
Expand Up @@ -22,6 +22,13 @@ import (
jobsetv1alpha2 "sigs.k8s.io/jobset/api/jobset/v1alpha2"
)

const (
// TrainingRuntimeKind is the GroupVersionKind Kind name for the TrainingRuntime.
TrainingRuntimeKind string = "TrainingRuntime"
// ClusterTrainingRuntimeKind is the GroupVersionKind Kind name for the ClusterTrainingRuntime.
ClusterTrainingRuntimeKind string = "ClusterTrainingRuntime"
)

// +genclient
// +genclient:nonNamespaced
// +k8s:deepcopy-gen:interfaces=k8s.io/apimachinery/pkg/runtime.Object
Expand Down
2 changes: 1 addition & 1 deletion pkg/runtime.v2/core/clustertrainingruntime.go
Original file line number Diff line number Diff line change
Expand Up @@ -42,7 +42,7 @@ var _ runtime.Runtime = (*ClusterTrainingRuntime)(nil)

var ClusterTrainingRuntimeGroupKind = schema.GroupKind{
Group: kubeflowv2.GroupVersion.Group,
Kind: "ClusterTrainingRuntime",
Kind: kubeflowv2.ClusterTrainingRuntimeKind,
}.String()

func NewClusterTrainingRuntime(context.Context, client.Client, client.FieldIndexer) (runtime.Runtime, error) {
Expand Down
4 changes: 2 additions & 2 deletions pkg/runtime.v2/core/clustertrainingruntime_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -47,7 +47,7 @@ func TestClusterTrainingRuntimeNewObjects(t *testing.T) {
"succeeded to build JobSet and PodGroup": {
trainJob: testingutil.MakeTrainJobWrapper(t, metav1.NamespaceDefault, "test-job").
UID("uid").
TrainingRuntimeRef(kubeflowv2.SchemeGroupVersion.WithKind("ClusterTrainingRuntime"), "test-runtime").
TrainingRuntimeRef(kubeflowv2.SchemeGroupVersion.WithKind(kubeflowv2.ClusterTrainingRuntimeKind), "test-runtime").
Trainer(
testingutil.MakeTrainJobTrainerWrapper(t).
ContainerImage("test:trainjob").
Expand Down Expand Up @@ -93,7 +93,7 @@ func TestClusterTrainingRuntimeNewObjects(t *testing.T) {
"missing trainingRuntime resource": {
trainJob: testingutil.MakeTrainJobWrapper(t, metav1.NamespaceDefault, "test-job").
UID("uid").
TrainingRuntimeRef(kubeflowv2.SchemeGroupVersion.WithKind("ClusterTrainingRuntime"), "test-runtime").
TrainingRuntimeRef(kubeflowv2.SchemeGroupVersion.WithKind(kubeflowv2.ClusterTrainingRuntimeKind), "test-runtime").
Trainer(
testingutil.MakeTrainJobTrainerWrapper(t).
ContainerImage("test:trainjob").
Expand Down
2 changes: 1 addition & 1 deletion pkg/runtime.v2/core/trainingruntime.go
Original file line number Diff line number Diff line change
Expand Up @@ -49,7 +49,7 @@ type TrainingRuntime struct {

var TrainingRuntimeGroupKind = schema.GroupKind{
Group: kubeflowv2.GroupVersion.Group,
Kind: "TrainingRuntime",
Kind: kubeflowv2.TrainingRuntimeKind,
}.String()

var _ runtime.Runtime = (*TrainingRuntime)(nil)
Expand Down
4 changes: 2 additions & 2 deletions pkg/runtime.v2/core/trainingruntime_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -47,7 +47,7 @@ func TestTrainingRuntimeNewObjects(t *testing.T) {
"succeeded to build JobSet and PodGroup": {
trainJob: testingutil.MakeTrainJobWrapper(t, metav1.NamespaceDefault, "test-job").
UID("uid").
TrainingRuntimeRef(kubeflowv2.SchemeGroupVersion.WithKind("TrainingRuntime"), "test-runtime").
TrainingRuntimeRef(kubeflowv2.SchemeGroupVersion.WithKind(kubeflowv2.TrainingRuntimeKind), "test-runtime").
Trainer(
testingutil.MakeTrainJobTrainerWrapper(t).
ContainerImage("test:trainjob").
Expand Down Expand Up @@ -93,7 +93,7 @@ func TestTrainingRuntimeNewObjects(t *testing.T) {
"missing trainingRuntime resource": {
trainJob: testingutil.MakeTrainJobWrapper(t, metav1.NamespaceDefault, "test-job").
UID("uid").
TrainingRuntimeRef(kubeflowv2.SchemeGroupVersion.WithKind("TrainingRuntime"), "test-runtime").
TrainingRuntimeRef(kubeflowv2.SchemeGroupVersion.WithKind(kubeflowv2.TrainingRuntimeKind), "test-runtime").
Trainer(
testingutil.MakeTrainJobTrainerWrapper(t).
ContainerImage("test:trainjob").
Expand Down
2 changes: 1 addition & 1 deletion pkg/runtime.v2/indexer/indexer.go
Original file line number Diff line number Diff line change
Expand Up @@ -38,7 +38,7 @@ func IndexTrainJobTrainingRuntimes(obj client.Object) []string {
Kind: ptr.Deref(trainJob.Spec.TrainingRuntimeRef.Kind, ""),
}
if runtimeRefGroupKind.Group == kubeflowv2.GroupVersion.Group &&
(runtimeRefGroupKind.Kind == "TrainingRuntime" || runtimeRefGroupKind.Kind == "ClusterTrainingRuntime") {
(runtimeRefGroupKind.Kind == kubeflowv2.TrainingRuntimeKind || runtimeRefGroupKind.Kind == kubeflowv2.ClusterTrainingRuntimeKind) {
return []string{trainJob.Spec.TrainingRuntimeRef.Name}
}
return nil
Expand Down
4 changes: 2 additions & 2 deletions pkg/util.v2/testing/wrapper.go
Original file line number Diff line number Diff line change
Expand Up @@ -238,7 +238,7 @@ func MakeTrainingRuntimeWrapper(t *testing.T, namespace, name string) *TrainingR
TrainingRuntime: kubeflowv2.TrainingRuntime{
TypeMeta: metav1.TypeMeta{
APIVersion: kubeflowv2.SchemeGroupVersion.String(),
Kind: "TrainingRuntime",
Kind: kubeflowv2.TrainingRuntimeKind,
},
ObjectMeta: metav1.ObjectMeta{
Namespace: namespace,
Expand Down Expand Up @@ -309,7 +309,7 @@ func MakeClusterTrainingRuntimeWrapper(t *testing.T, name string) *ClusterTraini
ClusterTrainingRuntime: kubeflowv2.ClusterTrainingRuntime{
TypeMeta: metav1.TypeMeta{
APIVersion: kubeflowv2.SchemeGroupVersion.String(),
Kind: "ClusterTrainingRuntime",
Kind: kubeflowv2.ClusterTrainingRuntimeKind,
},
ObjectMeta: metav1.ObjectMeta{
Name: name,
Expand Down
5 changes: 3 additions & 2 deletions pkg/webhook.v2/setup.go
Original file line number Diff line number Diff line change
Expand Up @@ -19,15 +19,16 @@ package webhookv2
import (
ctrl "sigs.k8s.io/controller-runtime"

kubeflowv2 "github.com/kubeflow/training-operator/pkg/apis/kubeflow.org/v2alpha1"
runtime "github.com/kubeflow/training-operator/pkg/runtime.v2"
)

func Setup(mgr ctrl.Manager, runtimes map[string]runtime.Runtime) (string, error) {
if err := setupWebhookForClusterTrainingRuntime(mgr, runtimes); err != nil {
return "ClusterTrainingRuntime", err
return kubeflowv2.ClusterTrainingRuntimeKind, err
}
if err := setupWebhookForTrainingRuntime(mgr, runtimes); err != nil {
return "TrainingRuntime", err
return kubeflowv2.TrainingRuntimeKind, err
}
if err := setupWebhookForTrainJob(mgr, runtimes); err != nil {
return "TrainJob", err
Expand Down

0 comments on commit a527f86

Please sign in to comment.