--- apiVersion: apiextensions.k8s.io/v1 kind: CustomResourceDefinition metadata: name: mpijobs.kubeflow.org spec: group: kubeflow.org names: kind: MPIJob plural: mpijobs shortNames: - mj - mpij singular: mpijob scope: Namespaced versions: - name: v2beta1 schema: openAPIV3Schema: properties: spec: properties: mpiImplementation: enum: - OpenMPI - Intel type: string mpiReplicaSpecs: properties: Launcher: properties: replicas: maximum: 1 minimum: 1 type: integer restartPolicy: enum: - Never - OnFailure type: string template: type: object x-kubernetes-preserve-unknown-fields: true type: object Worker: properties: replicas: minimum: 1 type: integer restartPolicy: enum: - Never - OnFailure type: string template: type: object x-kubernetes-preserve-unknown-fields: true type: object required: - Launcher type: object runPolicy: properties: activeDeadlineSeconds: description: | Defines the duration in seconds, relative to its start time, that the launcher Job may be active before the system tries to terminate it. Defaults to infinite. minimum: 0 type: integer backoffLimit: description: Specifies the number of retries before marking the launcher Job as failed. Defaults to 6. minimum: 0 type: integer cleanPodPolicy: description: Defines which worker Pods must be deleted after the Job completes enum: - None - Running - All type: string ttlSecondsAfterFinished: description: | Defines the TTL to clean up the launcher Job. Defaults to infinite. Requires kubernetes 1.21+. minimum: 0 type: integer type: object slotsPerWorker: minimum: 1 type: integer sshAuthMountPath: type: string type: object status: properties: completionTime: format: date-time type: string conditions: items: properties: lastTransitionTime: format: date-time type: string lastUpdateTime: format: date-time type: string message: type: string reason: type: string status: enum: - "True" - "False" - Unknown type: string type: enum: - Created - Running - Restarting - Succeeded - Failed type: string type: object type: array lastReconcileTime: format: date-time type: string replicaStatuses: properties: Launcher: properties: active: type: integer failed: type: integer succeeded: type: integer type: object Worker: properties: active: type: integer failed: type: integer succeeded: type: integer type: object type: object startTime: format: date-time type: string type: object type: object served: true storage: true subresources: status: {}