training

package
v0.9.14 Latest Latest
Warning

This package is not in the latest version of its module.

Go to latest
Published: Apr 10, 2024 License: Apache-2.0 Imports: 5 Imported by: 8

Documentation

Index

Constants

This section is empty.

Variables

View Source
var DefaultCommonSubmitArgs = types.CommonSubmitArgs{
	WorkingDir:  "/root",
	WorkerCount: 1,
	Shell:       "sh",
}
View Source
var DefaultSubmitTensorboardArgs = types.SubmitTensorboardArgs{
	TensorboardImage: "registry.cn-zhangjiakou.aliyuncs.com/acs/tensorflow:1.12.0-devel",
	TrainingLogdir:   "/training_logs",
}

Functions

This section is empty.

Types

type DeepSpeedJobBuilder added in v0.9.9

type DeepSpeedJobBuilder struct {
	argsbuilder.ArgsBuilder
	// contains filtered or unexported fields
}

func NewDeepSpeedJobBuilder added in v0.9.9

func NewDeepSpeedJobBuilder() *DeepSpeedJobBuilder

func (*DeepSpeedJobBuilder) Annotations added in v0.9.9

func (b *DeepSpeedJobBuilder) Annotations(annotations map[string]string) *DeepSpeedJobBuilder

Annotations is used to add annotations for job pods,match option --annotation

func (*DeepSpeedJobBuilder) Build added in v0.9.9

func (b *DeepSpeedJobBuilder) Build() (*Job, error)

Build is used to build the job

func (*DeepSpeedJobBuilder) CPU added in v0.9.9

CPU assigns CPU limits; matches option --cpu

func (*DeepSpeedJobBuilder) Command added in v0.9.9

func (b *DeepSpeedJobBuilder) Command(args []string) *DeepSpeedJobBuilder

Command is used to set job command

func (*DeepSpeedJobBuilder) ConfigFiles added in v0.9.9

func (b *DeepSpeedJobBuilder) ConfigFiles(files map[string]string) *DeepSpeedJobBuilder

ConfigFiles is used to map config files from local to job containers; matches option --config-file

func (*DeepSpeedJobBuilder) DataDirs added in v0.9.9

func (b *DeepSpeedJobBuilder) DataDirs(volumes map[string]string) *DeepSpeedJobBuilder

DataDirs is used to mount host files to job containers,match option --data-dir

func (*DeepSpeedJobBuilder) Datas added in v0.9.9

func (b *DeepSpeedJobBuilder) Datas(volumes map[string]string) *DeepSpeedJobBuilder

Datas is used to mount k8s pvc to job pods,match option --data

func (*DeepSpeedJobBuilder) EnableRDMA added in v0.9.9

func (b *DeepSpeedJobBuilder) EnableRDMA() *DeepSpeedJobBuilder

EnableRDMA is used to enable RDMA; matches option --rdma

func (*DeepSpeedJobBuilder) EnableTensorboard added in v0.9.9

func (b *DeepSpeedJobBuilder) EnableTensorboard() *DeepSpeedJobBuilder

EnableTensorboard is used to enable tensorboard

func (*DeepSpeedJobBuilder) Envs added in v0.9.9

Envs is used to set env of job containers,match option --env

func (*DeepSpeedJobBuilder) GPUCount added in v0.9.9

func (b *DeepSpeedJobBuilder) GPUCount(count int) *DeepSpeedJobBuilder

GPUCount is used to set count of gpu for the job,match the option --gpus

func (*DeepSpeedJobBuilder) Image added in v0.9.9

Image is used to set job image,match the option --image

func (*DeepSpeedJobBuilder) ImagePullSecrets added in v0.9.9

func (b *DeepSpeedJobBuilder) ImagePullSecrets(secrets []string) *DeepSpeedJobBuilder

ImagePullSecrets is used to set image pull secrets; matches option --image-pull-secret

func (*DeepSpeedJobBuilder) Labels added in v0.9.9

func (b *DeepSpeedJobBuilder) Labels(labels map[string]string) *DeepSpeedJobBuilder

Labels is used to add labels for job

func (*DeepSpeedJobBuilder) LogDir added in v0.9.9

LogDir is used to set log directory,match option --logdir

func (*DeepSpeedJobBuilder) Memory added in v0.9.9

func (b *DeepSpeedJobBuilder) Memory(memory string) *DeepSpeedJobBuilder

Memory assign memory limits,match option --memory

func (*DeepSpeedJobBuilder) Name added in v0.9.9

Name is used to set job name,match option --name

func (*DeepSpeedJobBuilder) NodeSelectors added in v0.9.9

func (b *DeepSpeedJobBuilder) NodeSelectors(selectors map[string]string) *DeepSpeedJobBuilder

NodeSelectors is used to set node selectors for scheduling job,match option --selector

func (*DeepSpeedJobBuilder) Priority added in v0.9.9

func (b *DeepSpeedJobBuilder) Priority(priority string) *DeepSpeedJobBuilder

Priority sets the priority

func (*DeepSpeedJobBuilder) Shell added in v0.9.9

Shell is used to set bash or sh

func (*DeepSpeedJobBuilder) SyncImage added in v0.9.9

func (b *DeepSpeedJobBuilder) SyncImage(image string) *DeepSpeedJobBuilder

SyncImage is used to set syncing image,match option --sync-image

func (*DeepSpeedJobBuilder) SyncMode added in v0.9.9

func (b *DeepSpeedJobBuilder) SyncMode(mode string) *DeepSpeedJobBuilder

SyncMode is used to set syncing mode,match option --sync-mode

func (*DeepSpeedJobBuilder) SyncSource added in v0.9.9

func (b *DeepSpeedJobBuilder) SyncSource(source string) *DeepSpeedJobBuilder

SyncSource is used to set syncing source,match option --sync-source

func (*DeepSpeedJobBuilder) TensorboardImage added in v0.9.9

func (b *DeepSpeedJobBuilder) TensorboardImage(image string) *DeepSpeedJobBuilder

TensorboardImage is used to set the tensorboard image

func (*DeepSpeedJobBuilder) Tolerations added in v0.9.9

func (b *DeepSpeedJobBuilder) Tolerations(tolerations []string) *DeepSpeedJobBuilder

Tolerations is used to set the node tolerations of the job; matches option --toleration

func (*DeepSpeedJobBuilder) WorkerCount added in v0.9.9

func (b *DeepSpeedJobBuilder) WorkerCount(count int) *DeepSpeedJobBuilder

WorkerCount is used to set count of worker

func (*DeepSpeedJobBuilder) WorkingDir added in v0.9.9

func (b *DeepSpeedJobBuilder) WorkingDir(dir string) *DeepSpeedJobBuilder

WorkingDir is used to set the working directory of job containers (default is '/root'); matches option --working-dir

type ETJobBuilder

type ETJobBuilder struct {
	argsbuilder.ArgsBuilder
	// contains filtered or unexported fields
}

func NewETJobBuilder

func NewETJobBuilder() *ETJobBuilder

func (*ETJobBuilder) Annotations

func (b *ETJobBuilder) Annotations(annotations map[string]string) *ETJobBuilder

Annotations is used to add annotations for job pods,match option --annotation

func (*ETJobBuilder) Build

func (b *ETJobBuilder) Build() (*Job, error)

Build is used to build the job

func (*ETJobBuilder) CPU

func (b *ETJobBuilder) CPU(cpu string) *ETJobBuilder

CPU assigns CPU limits; matches option --cpu

func (*ETJobBuilder) Command

func (b *ETJobBuilder) Command(args []string) *ETJobBuilder

Command is used to set job command

func (*ETJobBuilder) ConfigFiles

func (b *ETJobBuilder) ConfigFiles(files map[string]string) *ETJobBuilder

ConfigFiles is used to map config files from local to job containers; matches option --config-file

func (*ETJobBuilder) DataDirs

func (b *ETJobBuilder) DataDirs(volumes map[string]string) *ETJobBuilder

DataDirs is used to mount host files to job containers,match option --data-dir

func (*ETJobBuilder) Datas

func (b *ETJobBuilder) Datas(volumes map[string]string) *ETJobBuilder

Datas is used to mount k8s pvc to job pods,match option --data

func (*ETJobBuilder) EnableRDMA

func (b *ETJobBuilder) EnableRDMA() *ETJobBuilder

EnableRDMA is used to enable RDMA; matches option --rdma

func (*ETJobBuilder) EnableTensorboard

func (b *ETJobBuilder) EnableTensorboard() *ETJobBuilder

EnableTensorboard is used to enable tensorboard

func (*ETJobBuilder) Envs

func (b *ETJobBuilder) Envs(envs map[string]string) *ETJobBuilder

Envs is used to set env of job containers,match option --env

func (*ETJobBuilder) GPUCount

func (b *ETJobBuilder) GPUCount(count int) *ETJobBuilder

GPUCount is used to set count of gpu for the job,match the option --gpus

func (*ETJobBuilder) Image

func (b *ETJobBuilder) Image(image string) *ETJobBuilder

Image is used to set job image,match the option --image

func (*ETJobBuilder) ImagePullSecrets

func (b *ETJobBuilder) ImagePullSecrets(secrets []string) *ETJobBuilder

ImagePullSecrets is used to set image pull secrets; matches option --image-pull-secret

func (*ETJobBuilder) Labels added in v0.8.7

func (b *ETJobBuilder) Labels(labels map[string]string) *ETJobBuilder

Labels is used to add labels for job

func (*ETJobBuilder) LogDir

func (b *ETJobBuilder) LogDir(dir string) *ETJobBuilder

LogDir is used to set log directory,match option --logdir

func (*ETJobBuilder) MaxWorkers

func (b *ETJobBuilder) MaxWorkers(count int) *ETJobBuilder

MaxWorkers assign max workers,match option --max-workers

func (*ETJobBuilder) Memory

func (b *ETJobBuilder) Memory(memory string) *ETJobBuilder

Memory assign memory limits,match option --memory

func (*ETJobBuilder) MinWorkers

func (b *ETJobBuilder) MinWorkers(count int) *ETJobBuilder

MinWorkers assign min workers,match option --min-workers

func (*ETJobBuilder) Name

func (b *ETJobBuilder) Name(name string) *ETJobBuilder

Name is used to set job name,match option --name

func (*ETJobBuilder) NodeSelectors

func (b *ETJobBuilder) NodeSelectors(selectors map[string]string) *ETJobBuilder

NodeSelectors is used to set node selectors for scheduling job,match option --selector

func (*ETJobBuilder) Priority

func (b *ETJobBuilder) Priority(priority string) *ETJobBuilder

Priority sets the priority

func (*ETJobBuilder) Shell added in v0.8.9

func (b *ETJobBuilder) Shell(shell string) *ETJobBuilder

Shell is used to set bash or sh

func (*ETJobBuilder) SyncImage

func (b *ETJobBuilder) SyncImage(image string) *ETJobBuilder

SyncImage is used to set syncing image,match option --sync-image

func (*ETJobBuilder) SyncMode

func (b *ETJobBuilder) SyncMode(mode string) *ETJobBuilder

SyncMode is used to set syncing mode,match option --sync-mode

func (*ETJobBuilder) SyncSource

func (b *ETJobBuilder) SyncSource(source string) *ETJobBuilder

SyncSource is used to set syncing source,match option --sync-source

func (*ETJobBuilder) TensorboardImage

func (b *ETJobBuilder) TensorboardImage(image string) *ETJobBuilder

TensorboardImage is used to set the tensorboard image

func (*ETJobBuilder) Tolerations

func (b *ETJobBuilder) Tolerations(tolerations []string) *ETJobBuilder

Tolerations is used to set the node tolerations of the job; matches option --toleration

func (*ETJobBuilder) WorkerCount

func (b *ETJobBuilder) WorkerCount(count int) *ETJobBuilder

WorkerCount is used to set count of worker

func (*ETJobBuilder) WorkingDir

func (b *ETJobBuilder) WorkingDir(dir string) *ETJobBuilder

WorkingDir is used to set the working directory of job containers (default is '/root'); matches option --working-dir

type HorovodJobBuilder

type HorovodJobBuilder struct {
	argsbuilder.ArgsBuilder
	// contains filtered or unexported fields
}

func NewHorovodJobBuilder

func NewHorovodJobBuilder() *HorovodJobBuilder

func (*HorovodJobBuilder) Annotations

func (b *HorovodJobBuilder) Annotations(annotations map[string]string) *HorovodJobBuilder

Annotations is used to add annotations for job pods,match option --annotation

func (*HorovodJobBuilder) Build

func (b *HorovodJobBuilder) Build() (*Job, error)

Build is used to build the job

func (*HorovodJobBuilder) CPU

CPU assigns CPU limits; matches option --cpu

func (*HorovodJobBuilder) Command

func (b *HorovodJobBuilder) Command(args []string) *HorovodJobBuilder

Command is used to set job command

func (*HorovodJobBuilder) ConfigFiles

func (b *HorovodJobBuilder) ConfigFiles(files map[string]string) *HorovodJobBuilder

ConfigFiles is used to map config files from local to job containers; matches option --config-file

func (*HorovodJobBuilder) DataDirs

func (b *HorovodJobBuilder) DataDirs(volumes map[string]string) *HorovodJobBuilder

DataDirs is used to mount host files to job containers,match option --data-dir

func (*HorovodJobBuilder) Datas

func (b *HorovodJobBuilder) Datas(volumes map[string]string) *HorovodJobBuilder

Datas is used to mount k8s pvc to job pods,match option --data

func (*HorovodJobBuilder) EnableRDMA

func (b *HorovodJobBuilder) EnableRDMA() *HorovodJobBuilder

EnableRDMA is used to enable RDMA; matches option --rdma

func (*HorovodJobBuilder) EnableTensorboard

func (b *HorovodJobBuilder) EnableTensorboard() *HorovodJobBuilder

EnableTensorboard is used to enable tensorboard

func (*HorovodJobBuilder) Envs

func (b *HorovodJobBuilder) Envs(envs map[string]string) *HorovodJobBuilder

Envs is used to set env of job containers,match option --env

func (*HorovodJobBuilder) GPUCount

func (b *HorovodJobBuilder) GPUCount(count int) *HorovodJobBuilder

GPUCount is used to set count of gpu for the job,match the option --gpus

func (*HorovodJobBuilder) Image

func (b *HorovodJobBuilder) Image(image string) *HorovodJobBuilder

Image is used to set job image,match the option --image

func (*HorovodJobBuilder) ImagePullSecrets

func (b *HorovodJobBuilder) ImagePullSecrets(secrets []string) *HorovodJobBuilder

ImagePullSecrets is used to set image pull secrets; matches option --image-pull-secret

func (*HorovodJobBuilder) LogDir

func (b *HorovodJobBuilder) LogDir(dir string) *HorovodJobBuilder

LogDir is used to set log directory,match option --logdir

func (*HorovodJobBuilder) Memory

func (b *HorovodJobBuilder) Memory(memory string) *HorovodJobBuilder

Memory assign memory limits,match option --memory

func (*HorovodJobBuilder) Name

Name is used to set job name,match option --name

func (*HorovodJobBuilder) NodeSelectors

func (b *HorovodJobBuilder) NodeSelectors(selectors map[string]string) *HorovodJobBuilder

NodeSelectors is used to set node selectors for scheduling job,match option --selector

func (*HorovodJobBuilder) Priority

func (b *HorovodJobBuilder) Priority(priority string) *HorovodJobBuilder

Priority sets the priority

func (*HorovodJobBuilder) SSHPort

func (b *HorovodJobBuilder) SSHPort(port int) *HorovodJobBuilder

SSHPort set the ssh port,match option --ssh-port

func (*HorovodJobBuilder) Shell added in v0.8.9

func (b *HorovodJobBuilder) Shell(shell string) *HorovodJobBuilder

Shell is used to set bash or sh

func (*HorovodJobBuilder) SyncImage

func (b *HorovodJobBuilder) SyncImage(image string) *HorovodJobBuilder

SyncImage is used to set syncing image,match option --sync-image

func (*HorovodJobBuilder) SyncMode

func (b *HorovodJobBuilder) SyncMode(mode string) *HorovodJobBuilder

SyncMode is used to set syncing mode,match option --sync-mode

func (*HorovodJobBuilder) SyncSource

func (b *HorovodJobBuilder) SyncSource(source string) *HorovodJobBuilder

SyncSource is used to set syncing source,match option --sync-source

func (*HorovodJobBuilder) TensorboardImage

func (b *HorovodJobBuilder) TensorboardImage(image string) *HorovodJobBuilder

TensorboardImage is used to set the tensorboard image

func (*HorovodJobBuilder) Tolerations

func (b *HorovodJobBuilder) Tolerations(tolerations []string) *HorovodJobBuilder

Tolerations is used to set the node tolerations of the job; matches option --toleration

func (*HorovodJobBuilder) WorkerCount

func (b *HorovodJobBuilder) WorkerCount(count int) *HorovodJobBuilder

WorkerCount is used to set count of worker

func (*HorovodJobBuilder) WorkingDir

func (b *HorovodJobBuilder) WorkingDir(dir string) *HorovodJobBuilder

WorkingDir is used to set the working directory of job containers (default is '/root'); matches option --working-dir

type Job

type Job struct {
	// contains filtered or unexported fields
}

Job defines the base job

func NewJob

func NewJob(name string, jobType types.TrainingJobType, args interface{}) *Job

func (*Job) Args

func (b *Job) Args() interface{}

func (*Job) Name

func (b *Job) Name() string

func (*Job) Type

func (j *Job) Type() types.TrainingJobType

type MPIJobBuilder

type MPIJobBuilder struct {
	argsbuilder.ArgsBuilder
	// contains filtered or unexported fields
}

func NewMPIJobBuilder

func NewMPIJobBuilder() *MPIJobBuilder

func (*MPIJobBuilder) Annotations

func (b *MPIJobBuilder) Annotations(annotations map[string]string) *MPIJobBuilder

Annotations is used to add annotations for job pods,match option --annotation

func (*MPIJobBuilder) Build

func (b *MPIJobBuilder) Build() (*Job, error)

Build is used to build the job

func (*MPIJobBuilder) CPU

func (b *MPIJobBuilder) CPU(cpu string) *MPIJobBuilder

CPU assigns CPU limits; matches option --cpu

func (*MPIJobBuilder) CleanPodPolicy added in v0.9.0

func (b *MPIJobBuilder) CleanPodPolicy(policy string) *MPIJobBuilder

CleanPodPolicy is used to set cleaning pod policy,match option --clean-task-policy

func (*MPIJobBuilder) Command

func (b *MPIJobBuilder) Command(args []string) *MPIJobBuilder

Command is used to set job command

func (*MPIJobBuilder) ConfigFiles

func (b *MPIJobBuilder) ConfigFiles(files map[string]string) *MPIJobBuilder

ConfigFiles is used to map config files from local to job containers; matches option --config-file

func (*MPIJobBuilder) DataDirs

func (b *MPIJobBuilder) DataDirs(volumes map[string]string) *MPIJobBuilder

DataDirs is used to mount host files to job containers,match option --data-dir

func (*MPIJobBuilder) Datas

func (b *MPIJobBuilder) Datas(volumes map[string]string) *MPIJobBuilder

Datas is used to mount k8s pvc to job pods,match option --data

func (*MPIJobBuilder) EnableGPUTopology added in v0.8.1

func (b *MPIJobBuilder) EnableGPUTopology() *MPIJobBuilder

EnableGPUTopology is used to enable gpu topology scheduling

func (*MPIJobBuilder) EnableMountPVCOnLauncher added in v0.8.8

func (b *MPIJobBuilder) EnableMountPVCOnLauncher() *MPIJobBuilder

EnableMountPVCOnLauncher is used to enable mount pvcs on launcher

func (*MPIJobBuilder) EnableRDMA

func (b *MPIJobBuilder) EnableRDMA() *MPIJobBuilder

EnableRDMA is used to enable RDMA; matches option --rdma

func (*MPIJobBuilder) EnableTensorboard

func (b *MPIJobBuilder) EnableTensorboard() *MPIJobBuilder

EnableTensorboard is used to enable tensorboard

func (*MPIJobBuilder) Envs

func (b *MPIJobBuilder) Envs(envs map[string]string) *MPIJobBuilder

Envs is used to set env of job containers,match option --env

func (*MPIJobBuilder) GPUCount

func (b *MPIJobBuilder) GPUCount(count int) *MPIJobBuilder

GPUCount is used to set count of gpu for the job,match the option --gpus

func (*MPIJobBuilder) Image

func (b *MPIJobBuilder) Image(image string) *MPIJobBuilder

Image is used to set job image,match the option --image

func (*MPIJobBuilder) ImagePullSecrets

func (b *MPIJobBuilder) ImagePullSecrets(secrets []string) *MPIJobBuilder

ImagePullSecrets is used to set image pull secrets; matches option --image-pull-secret

func (*MPIJobBuilder) Labels added in v0.8.7

func (b *MPIJobBuilder) Labels(labels map[string]string) *MPIJobBuilder

Labels is used to add labels for job

func (*MPIJobBuilder) LogDir

func (b *MPIJobBuilder) LogDir(dir string) *MPIJobBuilder

LogDir is used to set log directory,match option --logdir

func (*MPIJobBuilder) Memory

func (b *MPIJobBuilder) Memory(memory string) *MPIJobBuilder

Memory assign memory limits,match option --memory

func (*MPIJobBuilder) Name

func (b *MPIJobBuilder) Name(name string) *MPIJobBuilder

Name is used to set job name,match option --name

func (*MPIJobBuilder) NodeSelectors

func (b *MPIJobBuilder) NodeSelectors(selectors map[string]string) *MPIJobBuilder

NodeSelectors is used to set node selectors for scheduling job,match option --selector

func (*MPIJobBuilder) Priority

func (b *MPIJobBuilder) Priority(priority string) *MPIJobBuilder

Priority sets the priority

func (*MPIJobBuilder) Shell added in v0.8.9

func (b *MPIJobBuilder) Shell(shell string) *MPIJobBuilder

Shell is used to set bash or sh

func (*MPIJobBuilder) SyncImage

func (b *MPIJobBuilder) SyncImage(image string) *MPIJobBuilder

SyncImage is used to set syncing image,match option --sync-image

func (*MPIJobBuilder) SyncMode

func (b *MPIJobBuilder) SyncMode(mode string) *MPIJobBuilder

SyncMode is used to set syncing mode,match option --sync-mode

func (*MPIJobBuilder) SyncSource

func (b *MPIJobBuilder) SyncSource(source string) *MPIJobBuilder

SyncSource is used to set syncing source,match option --sync-source

func (*MPIJobBuilder) TensorboardImage

func (b *MPIJobBuilder) TensorboardImage(image string) *MPIJobBuilder

TensorboardImage is used to set the tensorboard image

func (*MPIJobBuilder) Tolerations

func (b *MPIJobBuilder) Tolerations(tolerations []string) *MPIJobBuilder

Tolerations is used to set the node tolerations of the job; matches option --toleration

func (*MPIJobBuilder) WorkerCount

func (b *MPIJobBuilder) WorkerCount(count int) *MPIJobBuilder

WorkerCount is used to set count of worker

func (*MPIJobBuilder) WorkingDir

func (b *MPIJobBuilder) WorkingDir(dir string) *MPIJobBuilder

WorkingDir is used to set the working directory of job containers (default is '/root'); matches option --working-dir

type PytorchJobBuilder

type PytorchJobBuilder struct {
	argsbuilder.ArgsBuilder
	// contains filtered or unexported fields
}

func NewPytorchJobBuilder

func NewPytorchJobBuilder() *PytorchJobBuilder

func (*PytorchJobBuilder) ActiveDeadlineSeconds added in v0.9.9

func (b *PytorchJobBuilder) ActiveDeadlineSeconds(act int64) *PytorchJobBuilder

ActiveDeadlineSeconds match option --running-timeout

func (*PytorchJobBuilder) Annotations

func (b *PytorchJobBuilder) Annotations(annotations map[string]string) *PytorchJobBuilder

Annotations is used to add annotations for job pods,match option --annotation

func (*PytorchJobBuilder) Build

func (b *PytorchJobBuilder) Build() (*Job, error)

Build is used to build the job

func (*PytorchJobBuilder) CPU added in v0.8.0

CPU assigns CPU limits; matches option --cpu

func (*PytorchJobBuilder) CleanPodPolicy

func (b *PytorchJobBuilder) CleanPodPolicy(policy string) *PytorchJobBuilder

CleanPodPolicy is used to set cleaning pod policy,match option --clean-task-policy

func (*PytorchJobBuilder) Command

func (b *PytorchJobBuilder) Command(args []string) *PytorchJobBuilder

Command is used to set job command

func (*PytorchJobBuilder) ConfigFiles

func (b *PytorchJobBuilder) ConfigFiles(files map[string]string) *PytorchJobBuilder

ConfigFiles is used to map config files from local to job containers; matches option --config-file

func (*PytorchJobBuilder) DataDirs

func (b *PytorchJobBuilder) DataDirs(volumes map[string]string) *PytorchJobBuilder

DataDirs is used to mount host files to job containers,match option --data-dir

func (*PytorchJobBuilder) Datas

func (b *PytorchJobBuilder) Datas(volumes map[string]string) *PytorchJobBuilder

Datas is used to mount k8s pvc to job pods,match option --data

func (*PytorchJobBuilder) EnableRDMA

func (b *PytorchJobBuilder) EnableRDMA() *PytorchJobBuilder

EnableRDMA is used to enable RDMA; matches option --rdma

func (*PytorchJobBuilder) EnableTensorboard

func (b *PytorchJobBuilder) EnableTensorboard() *PytorchJobBuilder

EnableTensorboard is used to enable tensorboard

func (*PytorchJobBuilder) Envs

func (b *PytorchJobBuilder) Envs(envs map[string]string) *PytorchJobBuilder

Envs is used to set env of job containers,match option --env

func (*PytorchJobBuilder) GPUCount

func (b *PytorchJobBuilder) GPUCount(count int) *PytorchJobBuilder

GPUCount is used to set count of gpu for the job,match the option --gpus

func (*PytorchJobBuilder) Image

func (b *PytorchJobBuilder) Image(image string) *PytorchJobBuilder

Image is used to set job image,match the option --image

func (*PytorchJobBuilder) ImagePullSecrets

func (b *PytorchJobBuilder) ImagePullSecrets(secrets []string) *PytorchJobBuilder

ImagePullSecrets is used to set image pull secrets; matches option --image-pull-secret

func (*PytorchJobBuilder) Labels added in v0.8.7

func (b *PytorchJobBuilder) Labels(labels map[string]string) *PytorchJobBuilder

Labels is used to add labels for job

func (*PytorchJobBuilder) LogDir

func (b *PytorchJobBuilder) LogDir(dir string) *PytorchJobBuilder

LogDir is used to set log directory,match option --logdir

func (*PytorchJobBuilder) Memory added in v0.8.0

func (b *PytorchJobBuilder) Memory(memory string) *PytorchJobBuilder

Memory assign memory limits,match option --memory

func (*PytorchJobBuilder) Name

Name is used to set job name,match option --name

func (*PytorchJobBuilder) NodeSelectors

func (b *PytorchJobBuilder) NodeSelectors(selectors map[string]string) *PytorchJobBuilder

NodeSelectors is used to set node selectors for scheduling job,match option --selector

func (*PytorchJobBuilder) Priority

func (b *PytorchJobBuilder) Priority(priority string) *PytorchJobBuilder

Priority sets the priority

func (*PytorchJobBuilder) Shell added in v0.8.9

func (b *PytorchJobBuilder) Shell(shell string) *PytorchJobBuilder

Shell is used to set bash or sh

func (*PytorchJobBuilder) SyncImage

func (b *PytorchJobBuilder) SyncImage(image string) *PytorchJobBuilder

SyncImage is used to set syncing image,match option --sync-image

func (*PytorchJobBuilder) SyncMode

func (b *PytorchJobBuilder) SyncMode(mode string) *PytorchJobBuilder

SyncMode is used to set syncing mode,match option --sync-mode

func (*PytorchJobBuilder) SyncSource

func (b *PytorchJobBuilder) SyncSource(source string) *PytorchJobBuilder

SyncSource is used to set syncing source,match option --sync-source

func (*PytorchJobBuilder) TTLSecondsAfterFinished added in v0.9.7

func (b *PytorchJobBuilder) TTLSecondsAfterFinished(ttl int32) *PytorchJobBuilder

TTLSecondsAfterFinished match option --ttl-after-finished

func (*PytorchJobBuilder) TensorboardImage

func (b *PytorchJobBuilder) TensorboardImage(image string) *PytorchJobBuilder

TensorboardImage is used to set the tensorboard image

func (*PytorchJobBuilder) Tolerations

func (b *PytorchJobBuilder) Tolerations(tolerations []string) *PytorchJobBuilder

Tolerations is used to set the node tolerations of the job; matches option --toleration

func (*PytorchJobBuilder) WorkerCount

func (b *PytorchJobBuilder) WorkerCount(count int) *PytorchJobBuilder

WorkerCount is used to set count of worker

func (*PytorchJobBuilder) WorkingDir

func (b *PytorchJobBuilder) WorkingDir(dir string) *PytorchJobBuilder

WorkingDir is used to set the working directory of job containers (default is '/root'); matches option --working-dir

type ScaleInETJobBuilder

type ScaleInETJobBuilder struct {
	argsbuilder.ArgsBuilder
	// contains filtered or unexported fields
}

func NewScaleInETJobBuilder

func NewScaleInETJobBuilder() *ScaleInETJobBuilder

func (*ScaleInETJobBuilder) Build

func (b *ScaleInETJobBuilder) Build() (*Job, error)

Build is used to build the job

func (*ScaleInETJobBuilder) Count

func (b *ScaleInETJobBuilder) Count(count int) *ScaleInETJobBuilder

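Count is used to set the count (presumably the number of workers to scale in; confirm against the implementation). Note: the published comment reads "Retry is used to set retry times", which appears to have been copied from Retry.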

func (*ScaleInETJobBuilder) Envs

Envs is used to set envs

func (*ScaleInETJobBuilder) Name

Name is used to set job name,match option --name

func (*ScaleInETJobBuilder) Retry

func (b *ScaleInETJobBuilder) Retry(count int) *ScaleInETJobBuilder

Retry is used to set retry times

func (*ScaleInETJobBuilder) Script

Script is used to set scale script

func (*ScaleInETJobBuilder) Timeout

Timeout is used to set timeout seconds

type ScaleOutETJobBuilder

type ScaleOutETJobBuilder struct {
	argsbuilder.ArgsBuilder
	// contains filtered or unexported fields
}

func NewScaleOutETJobBuilder

func NewScaleOutETJobBuilder() *ScaleOutETJobBuilder

func (*ScaleOutETJobBuilder) Build

func (b *ScaleOutETJobBuilder) Build() (*Job, error)

Build is used to build the job

func (*ScaleOutETJobBuilder) Count

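Count is used to set the count (presumably the number of workers to scale out; confirm against the implementation). Note: the published comment reads "Retry is used to set retry times", which appears to have been copied from Retry.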

func (*ScaleOutETJobBuilder) Envs

Envs is used to set envs

func (*ScaleOutETJobBuilder) Name

Name is used to set job name,match option --name

func (*ScaleOutETJobBuilder) Retry

Retry is used to set retry times

func (*ScaleOutETJobBuilder) Script

Script is used to set scale script

func (*ScaleOutETJobBuilder) Timeout

Timeout is used to set timeout seconds

type SparkJobBuilder

type SparkJobBuilder struct {
	argsbuilder.ArgsBuilder
	// contains filtered or unexported fields
}

func NewSparkJobBuilder

func NewSparkJobBuilder() *SparkJobBuilder

func (*SparkJobBuilder) Annotations added in v0.8.7

func (b *SparkJobBuilder) Annotations(annotations map[string]string) *SparkJobBuilder

func (*SparkJobBuilder) Build

func (b *SparkJobBuilder) Build() (*Job, error)

Build is used to build the job

func (*SparkJobBuilder) DriverCPURequest

func (b *SparkJobBuilder) DriverCPURequest(request int) *SparkJobBuilder

func (*SparkJobBuilder) DriverMemoryRequest

func (b *SparkJobBuilder) DriverMemoryRequest(memory string) *SparkJobBuilder

func (*SparkJobBuilder) ExecutorCPURequest

func (b *SparkJobBuilder) ExecutorCPURequest(request int) *SparkJobBuilder

func (*SparkJobBuilder) ExecutorMemoryRequest

func (b *SparkJobBuilder) ExecutorMemoryRequest(memory string) *SparkJobBuilder

func (*SparkJobBuilder) ExecutorReplicas

func (b *SparkJobBuilder) ExecutorReplicas(replicas int) *SparkJobBuilder

func (*SparkJobBuilder) Image

func (b *SparkJobBuilder) Image(image string) *SparkJobBuilder

func (*SparkJobBuilder) Jar

func (b *SparkJobBuilder) Jar(jar string) *SparkJobBuilder

func (*SparkJobBuilder) Labels added in v0.8.7

func (b *SparkJobBuilder) Labels(labels map[string]string) *SparkJobBuilder

func (*SparkJobBuilder) MainClass

func (b *SparkJobBuilder) MainClass(mainClass string) *SparkJobBuilder

func (*SparkJobBuilder) Name

func (b *SparkJobBuilder) Name(name string) *SparkJobBuilder

Name is used to set job name,match option --name

type TFJobBuilder

type TFJobBuilder struct {
	argsbuilder.ArgsBuilder
	// contains filtered or unexported fields
}

func NewTFJobBuilder

func NewTFJobBuilder(args *types.SubmitTFJobArgs) *TFJobBuilder

func (*TFJobBuilder) ActiveDeadlineSeconds added in v0.9.9

func (b *TFJobBuilder) ActiveDeadlineSeconds(act int64) *TFJobBuilder

func (*TFJobBuilder) Annotations

func (b *TFJobBuilder) Annotations(annotations map[string]string) *TFJobBuilder

func (*TFJobBuilder) Build

func (b *TFJobBuilder) Build() (*Job, error)

func (*TFJobBuilder) ChiefCPU

func (b *TFJobBuilder) ChiefCPU(cpu string) *TFJobBuilder

func (*TFJobBuilder) ChiefCPULimit added in v0.9.1

func (b *TFJobBuilder) ChiefCPULimit(cpu string) *TFJobBuilder

func (*TFJobBuilder) ChiefMemory

func (b *TFJobBuilder) ChiefMemory(mem string) *TFJobBuilder

func (*TFJobBuilder) ChiefMemoryLimit added in v0.9.1

func (b *TFJobBuilder) ChiefMemoryLimit(mem string) *TFJobBuilder

func (*TFJobBuilder) ChiefPort

func (b *TFJobBuilder) ChiefPort(port int) *TFJobBuilder

func (*TFJobBuilder) ChiefSelectors

func (b *TFJobBuilder) ChiefSelectors(selectors map[string]string) *TFJobBuilder

func (*TFJobBuilder) CleanPodPolicy

func (b *TFJobBuilder) CleanPodPolicy(policy string) *TFJobBuilder

func (*TFJobBuilder) Command

func (b *TFJobBuilder) Command(args []string) *TFJobBuilder

func (*TFJobBuilder) ConfigFiles

func (b *TFJobBuilder) ConfigFiles(files map[string]string) *TFJobBuilder

func (*TFJobBuilder) DataDirs

func (b *TFJobBuilder) DataDirs(volumes map[string]string) *TFJobBuilder

func (*TFJobBuilder) Datas

func (b *TFJobBuilder) Datas(volumes map[string]string) *TFJobBuilder

func (*TFJobBuilder) EnableChief

func (b *TFJobBuilder) EnableChief() *TFJobBuilder

func (*TFJobBuilder) EnableEvaluator

func (b *TFJobBuilder) EnableEvaluator() *TFJobBuilder

func (*TFJobBuilder) EnableRDMA

func (b *TFJobBuilder) EnableRDMA() *TFJobBuilder

func (*TFJobBuilder) EnableTensorboard

func (b *TFJobBuilder) EnableTensorboard() *TFJobBuilder

func (*TFJobBuilder) Envs

func (b *TFJobBuilder) Envs(envs map[string]string) *TFJobBuilder

func (*TFJobBuilder) EvaluatorCPU

func (b *TFJobBuilder) EvaluatorCPU(cpu string) *TFJobBuilder

func (*TFJobBuilder) EvaluatorCPULimit added in v0.9.1

func (b *TFJobBuilder) EvaluatorCPULimit(cpu string) *TFJobBuilder

func (*TFJobBuilder) EvaluatorMemory

func (b *TFJobBuilder) EvaluatorMemory(mem string) *TFJobBuilder

func (*TFJobBuilder) EvaluatorMemoryLimit added in v0.9.1

func (b *TFJobBuilder) EvaluatorMemoryLimit(mem string) *TFJobBuilder

func (*TFJobBuilder) EvaluatorSelectors

func (b *TFJobBuilder) EvaluatorSelectors(selectors map[string]string) *TFJobBuilder

func (*TFJobBuilder) GPUCount

func (b *TFJobBuilder) GPUCount(count int) *TFJobBuilder

func (*TFJobBuilder) GetArgValues added in v0.8.4

func (b *TFJobBuilder) GetArgValues() map[string]interface{}

func (*TFJobBuilder) Image

func (b *TFJobBuilder) Image(image string) *TFJobBuilder

func (*TFJobBuilder) ImagePullSecrets

func (b *TFJobBuilder) ImagePullSecrets(secrets []string) *TFJobBuilder

func (*TFJobBuilder) Labels added in v0.8.7

func (b *TFJobBuilder) Labels(labels map[string]string) *TFJobBuilder

func (*TFJobBuilder) LogDir

func (b *TFJobBuilder) LogDir(dir string) *TFJobBuilder

func (*TFJobBuilder) Name

func (b *TFJobBuilder) Name(name string) *TFJobBuilder

func (*TFJobBuilder) NodeSelectors

func (b *TFJobBuilder) NodeSelectors(selectors map[string]string) *TFJobBuilder

func (*TFJobBuilder) Priority

func (b *TFJobBuilder) Priority(priority string) *TFJobBuilder

func (*TFJobBuilder) PsCPU

func (b *TFJobBuilder) PsCPU(cpu string) *TFJobBuilder

func (*TFJobBuilder) PsCPULimit added in v0.9.1

func (b *TFJobBuilder) PsCPULimit(cpu string) *TFJobBuilder

func (*TFJobBuilder) PsCount

func (b *TFJobBuilder) PsCount(count int) *TFJobBuilder

func (*TFJobBuilder) PsGPU added in v0.8.6

func (b *TFJobBuilder) PsGPU(gpu int) *TFJobBuilder

func (*TFJobBuilder) PsImage

func (b *TFJobBuilder) PsImage(image string) *TFJobBuilder

func (*TFJobBuilder) PsMemory

func (b *TFJobBuilder) PsMemory(mem string) *TFJobBuilder

func (*TFJobBuilder) PsMemoryLimit added in v0.9.1

func (b *TFJobBuilder) PsMemoryLimit(mem string) *TFJobBuilder

func (*TFJobBuilder) PsPort

func (b *TFJobBuilder) PsPort(port int) *TFJobBuilder

func (*TFJobBuilder) PsSelectors

func (b *TFJobBuilder) PsSelectors(selectors map[string]string) *TFJobBuilder

func (*TFJobBuilder) RoleSequence added in v0.8.0

func (b *TFJobBuilder) RoleSequence(roles []string) *TFJobBuilder

func (*TFJobBuilder) Shell added in v0.8.9

func (b *TFJobBuilder) Shell(shell string) *TFJobBuilder

Shell is used to set the shell, either bash or sh

func (*TFJobBuilder) SyncImage

func (b *TFJobBuilder) SyncImage(image string) *TFJobBuilder

func (*TFJobBuilder) SyncMode

func (b *TFJobBuilder) SyncMode(mode string) *TFJobBuilder

func (*TFJobBuilder) SyncSource

func (b *TFJobBuilder) SyncSource(source string) *TFJobBuilder

func (*TFJobBuilder) TTLSecondsAfterFinished added in v0.9.7

func (b *TFJobBuilder) TTLSecondsAfterFinished(ttl int32) *TFJobBuilder

func (*TFJobBuilder) TensorboardImage

func (b *TFJobBuilder) TensorboardImage(image string) *TFJobBuilder

func (*TFJobBuilder) Tolerations

func (b *TFJobBuilder) Tolerations(tolerations []string) *TFJobBuilder

func (*TFJobBuilder) WorkerCPU

func (b *TFJobBuilder) WorkerCPU(cpu string) *TFJobBuilder

func (*TFJobBuilder) WorkerCPULimit added in v0.9.1

func (b *TFJobBuilder) WorkerCPULimit(cpu string) *TFJobBuilder

func (*TFJobBuilder) WorkerCount

func (b *TFJobBuilder) WorkerCount(count int) *TFJobBuilder

func (*TFJobBuilder) WorkerImage

func (b *TFJobBuilder) WorkerImage(image string) *TFJobBuilder

func (*TFJobBuilder) WorkerMemory

func (b *TFJobBuilder) WorkerMemory(mem string) *TFJobBuilder

func (*TFJobBuilder) WorkerMemoryLimit added in v0.9.1

func (b *TFJobBuilder) WorkerMemoryLimit(mem string) *TFJobBuilder

func (*TFJobBuilder) WorkerPort

func (b *TFJobBuilder) WorkerPort(port int) *TFJobBuilder

func (*TFJobBuilder) WorkerSelectors

func (b *TFJobBuilder) WorkerSelectors(selectors map[string]string) *TFJobBuilder

func (*TFJobBuilder) WorkingDir

func (b *TFJobBuilder) WorkingDir(dir string) *TFJobBuilder

type VolcanoJobBuilder

type VolcanoJobBuilder struct {
	argsbuilder.ArgsBuilder
	// contains filtered or unexported fields
}

func NewVolcanoJobBuilder

func NewVolcanoJobBuilder() *VolcanoJobBuilder

func (*VolcanoJobBuilder) Annotations added in v0.8.7

func (b *VolcanoJobBuilder) Annotations(annotations map[string]string) *VolcanoJobBuilder

func (*VolcanoJobBuilder) Build

func (b *VolcanoJobBuilder) Build() (*Job, error)

Build is used to build the job

func (*VolcanoJobBuilder) Command

func (b *VolcanoJobBuilder) Command(args []string) *VolcanoJobBuilder

Command is used to set job command

func (*VolcanoJobBuilder) Labels added in v0.8.7

func (b *VolcanoJobBuilder) Labels(labels map[string]string) *VolcanoJobBuilder

func (*VolcanoJobBuilder) MinAvailable

func (b *VolcanoJobBuilder) MinAvailable(minAvailable int) *VolcanoJobBuilder

func (*VolcanoJobBuilder) Name

Name is used to set the job name; it matches option --name

func (*VolcanoJobBuilder) Queue

func (b *VolcanoJobBuilder) Queue(queue string) *VolcanoJobBuilder

func (*VolcanoJobBuilder) SchedulerName

func (b *VolcanoJobBuilder) SchedulerName(name string) *VolcanoJobBuilder

func (*VolcanoJobBuilder) TaskCPU

func (b *VolcanoJobBuilder) TaskCPU(cpu string) *VolcanoJobBuilder

func (*VolcanoJobBuilder) TaskImages

func (b *VolcanoJobBuilder) TaskImages(images []string) *VolcanoJobBuilder

func (*VolcanoJobBuilder) TaskMemory

func (b *VolcanoJobBuilder) TaskMemory(mem string) *VolcanoJobBuilder

func (*VolcanoJobBuilder) TaskName

func (b *VolcanoJobBuilder) TaskName(name string) *VolcanoJobBuilder

func (*VolcanoJobBuilder) TaskPort

func (b *VolcanoJobBuilder) TaskPort(port int) *VolcanoJobBuilder

func (*VolcanoJobBuilder) TaskReplicas

func (b *VolcanoJobBuilder) TaskReplicas(replicas int) *VolcanoJobBuilder

Jump to

Keyboard shortcuts

? : This menu
/ : Search site
f or F : Jump to
y or Y : Canonical URL