Documentation
¶
Index ¶
- Constants
- func ExtractEssentialJobMetadata(jobRun *executorapi.JobRunLease) (*job.RunMeta, error)
- type ClusterAllocationService
- type ClusterAllocator
- type IssueHandler
- type JobLeaseRequester
- type JobRequester
- type JobStateReporter
- type LeaseRequest
- type LeaseRequester
- type LeaseResponse
- type PodIssueHandler
- type ResourceCleanupService
Constants ¶
View Source
const (
	UnableToSchedule podIssueType = iota
	StuckStartingUp
	StuckTerminating
	ActiveDeadlineExceeded
	ExternallyDeleted
	ErrorDuringIssueHandling
	FailedStartingUp
)
Variables ¶
This section is empty.
Functions ¶
func ExtractEssentialJobMetadata ¶ added in v0.3.57
func ExtractEssentialJobMetadata(jobRun *executorapi.JobRunLease) (*job.RunMeta, error)
Types ¶
type ClusterAllocationService ¶
type ClusterAllocationService struct {
// contains filtered or unexported fields
}
func NewClusterAllocationService ¶
func NewClusterAllocationService( clusterId executorContext.ClusterIdentity, eventReporter reporter.EventReporter, jobRunStateManager job.RunStateStore, submitter job.Submitter, clusterHealthMonitor healthmonitor.HealthMonitor, ) *ClusterAllocationService
func (*ClusterAllocationService) AllocateSpareClusterCapacity ¶
func (allocationService *ClusterAllocationService) AllocateSpareClusterCapacity()
type ClusterAllocator ¶ added in v0.3.47
type ClusterAllocator interface {
AllocateSpareClusterCapacity()
}
type IssueHandler ¶ added in v0.3.77
type JobLeaseRequester ¶ added in v0.3.47
type JobLeaseRequester struct {
// contains filtered or unexported fields
}
func NewJobLeaseRequester ¶ added in v0.3.47
func NewJobLeaseRequester( executorApiClient executorapi.ExecutorApiClient, clusterIdentity clusterContext.ClusterIdentity, ) *JobLeaseRequester
func (*JobLeaseRequester) LeaseJobRuns ¶ added in v0.3.47
func (requester *JobLeaseRequester) LeaseJobRuns(ctx *armadacontext.Context, request *LeaseRequest) (*LeaseResponse, error)
type JobRequester ¶ added in v0.3.57
type JobRequester struct {
// contains filtered or unexported fields
}
func NewJobRequester ¶ added in v0.3.57
func NewJobRequester( clusterId executorContext.ClusterIdentity, eventReporter reporter.EventReporter, leaseRequester LeaseRequester, jobRunStateStore job.RunStateStore, utilisationService utilisation.UtilisationService, podDefaults *configuration.PodDefaults, maxLeasedJobs int, maxRequestDuration time.Duration, ) *JobRequester
func (*JobRequester) RequestJobsRuns ¶ added in v0.3.57
func (r *JobRequester) RequestJobsRuns()
type JobStateReporter ¶ added in v0.16.2
type JobStateReporter struct {
// contains filtered or unexported fields
}
func NewJobStateReporter ¶ added in v0.16.2
func NewJobStateReporter( clusterContext clusterContext.ClusterContext, eventReporter reporter.EventReporter, podIssueHandler IssueHandler, ) (*JobStateReporter, error)
func (*JobStateReporter) ReportMissingJobEvents ¶ added in v0.16.2
func (stateReporter *JobStateReporter) ReportMissingJobEvents()
type LeaseRequest ¶ added in v0.3.57
type LeaseRequest struct {
	AvailableResource   armadaresource.ComputeResources
	Nodes               []*executorapi.NodeInfo
	UnassignedJobRunIds []string
	MaxJobsToLease      uint32
}
type LeaseRequester ¶ added in v0.3.47
type LeaseRequester interface {
LeaseJobRuns(ctx *armadacontext.Context, request *LeaseRequest) (*LeaseResponse, error)
}
type LeaseResponse ¶ added in v0.3.57
type LeaseResponse struct {
	LeasedRuns      []*executorapi.JobRunLease
	RunIdsToCancel  []string
	RunIdsToPreempt []string
}
type PodIssueHandler ¶ added in v0.16.2
type PodIssueHandler struct {
// contains filtered or unexported fields
}
func NewPodIssuerHandler ¶ added in v0.16.2
func NewPodIssuerHandler( jobRunState job.RunStateStore, clusterContext executorContext.ClusterContext, eventReporter reporter.EventReporter, stateChecksConfig configuration.StateChecksConfiguration, pendingPodChecker podchecks.PodChecker, failedPodChecker failedpodchecks.RetryChecker, stuckTerminatingPodExpiry time.Duration, ) (*PodIssueHandler, error)
func (*PodIssueHandler) DetectAndRegisterFailedPodIssue ¶ added in v0.16.2
func (p *PodIssueHandler) DetectAndRegisterFailedPodIssue(pod *v1.Pod) (bool, error)
func (*PodIssueHandler) HandlePodIssues ¶ added in v0.16.2
func (p *PodIssueHandler) HandlePodIssues()
func (*PodIssueHandler) HasIssue ¶ added in v0.16.2
func (p *PodIssueHandler) HasIssue(runId string) bool
type ResourceCleanupService ¶
type ResourceCleanupService struct {
// contains filtered or unexported fields
}
func NewResourceCleanupService ¶
func NewResourceCleanupService( clusterContext clusterContext.ClusterContext, kubernetesConfiguration configuration.KubernetesConfiguration, ) (*ResourceCleanupService, error)
func (*ResourceCleanupService) CleanupResources ¶
func (r *ResourceCleanupService) CleanupResources()
CleanupResources
- This function finds and deletes old resources. It does this in two ways:
  - By deleting all expired terminated pods
  - By deleting non-expired terminated pods when the MaxTerminatedPods limit is exceeded
Click to show internal directories.
Click to hide internal directories.