Documentation ¶
Index ¶
Constants ¶
View Source
// Entity keys: one-letter identifiers naming the scope of entities to
// monitor. The comment on each constant states the scope it stands for.
const (
	FlexKey  = "f" // Monitor all GPUs if MIG is disabled or all GPU instances if MIG is enabled
	MajorKey = "g" // Monitor top-level entities: GPUs or NvSwitches or CPUs
	MinorKey = "i" // Monitor sub-level entities: GPU instances/NvLinks/CPUCores - GPUI cannot be specified if MIG is disabled
)
View Source
// CLI* constants hold the string names of the exporter's command-line
// options, one constant per option.
// NOTE(review): presumably these are passed as flag names when the CLI is
// built — confirm against the code that registers the flags.
const (
	CLIFieldsFile                 = "collectors"
	CLIAddress                    = "address"
	CLICollectInterval            = "collect-interval"
	CLIKubernetes                 = "kubernetes"
	CLIKubernetesGPUIDType        = "kubernetes-gpu-id-type"
	CLIUseOldNamespace            = "use-old-namespace"
	CLIRemoteHEInfo               = "remote-hostengine-info"
	CLIGPUDevices                 = "devices"
	CLISwitchDevices              = "switch-devices"
	CLICPUDevices                 = "cpu-devices"
	CLINoHostname                 = "no-hostname"
	CLIUseFakeGPUs                = "fake-gpus"
	CLIConfigMapData              = "configmap-data"
	CLIWebSystemdSocket           = "web-systemd-socket"
	CLIWebConfigFile              = "web-config-file"
	CLIXIDCountWindowSize         = "xid-count-window-size"
	CLIReplaceBlanksInModelName   = "replace-blanks-in-model-name"
	CLIDebugMode                  = "debug"
	CLIClockEventsCountWindowSize = "clock-events-count-window-size"
	CLIEnableDCGMLog              = "enable-dcgm-log"
	CLIDCGMLogLevel               = "dcgm-log-level"
	CLIPodResourcesKubeletSocket  = "pod-resources-kubelet-socket"
	CLIHPCJobMappingDir           = "hpc-job-mapping-dir"
	CLINvidiaResourceNames        = "nvidia-resource-names"
)
View Source
// DCGMDbgLvl* constants are the DCGM library debug levels, spelled as the
// upper-case strings shown here.
const (
	DCGMDbgLvlNone  = "NONE"
	DCGMDbgLvlFatal = "FATAL"
	DCGMDbgLvlError = "ERROR"
	DCGMDbgLvlWarn  = "WARN"
	DCGMDbgLvlInfo  = "INFO"
	DCGMDbgLvlDebug = "DEBUG"
	DCGMDbgLvlVerb  = "VERB"
)
The DCGMDbgLvl* constants above are the DCGM library debug levels.
Variables ¶
View Source
// DCGMDbgLvlValues lists the DCGM library debug level constants, ordered
// from DCGMDbgLvlNone through DCGMDbgLvlVerb.
var DCGMDbgLvlValues = []string{
	DCGMDbgLvlNone,
	DCGMDbgLvlFatal,
	DCGMDbgLvlError,
	DCGMDbgLvlWarn,
	DCGMDbgLvlInfo,
	DCGMDbgLvlDebug,
	DCGMDbgLvlVerb,
}
Functions ¶
Types ¶
This section is empty.
Click to show internal directories.
Click to hide internal directories.