Documentation
¶
Index ¶
Constants ¶
View Source
const ( HPACPUDefaultAverageUtilization = 80 DefaultUserId = "default" DefaultOrgId = "default" DynamoServicePort = 8000 DynamoServicePortName = "http" DynamoContainerPortName = "http" DynamoPlannerMetricsPort = 9085 DynamoMetricsPortName = "metrics" DynamoSystemPort = 9090 DynamoSystemPortName = "system" MpiRunSshPort = 2222 EnvDynamoServicePort = "DYNAMO_PORT" KubeLabelDynamoSelector = "nvidia.com/selector" KubeAnnotationEnableGrove = "nvidia.com/enable-grove" KubeAnnotationDisableImagePullSecretDiscovery = "nvidia.com/disable-image-pull-secret-discovery" KubeLabelDynamoGraphDeploymentName = "nvidia.com/dynamo-graph-deployment-name" KubeLabelDynamoComponent = "nvidia.com/dynamo-component" KubeLabelDynamoNamespace = "nvidia.com/dynamo-namespace" KubeLabelDynamoDeploymentTargetType = "nvidia.com/dynamo-deployment-target-type" KubeLabelDynamoComponentType = "nvidia.com/dynamo-component-type" KubeLabelValueFalse = "false" KubeLabelValueTrue = "true" KubeLabelDynamoComponentPod = "nvidia.com/dynamo-component-pod" KubeResourceGPUNvidia = "nvidia.com/gpu" DynamoDeploymentConfigEnvVar = "DYN_DEPLOYMENT_CONFIG" ComponentTypePlanner = "planner" ComponentTypeFrontend = "frontend" ComponentTypeWorker = "worker" ComponentTypeDefault = "default" PlannerServiceAccountName = "planner-serviceaccount" DefaultIngressSuffix = "local" DefaultGroveTerminationDelay = 15 * time.Minute // Metrics related constants KubeAnnotationEnableMetrics = "nvidia.com/enable-metrics" // User-provided annotation to control metrics KubeLabelMetricsEnabled = "nvidia.com/metrics-enabled" // Controller-managed label for pod selection // Kai-scheduler related constants KubeAnnotationKaiSchedulerQueue = "nvidia.com/kai-scheduler-queue" // User-provided annotation to specify queue name KubeLabelKaiSchedulerQueue = "kai.scheduler/queue" // Label injected into pods for kai-scheduler KaiSchedulerName = "kai-scheduler" // Scheduler name for kai-scheduler DefaultKaiSchedulerQueue = "dynamo" // Default queue name when none specified // Grove multinode role suffixes GroveRoleSuffixLeader = "ldr" GroveRoleSuffixWorker = "wkr" )
Variables ¶
View Source
var ( // Grove GroupVersionResources for scaling operations PodCliqueGVR = schema.GroupVersionResource{ Group: "grove.io", Version: "v1alpha1", Resource: "podcliques", } PodCliqueScalingGroupGVR = schema.GroupVersionResource{ Group: "grove.io", Version: "v1alpha1", Resource: "podcliquescalinggroups", } // KAI-Scheduler GroupVersionResource for queue validation QueueGVR = schema.GroupVersionResource{ Group: "scheduling.run.ai", Version: "v2", Resource: "queues", } )
GroupVersionResources for external APIs
Functions ¶
This section is empty.
Types ¶
type MultinodeDeploymentType ¶
type MultinodeDeploymentType string
const ( MultinodeDeploymentTypeGrove MultinodeDeploymentType = "grove" MultinodeDeploymentTypeLWS MultinodeDeploymentType = "lws" )
Click to show internal directories.
Click to hide internal directories.