You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
description: Whether automated GPU node failover should be enabled for this cluster. By default, it is disabled.
8510
+
# Boolean switch for workload-based auto-scaling; off unless set.
auto_scaled:
  description: >-
    Whether GPU cluster should be auto-scaled based on the workload.
    By default, it is not auto-scaled.
  default: false
  type: boolean
8514
+
# Upper bound on the GPU count that auto-scaling may reach.
auto_scale_max_gpus:
  description: >-
    Maximum number of GPUs to which the cluster can be auto-scaled up.
    This field is required if auto_scaled is true.
  format: uint32
  type: integer
8518
+
# Shared-memory size for Slurm clusters, expressed in GiB.
slurm_shm_size_gib:
  description: >-
    Shared memory size in GiB for Slurm cluster.
    This field is required if cluster_type is SLURM.
  type: integer
8521
+
# Identifier of the capacity pool backing the cluster (optional).
capacity_pool_id:
  description: >-
    ID of the capacity pool to use for the cluster. This field is optional
    and only applicable if the cluster is created from a capacity pool.
  type: string
8524
+
# Scheduled provisioning time, carried as a date-time string.
# NOTE(review): the description calls the field "required" for
# SCHEDULED_CAPACITY billing yet also defines behavior "if not provided" --
# confirm the intended contract with the API owners.
provision_at_ts:
  description: >-
    Provision timestamp of the cluster. This field is required for
    SCHEDULED_CAPACITY billing to specify the provision time for the
    cluster. If not provided, the cluster will be provisioned immediately.
  format: date-time
  type: string
8528
+
# Scheduled decommissioning time, carried as a date-time string.
decommission_at_ts:
  description: >-
    Decommission timestamp of the cluster. This field is required for
    SCHEDULED_CAPACITY billing to specify the decommission time for the
    cluster.
  format: date-time
  type: string
8532
+
# OIDC settings; the shape is defined by the GPUClusterOIDCConfig schema.
oidc_config:
  $ref: '#/components/schemas/GPUClusterOIDCConfig'
8534
+
# Boolean switch for installing the Traefik ingress controller; off unless set.
install_traefik:
  description: >-
    Whether to install Traefik ingress controller in the cluster.
    This field is only applicable for Kubernetes clusters and is false
    by default.
  default: false
  type: boolean
8538
+
# CUDA version, carried as a string.
cuda_version:
  description: 'CUDA version for this cluster. For example, 12.5'
  type: string
8541
+
# Nvidia driver version, carried as a string.
# Fix: the description read "Only some combination ... are supported";
# the noun now agrees with the plural verb ("combinations").
nvidia_driver_version:
  description: >-
    Nvidia driver version for this cluster. For example, 550.
    Only some combinations of cuda_version and nvidia_driver_version
    are supported.
  type: string
8544
+
# OIDC authentication settings for a GPU cluster.
# Every property below is a string; no property is marked required here.
GPUClusterOIDCConfig:
  type: object
  properties:
    # Issuer endpoint.
    issuer_url:
      description: >-
        OIDC issuer URL for authentication.
        For example, https://accounts.google.com
      type: string
    # Client identifier.
    client_id:
      description: OIDC client ID for authentication.
      type: string
    # Username mapping: which JWT claim to read, and the prefix to add.
    username_claim:
      description: >-
        JWT claim to use as the username. For example, 'sub' or 'email'
      type: string
    username_prefix:
      description: "Prefix to add to the username claim to form the final username. For example, 'oidc:'"
      type: string
    # Group mapping: which JWT claim to read, and the prefix to add.
    group_claim:
      description: >-
        JWT claim to use for user groups. For example, 'groups'
      type: string
    group_prefix:
      description: "Prefix to add to the group claim to form the final group name. For example, 'oidc:'"
      type: string
    # PEM-encoded CA certificate used to validate the issuer's TLS certificate.
    ca_cert:
      description: >-
        CA certificate in PEM format to validate the OIDC issuer's TLS
        certificate. This field is optional but recommended if the issuer
        uses a private CA or self-signed certificate.
      type: string
0 commit comments