From 7e87599a184604101b328cd7f06c53004dd5fbe1 Mon Sep 17 00:00:00 2001
From: codeflare-machine-account
Date: Mon, 13 May 2024 14:18:42 +0000
Subject: [PATCH] Changes in docs for release: v0.16.1

---
 .../cluster/cluster.html     | 158 +++++++++++-------
 .../cluster/config.html      |  82 ++++++---
 .../utils/generate_yaml.html |  72 +++++---
 .../utils/pretty_print.html  |   4 +-
 4 files changed, 212 insertions(+), 104 deletions(-)

diff --git a/docs/detailed-documentation/cluster/cluster.html b/docs/detailed-documentation/cluster/cluster.html
index eed1e1544..efb6ccfed 100644
--- a/docs/detailed-documentation/cluster/cluster.html
+++ b/docs/detailed-documentation/cluster/cluster.html
@@ -50,6 +50,7 @@

Module codeflare_sdk.cluster.cluster

 cluster setup queue, a list of all existing clusters, and the user's working namespace.
 """
+import re
 from time import sleep
 from typing import List, Optional, Tuple, Dict
@@ -73,11 +74,13 @@

Module codeflare_sdk.cluster.cluster

     RayClusterStatus,
 )
 from kubernetes import client, config
+from kubernetes.utils import parse_quantity
 import yaml
 import os
 import requests
 from kubernetes import config
+from kubernetes.client.rest import ApiException

 class Cluster:
@@ -216,6 +219,7 @@
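Note: the snippet below is an illustrative aside, not part of the patch. parse_quantity comes from the official kubernetes Python client and converts Kubernetes quantity strings (with suffixes such as Mi, G, or m for milli-CPU) into decimal.Decimal values, which is what makes it practical to keep CPU and memory as quantity strings rather than plain ints, as the later hunks do.

    from decimal import Decimal
    from kubernetes.utils import parse_quantity

    # Kubernetes quantities may use binary (Ki/Mi/Gi) or decimal (k/M/G) suffixes,
    # plus "m" for fractional CPU.
    print(parse_quantity("500Mi"))  # 524288000
    print(parse_quantity("2G"))     # 2000000000
    print(parse_quantity("250m"))   # 0.25
    assert parse_quantity("1Gi") == Decimal(1024**3)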

Module codeflare_sdk.cluster.cluster

         write_to_file = self.config.write_to_file
         verify_tls = self.config.verify_tls
         local_queue = self.config.local_queue
+        labels = self.config.labels
         return generate_appwrapper(
             name=name,
             namespace=namespace,
@@ -240,6 +244,7 @@

Module codeflare_sdk.cluster.cluster

             write_to_file=write_to_file,
             verify_tls=verify_tls,
             local_queue=local_queue,
+            labels=labels,
         )

     # creates a new cluster with the provided or default spec
@@ -248,6 +253,10 @@

Module codeflare_sdk.cluster.cluster

         Applies the AppWrapper yaml, pushing the resource request onto the MCAD queue.
         """
+
+        # check if RayCluster CustomResourceDefinition exists if not throw RuntimeError
+        self._throw_for_no_raycluster()
+
         namespace = self.config.namespace
         try:
@@ -278,12 +287,32 @@

Module codeflare_sdk.cluster.cluster

         except Exception as e:  # pragma: no cover
             return _kube_api_error_handling(e)

+    def _throw_for_no_raycluster(self):
+        api_instance = client.CustomObjectsApi(api_config_handler())
+        try:
+            api_instance.list_namespaced_custom_object(
+                group="ray.io",
+                version="v1",
+                namespace=self.config.namespace,
+                plural="rayclusters",
+            )
+        except ApiException as e:
+            if e.status == 404:
+                raise RuntimeError(
+                    "RayCluster CustomResourceDefinition unavailable contact your administrator."
+                )
+            else:
+                raise RuntimeError(
+                    "Failed to get RayCluster CustomResourceDefinition: " + str(e)
+                )
+
     def down(self):
         """
         Deletes the AppWrapper yaml, scaling-down and deleting all resources
         associated with the cluster.
         """
         namespace = self.config.namespace
+        self._throw_for_no_raycluster()
         try:
             config_check()
             api_instance = client.CustomObjectsApi(api_config_handler())
@@ -520,26 +549,18 @@
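Note: the sketch below is illustrative and not part of the patch; it assumes an authenticated Kubernetes or OpenShift context. It shows how the new guard surfaces to SDK users: up() and down() now fail fast with a RuntimeError when the rayclusters.ray.io CustomResourceDefinition is not installed.

    from codeflare_sdk.cluster.cluster import Cluster
    from codeflare_sdk.cluster.config import ClusterConfiguration

    cluster = Cluster(ClusterConfiguration(name="demo", namespace="default"))

    try:
        cluster.up()  # _throw_for_no_raycluster() runs before anything is created
    except RuntimeError as err:
        # Raised on HTTP 404 (CRD missing) or on any other failure listing rayclusters.
        print(f"Cannot bring the cluster up: {err}")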

Module codeflare_sdk.cluster.cluster

             namespace=rc["metadata"]["namespace"],
             machine_types=machine_types,
             num_workers=rc["spec"]["workerGroupSpecs"][0]["minReplicas"],
-            min_cpus=int(
-                rc["spec"]["workerGroupSpecs"][0]["template"]["spec"]["containers"][0][
-                    "resources"
-                ]["requests"]["cpu"]
-            ),
-            max_cpus=int(
-                rc["spec"]["workerGroupSpecs"][0]["template"]["spec"]["containers"][0][
-                    "resources"
-                ]["limits"]["cpu"]
-            ),
-            min_memory=int(
-                rc["spec"]["workerGroupSpecs"][0]["template"]["spec"]["containers"][0][
-                    "resources"
-                ]["requests"]["memory"][:-1]
-            ),
-            max_memory=int(
-                rc["spec"]["workerGroupSpecs"][0]["template"]["spec"]["containers"][0][
-                    "resources"
-                ]["limits"]["memory"][:-1]
-            ),
+            min_cpus=rc["spec"]["workerGroupSpecs"][0]["template"]["spec"][
+                "containers"
+            ][0]["resources"]["requests"]["cpu"],
+            max_cpus=rc["spec"]["workerGroupSpecs"][0]["template"]["spec"][
+                "containers"
+            ][0]["resources"]["limits"]["cpu"],
+            min_memory=rc["spec"]["workerGroupSpecs"][0]["template"]["spec"][
+                "containers"
+            ][0]["resources"]["requests"]["memory"],
+            max_memory=rc["spec"]["workerGroupSpecs"][0]["template"]["spec"][
+                "containers"
+            ][0]["resources"]["limits"]["memory"],
             num_gpus=int(
                 rc["spec"]["workerGroupSpecs"][0]["template"]["spec"]["containers"][0][
                     "resources"
@@ -1265,6 +1286,7 @@
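Note: with the int() casts removed, get_cluster() now reports whatever quantity strings the RayCluster spec contains (for example "500m" or "4Gi") instead of truncating them or failing on non-integer values. The snippet below is illustrative only; callers that need numbers can convert with parse_quantity.

    from kubernetes.utils import parse_quantity

    # Hypothetical values as they might appear in a RayCluster workerGroupSpec.
    requests = {"cpu": "500m", "memory": "4Gi"}

    min_cpus = requests["cpu"]        # kept as-is: "500m"
    min_memory = requests["memory"]   # kept as-is: "4Gi"

    # Convert only where a numeric value is actually required.
    print(parse_quantity(min_cpus))    # 0.5
    print(parse_quantity(min_memory))  # 4294967296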

Classes

write_to_file = self.config.write_to_file verify_tls = self.config.verify_tls local_queue = self.config.local_queue + labels = self.config.labels return generate_appwrapper( name=name, namespace=namespace, @@ -1289,6 +1311,7 @@

Classes

write_to_file=write_to_file, verify_tls=verify_tls, local_queue=local_queue, + labels=labels, ) # creates a new cluster with the provided or default spec @@ -1297,6 +1320,10 @@

Classes

Applies the AppWrapper yaml, pushing the resource request onto the MCAD queue. """ + + # check if RayCluster CustomResourceDefinition exists if not throw RuntimeError + self._throw_for_no_raycluster() + namespace = self.config.namespace try: @@ -1327,12 +1354,32 @@

Classes

except Exception as e: # pragma: no cover return _kube_api_error_handling(e) + def _throw_for_no_raycluster(self): + api_instance = client.CustomObjectsApi(api_config_handler()) + try: + api_instance.list_namespaced_custom_object( + group="ray.io", + version="v1", + namespace=self.config.namespace, + plural="rayclusters", + ) + except ApiException as e: + if e.status == 404: + raise RuntimeError( + "RayCluster CustomResourceDefinition unavailable contact your administrator." + ) + else: + raise RuntimeError( + "Failed to get RayCluster CustomResourceDefinition: " + str(e) + ) + def down(self): """ Deletes the AppWrapper yaml, scaling-down and deleting all resources associated with the cluster. """ namespace = self.config.namespace + self._throw_for_no_raycluster() try: config_check() api_instance = client.CustomObjectsApi(api_config_handler()) @@ -1569,26 +1616,18 @@

Classes

namespace=rc["metadata"]["namespace"], machine_types=machine_types, num_workers=rc["spec"]["workerGroupSpecs"][0]["minReplicas"], - min_cpus=int( - rc["spec"]["workerGroupSpecs"][0]["template"]["spec"]["containers"][0][ - "resources" - ]["requests"]["cpu"] - ), - max_cpus=int( - rc["spec"]["workerGroupSpecs"][0]["template"]["spec"]["containers"][0][ - "resources" - ]["limits"]["cpu"] - ), - min_memory=int( - rc["spec"]["workerGroupSpecs"][0]["template"]["spec"]["containers"][0][ - "resources" - ]["requests"]["memory"][:-1] - ), - max_memory=int( - rc["spec"]["workerGroupSpecs"][0]["template"]["spec"]["containers"][0][ - "resources" - ]["limits"]["memory"][:-1] - ), + min_cpus=rc["spec"]["workerGroupSpecs"][0]["template"]["spec"][ + "containers" + ][0]["resources"]["requests"]["cpu"], + max_cpus=rc["spec"]["workerGroupSpecs"][0]["template"]["spec"][ + "containers" + ][0]["resources"]["limits"]["cpu"], + min_memory=rc["spec"]["workerGroupSpecs"][0]["template"]["spec"][ + "containers" + ][0]["resources"]["requests"]["memory"], + max_memory=rc["spec"]["workerGroupSpecs"][0]["template"]["spec"][ + "containers" + ][0]["resources"]["limits"]["memory"], num_gpus=int( rc["spec"]["workerGroupSpecs"][0]["template"]["spec"]["containers"][0][ "resources" @@ -1811,6 +1850,7 @@

Methods

write_to_file = self.config.write_to_file verify_tls = self.config.verify_tls local_queue = self.config.local_queue + labels = self.config.labels return generate_appwrapper( name=name, namespace=namespace, @@ -1835,6 +1875,7 @@

Methods

write_to_file=write_to_file, verify_tls=verify_tls, local_queue=local_queue, + labels=labels, ) @@ -1870,6 +1911,7 @@

Methods

associated with the cluster. """ namespace = self.config.namespace + self._throw_for_no_raycluster() try: config_check() api_instance = client.CustomObjectsApi(api_config_handler()) @@ -1944,26 +1986,18 @@

Methods

namespace=rc["metadata"]["namespace"], machine_types=machine_types, num_workers=rc["spec"]["workerGroupSpecs"][0]["minReplicas"], - min_cpus=int( - rc["spec"]["workerGroupSpecs"][0]["template"]["spec"]["containers"][0][ - "resources" - ]["requests"]["cpu"] - ), - max_cpus=int( - rc["spec"]["workerGroupSpecs"][0]["template"]["spec"]["containers"][0][ - "resources" - ]["limits"]["cpu"] - ), - min_memory=int( - rc["spec"]["workerGroupSpecs"][0]["template"]["spec"]["containers"][0][ - "resources" - ]["requests"]["memory"][:-1] - ), - max_memory=int( - rc["spec"]["workerGroupSpecs"][0]["template"]["spec"]["containers"][0][ - "resources" - ]["limits"]["memory"][:-1] - ), + min_cpus=rc["spec"]["workerGroupSpecs"][0]["template"]["spec"][ + "containers" + ][0]["resources"]["requests"]["cpu"], + max_cpus=rc["spec"]["workerGroupSpecs"][0]["template"]["spec"][ + "containers" + ][0]["resources"]["limits"]["cpu"], + min_memory=rc["spec"]["workerGroupSpecs"][0]["template"]["spec"][ + "containers" + ][0]["resources"]["requests"]["memory"], + max_memory=rc["spec"]["workerGroupSpecs"][0]["template"]["spec"][ + "containers" + ][0]["resources"]["limits"]["memory"], num_gpus=int( rc["spec"]["workerGroupSpecs"][0]["template"]["spec"]["containers"][0][ "resources" @@ -2168,6 +2202,10 @@

Methods

         Applies the AppWrapper yaml, pushing the resource request onto the MCAD queue.
         """
+
+        # check if RayCluster CustomResourceDefinition exists if not throw RuntimeError
+        self._throw_for_no_raycluster()
+
         namespace = self.config.namespace
         try:

diff --git a/docs/detailed-documentation/cluster/config.html b/docs/detailed-documentation/cluster/config.html
index c7b9ccfcd..1879afaf0 100644
--- a/docs/detailed-documentation/cluster/config.html
+++ b/docs/detailed-documentation/cluster/config.html
@@ -52,6 +52,7 @@

Module codeflare_sdk.cluster.config

 from dataclasses import dataclass, field
 import pathlib
+import typing

 dir = pathlib.Path(__file__).parent.parent.resolve()
@@ -66,15 +67,15 @@

Module codeflare_sdk.cluster.config

     name: str
     namespace: str = None
     head_info: list = field(default_factory=list)
-    head_cpus: int = 2
-    head_memory: int = 8
+    head_cpus: typing.Union[int, str] = 2
+    head_memory: typing.Union[int, str] = 8
     head_gpus: int = 0
     machine_types: list = field(default_factory=list)  # ["m4.xlarge", "g4dn.xlarge"]
-    min_cpus: int = 1
-    max_cpus: int = 1
+    min_cpus: typing.Union[int, str] = 1
+    max_cpus: typing.Union[int, str] = 1
     num_workers: int = 1
-    min_memory: int = 2
-    max_memory: int = 2
+    min_memory: typing.Union[int, str] = 2
+    max_memory: typing.Union[int, str] = 2
     num_gpus: int = 0
     template: str = f"{dir}/templates/base-template.yaml"
     instascale: bool = False
@@ -85,12 +86,31 @@

Module codeflare_sdk.cluster.config

     dispatch_priority: str = None
     write_to_file: bool = False
     verify_tls: bool = True
+    labels: dict = field(default_factory=dict)

     def __post_init__(self):
         if not self.verify_tls:
             print(
                 "Warning: TLS verification has been disabled - Endpoint checks will be bypassed"
             )
+        self._memory_to_string()
+        self._str_mem_no_unit_add_GB()
+
+    def _str_mem_no_unit_add_GB(self):
+        if isinstance(self.head_memory, str) and self.head_memory.isdecimal():
+            self.head_memory = f"{self.head_memory}G"
+        if isinstance(self.min_memory, str) and self.min_memory.isdecimal():
+            self.min_memory = f"{self.min_memory}G"
+        if isinstance(self.max_memory, str) and self.max_memory.isdecimal():
+            self.max_memory = f"{self.max_memory}G"
+
+    def _memory_to_string(self):
+        if isinstance(self.head_memory, int):
+            self.head_memory = f"{self.head_memory}G"
+        if isinstance(self.min_memory, int):
+            self.min_memory = f"{self.min_memory}G"
+        if isinstance(self.max_memory, int):
+            self.max_memory = f"{self.max_memory}G"

     local_queue: str = None
@@ -106,7 +126,7 @@
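Note: the example below is illustrative and not part of the patch. The two __post_init__ hooks above normalise plain integers and bare digit strings to a "<n>G" quantity, while strings that already carry a unit pass through untouched; labels is stored as-is and later merged into the generated resources.

    from codeflare_sdk.cluster.config import ClusterConfiguration

    cfg = ClusterConfiguration(
        name="demo",
        min_memory=4,        # int            -> "4G"  (_memory_to_string)
        max_memory="8",      # bare digits    -> "8G"  (_str_mem_no_unit_add_GB)
        head_memory="16Gi",  # already a unit -> left as "16Gi"
        labels={"team": "ml", "env": "dev"},
    )

    print(cfg.min_memory, cfg.max_memory, cfg.head_memory)  # 4G 8G 16Gi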

Classes

class ClusterConfiguration -(name: str, namespace: str = None, head_info: list = <factory>, head_cpus: int = 2, head_memory: int = 8, head_gpus: int = 0, machine_types: list = <factory>, min_cpus: int = 1, max_cpus: int = 1, num_workers: int = 1, min_memory: int = 2, max_memory: int = 2, num_gpus: int = 0, template: str = '/home/runner/work/codeflare-sdk/codeflare-sdk/src/codeflare_sdk/templates/base-template.yaml', instascale: bool = False, mcad: bool = False, envs: dict = <factory>, image: str = '', image_pull_secrets: list = <factory>, dispatch_priority: str = None, write_to_file: bool = False, verify_tls: bool = True, local_queue: str = None) +(name: str, namespace: str = None, head_info: list = <factory>, head_cpus: Union[int, str] = 2, head_memory: Union[int, str] = 8, head_gpus: int = 0, machine_types: list = <factory>, min_cpus: Union[int, str] = 1, max_cpus: Union[int, str] = 1, num_workers: int = 1, min_memory: Union[int, str] = 2, max_memory: Union[int, str] = 2, num_gpus: int = 0, template: str = '/home/runner/work/codeflare-sdk/codeflare-sdk/src/codeflare_sdk/templates/base-template.yaml', instascale: bool = False, mcad: bool = False, envs: dict = <factory>, image: str = '', image_pull_secrets: list = <factory>, dispatch_priority: str = None, write_to_file: bool = False, verify_tls: bool = True, labels: dict = <factory>, local_queue: str = None)

This dataclass is used to specify resource requirements and other details, and @@ -124,15 +144,15 @@

Classes

name: str namespace: str = None head_info: list = field(default_factory=list) - head_cpus: int = 2 - head_memory: int = 8 + head_cpus: typing.Union[int, str] = 2 + head_memory: typing.Union[int, str] = 8 head_gpus: int = 0 machine_types: list = field(default_factory=list) # ["m4.xlarge", "g4dn.xlarge"] - min_cpus: int = 1 - max_cpus: int = 1 + min_cpus: typing.Union[int, str] = 1 + max_cpus: typing.Union[int, str] = 1 num_workers: int = 1 - min_memory: int = 2 - max_memory: int = 2 + min_memory: typing.Union[int, str] = 2 + max_memory: typing.Union[int, str] = 2 num_gpus: int = 0 template: str = f"{dir}/templates/base-template.yaml" instascale: bool = False @@ -143,12 +163,31 @@

Classes

dispatch_priority: str = None write_to_file: bool = False verify_tls: bool = True + labels: dict = field(default_factory=dict) def __post_init__(self): if not self.verify_tls: print( "Warning: TLS verification has been disabled - Endpoint checks will be bypassed" ) + self._memory_to_string() + self._str_mem_no_unit_add_GB() + + def _str_mem_no_unit_add_GB(self): + if isinstance(self.head_memory, str) and self.head_memory.isdecimal(): + self.head_memory = f"{self.head_memory}G" + if isinstance(self.min_memory, str) and self.min_memory.isdecimal(): + self.min_memory = f"{self.min_memory}G" + if isinstance(self.max_memory, str) and self.max_memory.isdecimal(): + self.max_memory = f"{self.max_memory}G" + + def _memory_to_string(self): + if isinstance(self.head_memory, int): + self.head_memory = f"{self.head_memory}G" + if isinstance(self.min_memory, int): + self.min_memory = f"{self.min_memory}G" + if isinstance(self.max_memory, int): + self.max_memory = f"{self.max_memory}G" local_queue: str = None @@ -162,7 +201,7 @@

Class variables

-
var head_cpus : int
+
var head_cpus : Union[int, str]
@@ -174,7 +213,7 @@

Class variables

-
var head_memory : int
+
var head_memory : Union[int, str]
@@ -190,6 +229,10 @@

Class variables

+
var labels : dict
+
+
+
var local_queue : str
@@ -198,11 +241,11 @@

Class variables

-
var max_cpus : int
+
var max_cpus : Union[int, str]
-
var max_memory : int
+
var max_memory : Union[int, str]
@@ -210,11 +253,11 @@

Class variables

-
var min_cpus : int
+
var min_cpus : Union[int, str]
-
var min_memory : int
+
var min_memory : Union[int, str]
@@ -276,6 +319,7 @@

image
  • image_pull_secrets
  • instascale
  • +
  • labels
  • local_queue
  • machine_types
  • max_cpus
  • diff --git a/docs/detailed-documentation/utils/generate_yaml.html b/docs/detailed-documentation/utils/generate_yaml.html index fc7147800..141901016 100644 --- a/docs/detailed-documentation/utils/generate_yaml.html +++ b/docs/detailed-documentation/utils/generate_yaml.html @@ -171,8 +171,8 @@

    Module codeflare_sdk.utils.generate_yaml

     # Leave head node resources as template default
     resource["requests"]["cpu"] = head_cpus
     resource["limits"]["cpu"] = head_cpus
-    resource["requests"]["memory"] = str(head_memory) + "G"
-    resource["limits"]["memory"] = str(head_memory) + "G"
+    resource["requests"]["memory"] = head_memory
+    resource["limits"]["memory"] = head_memory
     resource["requests"]["nvidia.com/gpu"] = head_gpus
     resource["limits"]["nvidia.com/gpu"] = head_gpus
@@ -189,9 +189,9 @@

    Module codeflare_sdk.utils.generate_yaml

                         resource[k][spec] = min_cpu
                 if spec == "memory":
                     if k == "limits":
-                        resource[k][spec] = str(max_memory) + "G"
+                        resource[k][spec] = max_memory
                     else:
-                        resource[k][spec] = str(min_memory) + "G"
+                        resource[k][spec] = min_memory
                 if spec == "nvidia.com/gpu":
                     if i == 0:
                         resource[k][spec] = 0
@@ -244,12 +244,12 @@

    Module codeflare_sdk.utils.generate_yaml

         requests = resource.get("resources").get("requests")
         if requests is not None:
             requests["cpu"] = min_cpu
-            requests["memory"] = str(min_memory) + "G"
+            requests["memory"] = min_memory
             requests["nvidia.com/gpu"] = gpu
         limits = resource.get("resources").get("limits")
         if limits is not None:
             limits["cpu"] = max_cpu
-            limits["memory"] = str(max_memory) + "G"
+            limits["memory"] = max_memory
             limits["nvidia.com/gpu"] = gpu
@@ -340,7 +340,7 @@
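Note: illustrative only, not part of the patch. With the str(...) + "G" concatenation gone, the generated pod resources carry the memory quantities exactly as configured, since the values already arrive unit-suffixed from ClusterConfiguration.

    # Hypothetical container resources block from the base template.
    resource = {"resources": {"requests": {}, "limits": {}}}
    min_cpu, max_cpu = 1, 2
    min_memory, max_memory = "4G", "8G"  # already normalised by ClusterConfiguration
    gpu = 0

    requests = resource.get("resources").get("requests")
    if requests is not None:
        requests["cpu"] = min_cpu
        requests["memory"] = min_memory  # no further string surgery needed
        requests["nvidia.com/gpu"] = gpu

    limits = resource.get("resources").get("limits")
    if limits is not None:
        limits["cpu"] = max_cpu
        limits["memory"] = max_memory
        limits["nvidia.com/gpu"] = gpu

    print(resource)
    # {'resources': {'requests': {'cpu': 1, 'memory': '4G', 'nvidia.com/gpu': 0},
    #                'limits': {'cpu': 2, 'memory': '8G', 'nvidia.com/gpu': 0}}}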

    Module codeflare_sdk.utils.generate_yaml

 def write_components(
-    user_yaml: dict, output_file_name: str, namespace: str, local_queue: Optional[str]
+    user_yaml: dict,
+    output_file_name: str,
+    namespace: str,
+    local_queue: Optional[str],
+    labels: dict,
 ):
     # Create the directory if it doesn't exist
     directory_path = os.path.dirname(output_file_name)
@@ -350,6 +354,7 @@

    Module codeflare_sdk.utils.generate_yaml

     components = user_yaml.get("spec", "resources")["resources"].get("GenericItems")
     open(output_file_name, "w").close()
     lq_name = local_queue or get_default_kueue_name(namespace)
+    cluster_labels = labels
     with open(output_file_name, "a") as outfile:
         for component in components:
             if "generictemplate" in component:
@@ -362,6 +367,7 @@

    Module codeflare_sdk.utils.generate_yaml

                 ]
                 labels = component["generictemplate"]["metadata"]["labels"]
                 labels.update({"kueue.x-k8s.io/queue-name": lq_name})
+                labels.update(cluster_labels)
                 outfile.write("---\n")
                 yaml.dump(
                     component["generictemplate"], outfile, default_flow_style=False
@@ -370,11 +376,16 @@

    Module codeflare_sdk.utils.generate_yaml

 def load_components(
-    user_yaml: dict, name: str, namespace: str, local_queue: Optional[str]
+    user_yaml: dict,
+    name: str,
+    namespace: str,
+    local_queue: Optional[str],
+    labels: dict,
 ):
     component_list = []
     components = user_yaml.get("spec", "resources")["resources"].get("GenericItems")
     lq_name = local_queue or get_default_kueue_name(namespace)
+    cluster_labels = labels
     for component in components:
         if "generictemplate" in component:
             if (
@@ -386,6 +397,7 @@

    Module codeflare_sdk.utils.generate_yaml

                 ]
                 labels = component["generictemplate"]["metadata"]["labels"]
                 labels.update({"kueue.x-k8s.io/queue-name": lq_name})
+                labels.update(cluster_labels)
                 component_list.append(component["generictemplate"])

     resources = "---\n" + "---\n".join(
@@ -426,6 +438,7 @@
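Note: illustrative only, not part of the patch. Both write_components and load_components now apply the same merge to every generictemplate's metadata: the Kueue queue-name label first, then the user-supplied cluster labels.

    # Hypothetical generictemplate entry from an AppWrapper's GenericItems list.
    component = {
        "generictemplate": {
            "metadata": {"labels": {"workload.codeflare.dev/appwrapper": "demo"}}
        }
    }
    lq_name = "team-a-queue"                       # local_queue or the namespace default
    cluster_labels = {"team": "ml", "env": "dev"}  # ClusterConfiguration.labels

    labels = component["generictemplate"]["metadata"]["labels"]
    labels.update({"kueue.x-k8s.io/queue-name": lq_name})
    labels.update(cluster_labels)

    print(labels)
    # {'workload.codeflare.dev/appwrapper': 'demo',
    #  'kueue.x-k8s.io/queue-name': 'team-a-queue', 'team': 'ml', 'env': 'dev'}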

    Module codeflare_sdk.utils.generate_yaml

     write_to_file: bool,
     verify_tls: bool,
     local_queue: Optional[str],
+    labels,
 ):
     user_yaml = read_template(template)
     appwrapper_name, cluster_name = gen_names(name)
@@ -477,13 +490,13 @@

    Module codeflare_sdk.utils.generate_yaml

         if mcad:
             write_user_appwrapper(user_yaml, outfile)
         else:
-            write_components(user_yaml, outfile, namespace, local_queue)
+            write_components(user_yaml, outfile, namespace, local_queue, labels)
         return outfile
     else:
         if mcad:
             user_yaml = load_appwrapper(user_yaml, name)
         else:
-            user_yaml = load_components(user_yaml, name, namespace, local_queue)
+            user_yaml = load_components(user_yaml, name, namespace, local_queue, labels)
         return user_yaml
@@ -527,7 +540,7 @@

    Functions

    -def generate_appwrapper(name: str, namespace: str, head_cpus: int, head_memory: int, head_gpus: int, min_cpu: int, max_cpu: int, min_memory: int, max_memory: int, gpu: int, workers: int, template: str, image: str, instascale: bool, mcad: bool, instance_types: list, env, image_pull_secrets: list, dispatch_priority: str, priority_val: int, write_to_file: bool, verify_tls: bool, local_queue: Optional[str]) +def generate_appwrapper(name: str, namespace: str, head_cpus: int, head_memory: int, head_gpus: int, min_cpu: int, max_cpu: int, min_memory: int, max_memory: int, gpu: int, workers: int, template: str, image: str, instascale: bool, mcad: bool, instance_types: list, env, image_pull_secrets: list, dispatch_priority: str, priority_val: int, write_to_file: bool, verify_tls: bool, local_queue: Optional[str], labels)
    @@ -559,6 +572,7 @@

    Functions

    write_to_file: bool, verify_tls: bool, local_queue: Optional[str], + labels, ): user_yaml = read_template(template) appwrapper_name, cluster_name = gen_names(name) @@ -610,13 +624,13 @@

    Functions

    if mcad: write_user_appwrapper(user_yaml, outfile) else: - write_components(user_yaml, outfile, namespace, local_queue) + write_components(user_yaml, outfile, namespace, local_queue, labels) return outfile else: if mcad: user_yaml = load_appwrapper(user_yaml, name) else: - user_yaml = load_components(user_yaml, name, namespace, local_queue) + user_yaml = load_components(user_yaml, name, namespace, local_queue, labels) return user_yaml
    @@ -715,7 +729,7 @@

    Functions

    -def load_components(user_yaml: dict, name: str, namespace: str, local_queue: Optional[str]) +def load_components(user_yaml: dict, name: str, namespace: str, local_queue: Optional[str], labels: dict)
    @@ -724,11 +738,16 @@

    Functions

    Expand source code
    def load_components(
    -    user_yaml: dict, name: str, namespace: str, local_queue: Optional[str]
    +    user_yaml: dict,
    +    name: str,
    +    namespace: str,
    +    local_queue: Optional[str],
    +    labels: dict,
     ):
         component_list = []
         components = user_yaml.get("spec", "resources")["resources"].get("GenericItems")
         lq_name = local_queue or get_default_kueue_name(namespace)
    +    cluster_labels = labels
         for component in components:
             if "generictemplate" in component:
                 if (
    @@ -740,6 +759,7 @@ 

    Functions

    ] labels = component["generictemplate"]["metadata"]["labels"] labels.update({"kueue.x-k8s.io/queue-name": lq_name}) + labels.update(cluster_labels) component_list.append(component["generictemplate"]) resources = "---\n" + "---\n".join( @@ -819,8 +839,8 @@

    Functions

    # Leave head node resources as template default resource["requests"]["cpu"] = head_cpus resource["limits"]["cpu"] = head_cpus - resource["requests"]["memory"] = str(head_memory) + "G" - resource["limits"]["memory"] = str(head_memory) + "G" + resource["requests"]["memory"] = head_memory + resource["limits"]["memory"] = head_memory resource["requests"]["nvidia.com/gpu"] = head_gpus resource["limits"]["nvidia.com/gpu"] = head_gpus @@ -837,9 +857,9 @@

    Functions

    resource[k][spec] = min_cpu if spec == "memory": if k == "limits": - resource[k][spec] = str(max_memory) + "G" + resource[k][spec] = max_memory else: - resource[k][spec] = str(min_memory) + "G" + resource[k][spec] = min_memory if spec == "nvidia.com/gpu": if i == 0: resource[k][spec] = 0 @@ -1037,17 +1057,17 @@

    Functions

    requests = resource.get("resources").get("requests") if requests is not None: requests["cpu"] = min_cpu - requests["memory"] = str(min_memory) + "G" + requests["memory"] = min_memory requests["nvidia.com/gpu"] = gpu limits = resource.get("resources").get("limits") if limits is not None: limits["cpu"] = max_cpu - limits["memory"] = str(max_memory) + "G" + limits["memory"] = max_memory limits["nvidia.com/gpu"] = gpu
    -def write_components(user_yaml: dict, output_file_name: str, namespace: str, local_queue: Optional[str]) +def write_components(user_yaml: dict, output_file_name: str, namespace: str, local_queue: Optional[str], labels: dict)
    @@ -1056,7 +1076,11 @@

    Functions

    Expand source code
    def write_components(
    -    user_yaml: dict, output_file_name: str, namespace: str, local_queue: Optional[str]
    +    user_yaml: dict,
    +    output_file_name: str,
    +    namespace: str,
    +    local_queue: Optional[str],
    +    labels: dict,
     ):
         # Create the directory if it doesn't exist
         directory_path = os.path.dirname(output_file_name)
    @@ -1066,6 +1090,7 @@ 

    Functions

    components = user_yaml.get("spec", "resources")["resources"].get("GenericItems") open(output_file_name, "w").close() lq_name = local_queue or get_default_kueue_name(namespace) + cluster_labels = labels with open(output_file_name, "a") as outfile: for component in components: if "generictemplate" in component: @@ -1078,6 +1103,7 @@

    Functions

                 ]
                 labels = component["generictemplate"]["metadata"]["labels"]
                 labels.update({"kueue.x-k8s.io/queue-name": lq_name})
+                labels.update(cluster_labels)
                 outfile.write("---\n")
                 yaml.dump(
                     component["generictemplate"], outfile, default_flow_style=False

diff --git a/docs/detailed-documentation/utils/pretty_print.html b/docs/detailed-documentation/utils/pretty_print.html
index e7c108256..2e7a69b81 100644
--- a/docs/detailed-documentation/utils/pretty_print.html
+++ b/docs/detailed-documentation/utils/pretty_print.html
@@ -167,7 +167,7 @@

    Module codeflare_sdk.utils.pretty_print

     name = cluster.name
     dashboard = cluster.dashboard
     workers = str(cluster.workers)
-    memory = str(cluster.worker_mem_min) + "~" + str(cluster.worker_mem_max)
+    memory = f"{cluster.worker_mem_min}~{cluster.worker_mem_max}"
     cpu = str(cluster.worker_cpu)
     gpu = str(cluster.worker_gpu)
@@ -345,7 +345,7 @@
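Note: illustrative only, not part of the patch. Since the worker memory fields are now quantity strings, the status table simply joins them with an f-string.

    worker_mem_min, worker_mem_max = "4G", "8G"
    memory = f"{worker_mem_min}~{worker_mem_max}"
    print(memory)  # 4G~8G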

    Functions

     name = cluster.name
     dashboard = cluster.dashboard
     workers = str(cluster.workers)
-    memory = str(cluster.worker_mem_min) + "~" + str(cluster.worker_mem_max)
+    memory = f"{cluster.worker_mem_min}~{cluster.worker_mem_max}"
    cpu = str(cluster.worker_cpu)
    gpu = str(cluster.worker_gpu)