
Commit 18b91f7

Merge pull request #4 from openshift-psap/yaml-gen
Added YAML Generation Script/Template
2 parents 12c2327 + e328cc9

File tree

2 files changed: +329 additions, -0 deletions
Lines changed: 220 additions & 0 deletions
@@ -0,0 +1,220 @@
apiVersion: mcad.ibm.com/v1beta1
kind: AppWrapper
metadata:
  name: aw-kuberay-glue
  namespace: default
spec:
  priority: 9
  resources:
    Items: []
    GenericItems:
    - replicas: 1
      custompodresources:
      - replicas: 4
        requests:
          cpu: 2
          memory: 12G
          nvidia.com/gpu: 1
        limits:
          cpu: 2
          memory: 12G
          nvidia.com/gpu: 1
      generictemplate:
        # This config demonstrates KubeRay's Ray autoscaler integration.
        # The resource requests and limits in this config are too small for production!
        # For an example with more realistic resource configuration, see
        # ray-cluster.autoscaler.large.yaml.
        apiVersion: ray.io/v1alpha1
        kind: RayCluster
        metadata:
          labels:
            appwrapper.mcad.ibm.com: "aw-kuberay-glue"
            controller-tools.k8s.io: "1.0"
          # A unique identifier for the head node and workers of this cluster.
          name: glue-cluster
          # finalizers:
          # - kubernetes
        spec:
          # The version of Ray you are using. Make sure all Ray containers are running this version of Ray.
          rayVersion: '1.12.0'
          # If enableInTreeAutoscaling is true, the autoscaler sidecar will be added to the Ray head pod.
          # Ray autoscaler integration is supported only for Ray versions >= 1.11.0
          # Ray autoscaler integration is Beta with KubeRay >= 0.3.0 and Ray >= 2.0.0.
          enableInTreeAutoscaling: false
          # autoscalerOptions is an OPTIONAL field specifying configuration overrides for the Ray autoscaler.
          # The example configuration shown below represents the DEFAULT values.
          # (You may delete autoscalerOptions if the defaults are suitable.)
          autoscalerOptions:
            # upscalingMode is "Default" or "Aggressive."
            # Conservative: Upscaling is rate-limited; the number of pending worker pods is at most the size of the Ray cluster.
            # Default: Upscaling is not rate-limited.
            # Aggressive: An alias for Default; upscaling is not rate-limited.
            upscalingMode: Default
            # idleTimeoutSeconds is the number of seconds to wait before scaling down a worker pod which is not using Ray resources.
            idleTimeoutSeconds: 60
            # image optionally overrides the autoscaler's container image.
            # If instance.spec.rayVersion is at least "2.0.0", the autoscaler will default to the same image as
            # the ray container. For older Ray versions, the autoscaler will default to using the Ray 2.0.0 image.
            ## image: "my-repo/my-custom-autoscaler-image:tag"
            # imagePullPolicy optionally overrides the autoscaler container's image pull policy.
            imagePullPolicy: Always
            # resources specifies optional resource request and limit overrides for the autoscaler container.
            # For large Ray clusters, we recommend monitoring container resource usage to determine if overriding the defaults is required.
            resources:
              limits:
                cpu: "500m"
                memory: "512Mi"
              requests:
                cpu: "500m"
                memory: "512Mi"
          ######################headGroupSpec#################################
          # head group template and specs, (perhaps 'group' is not needed in the name)
          headGroupSpec:
            # Kubernetes Service Type, valid values are 'ClusterIP', 'NodePort' and 'LoadBalancer'
            serviceType: ClusterIP
            # logical group name, for this called head-group, also can be functional
            # pod type head or worker
            # rayNodeType: head # Not needed since it is under the headgroup
            # the following params are used to complete the ray start: ray start --head --block ...
            rayStartParams:
              # Flag "no-monitor" will be automatically set when autoscaling is enabled.
              dashboard-host: '0.0.0.0'
              block: 'true'
              # num-cpus: '1' # can be auto-completed from the limits
              # Use `resources` to optionally specify custom resource annotations for the Ray node.
              # The value of `resources` is a string-integer mapping.
              # Currently, `resources` must be provided in the specific format demonstrated below:
              # resources: '"{\"Custom1\": 1, \"Custom2\": 5}"'
              num-gpus: '0'
            #pod template
            template:
              spec:
                affinity:
                  nodeAffinity:
                    requiredDuringSchedulingIgnoredDuringExecution:
                      nodeSelectorTerms:
                      - matchExpressions:
                        - key: role
                          operator: In
                          values:
                          - "aw-kuberay-glue"
                containers:
                # The Ray head pod
                - name: ray-head
                  image: asm582/codeflare-tl-aws:latest
                  env:
                  - name: AWS_ACCESS_KEY_ID
                    valueFrom:
                      secretKeyRef:
                        name: glue-s3-creds
                        key: AWS_ACCESS_KEY_ID
                  - name: AWS_SECRET_ACCESS_KEY
                    valueFrom:
                      secretKeyRef:
                        name: glue-s3-creds
                        key: AWS_SECRET_ACCESS_KEY
                  - name: ENDPOINT_URL
                    valueFrom:
                      secretKeyRef:
                        name: glue-s3-creds
                        key: ENDPOINT_URL
                  imagePullPolicy: Always
                  ports:
                  - containerPort: 6379
                    name: gcs
                  - containerPort: 8265
                    name: dashboard
                  - containerPort: 10001
                    name: client
                  lifecycle:
                    preStop:
                      exec:
                        command: ["/bin/sh","-c","ray stop"]
                  resources:
                    limits:
                      cpu: "2"
                      memory: "12G"
                      nvidia.com/gpu: "0"
                    requests:
                      cpu: "2"
                      memory: "12G"
                      nvidia.com/gpu: "0"
          workerGroupSpecs:
          # the pod replicas in this group typed worker
          - replicas: 3
            minReplicas: 3
            maxReplicas: 3
            # logical group name, for this called small-group, also can be functional
            groupName: small-group
            # if worker pods need to be added, we can simply increment the replicas
            # if worker pods need to be removed, we decrement the replicas, and populate the podsToDelete list
            # the operator will remove pods from the list until the number of replicas is satisfied
            # when a pod is confirmed to be deleted, its name will be removed from the list below
            #scaleStrategy:
            #  workersToDelete:
            #  - raycluster-complete-worker-small-group-bdtwh
            #  - raycluster-complete-worker-small-group-hv457
            #  - raycluster-complete-worker-small-group-k8tj7
            # the following params are used to complete the ray start: ray start --block ...
            rayStartParams:
              block: 'true'
              num-gpus: '1'
            #pod template
            template:
              metadata:
                labels:
                  key: value
                # annotations for pod
                annotations:
                  key: value
                # finalizers:
                # - kubernetes
              spec:
                affinity:
                  nodeAffinity:
                    requiredDuringSchedulingIgnoredDuringExecution:
                      nodeSelectorTerms:
                      - matchExpressions:
                        - key: role
                          operator: In
                          values:
                          - "aw-kuberay-glue"
                initContainers:
                # the env var $RAY_IP is set by the operator if missing, with the value of the head service name
                - name: init-myservice
                  image: busybox:1.28
                  command: ['sh', '-c', "until nslookup $RAY_IP.$(cat /var/run/secrets/kubernetes.io/serviceaccount/namespace).svc.cluster.local; do echo waiting for myservice; sleep 2; done"]
                containers:
                - name: machine-learning # must consist of lower case alphanumeric characters or '-', and must start and end with an alphanumeric character (e.g. 'my-name', or '123-abc')
                  image: asm582/codeflare-tl-aws:latest
                  env:
                  - name: AWS_ACCESS_KEY_ID
                    valueFrom:
                      secretKeyRef:
                        name: glue-s3-creds
                        key: AWS_ACCESS_KEY_ID
                  - name: AWS_SECRET_ACCESS_KEY
                    valueFrom:
                      secretKeyRef:
                        name: glue-s3-creds
                        key: AWS_SECRET_ACCESS_KEY
                  - name: ENDPOINT_URL
                    valueFrom:
                      secretKeyRef:
                        name: glue-s3-creds
                        key: ENDPOINT_URL
                  # environment variables to set in the container. Optional.
                  # Refer to https://kubernetes.io/docs/tasks/inject-data-application/define-environment-variable-container/
                  lifecycle:
                    preStop:
                      exec:
                        command: ["/bin/sh","-c","ray stop"]
                  resources:
                    limits:
                      cpu: "2"
                      memory: "12G"
                      nvidia.com/gpu: "1"
                    requests:
                      cpu: "2"
                      memory: "12G"
                      nvidia.com/gpu: "1"
Lines changed: 109 additions & 0 deletions
@@ -0,0 +1,109 @@
import yaml
import sys
import argparse
import uuid

def readTemplate(template):
    with open(template, "r") as stream:
        try:
            return yaml.safe_load(stream)
        except yaml.YAMLError as exc:
            print(exc)

def gen_names():
    gen_id = str(uuid.uuid4())
    appwrapper_name = "appwrapper-" + gen_id
    cluster_name = "cluster-" + gen_id
    return appwrapper_name, cluster_name

def update_names(yaml, item, appwrapper_name, cluster_name):
    metadata = yaml.get("metadata")
    metadata["name"] = appwrapper_name
    lower_meta = item.get("generictemplate", {}).get("metadata")
    lower_meta["labels"]["appwrapper.mcad.ibm.com"] = appwrapper_name
    lower_meta["name"] = cluster_name

def updateCustompodresources(item, cpu, memory, gpu, workers):
    if 'custompodresources' in item.keys():
        custompodresources = item.get('custompodresources')
        for resource in custompodresources:
            for k, v in resource.items():
                if k == "replicas":
                    resource[k] = workers
                if k == "requests" or k == "limits":
                    for spec, _ in v.items():
                        if spec == "cpu":
                            resource[k][spec] = cpu
                        if spec == "memory":
                            resource[k][spec] = str(memory) + "G"
                        if spec == "nvidia.com/gpu":
                            resource[k][spec] = gpu
    else:
        sys.exit("Error: malformed template")

def update_affinity(spec, appwrapper_name):
    node_selector_terms = spec.get("affinity").get("nodeAffinity").get("requiredDuringSchedulingIgnoredDuringExecution").get("nodeSelectorTerms")
    node_selector_terms[0]["matchExpressions"][0]["values"][0] = appwrapper_name

def update_resources(spec, cpu, memory, gpu):
    container = spec.get("containers")
    for resource in container:
        requests = resource.get('resources').get('requests')
        if requests is not None:
            requests["cpu"] = cpu
            requests["memory"] = str(memory) + "G"
            requests["nvidia.com/gpu"] = gpu
        limits = resource.get('resources').get('limits')
        if limits is not None:
            limits["cpu"] = cpu
            limits["memory"] = str(memory) + "G"
            limits["nvidia.com/gpu"] = gpu

def update_nodes(item, appwrapper_name, cpu, memory, gpu, workers):
    if "generictemplate" in item.keys():
        head = item.get("generictemplate").get("spec").get("headGroupSpec")
        worker = item.get("generictemplate").get("spec").get("workerGroupSpecs")[0]

        # Head counts as first worker
        worker["replicas"] = workers - 1
        worker["minReplicas"] = workers - 1
        worker["maxReplicas"] = workers - 1

        for comp in [head, worker]:
            spec = comp.get("template").get("spec")
            update_affinity(spec, appwrapper_name)
            update_resources(spec, cpu, memory, gpu)

def generateAppwrapper(cpu, memory, gpu, workers, template):
    user_yaml = readTemplate(template)
    appwrapper_name, cluster_name = gen_names()
    resources = user_yaml.get("spec", "resources")
    item = resources["resources"].get("GenericItems")[0]
    update_names(user_yaml, item, appwrapper_name, cluster_name)
    updateCustompodresources(item, cpu, memory, gpu, workers)
    update_nodes(item, appwrapper_name, cpu, memory, gpu, workers)
    writeUserAppwrapper(user_yaml, appwrapper_name)

def writeUserAppwrapper(user_yaml, appwrapper_name):
    with open(f'{appwrapper_name}.yaml', 'w') as outfile:
        yaml.dump(user_yaml, outfile, default_flow_style=False)

def main():
    parser = argparse.ArgumentParser(description='Generate user AppWrapper')
    parser.add_argument("--cpu", type=int, required=True, help="number of CPU(s) in a worker required for running job")
    parser.add_argument("--memory", required=True, help="RAM required in a worker for running job")
    parser.add_argument("--gpu", type=int, required=True, help="GPU(s) required in a worker for running job")
    parser.add_argument("--workers", type=int, required=True, help="How many workers are required in the cluster")
    parser.add_argument("--template", required=True, help="Template AppWrapper yaml file")

    args = parser.parse_args()
    cpu = args.cpu
    memory = args.memory
    gpu = args.gpu
    workers = args.workers
    template = args.template

    generateAppwrapper(cpu, memory, gpu, workers, template)

if __name__ == "__main__":
    main()
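
For reference, a minimal sketch of how the generator might be driven programmatically rather than through the --cpu/--memory/--gpu/--workers/--template command-line flags above. The module name generate_appwrapper and the template filename aw-kuberay-glue.template.yaml are assumptions for illustration, not part of this commit.

# Hypothetical usage sketch: the module name and template filename are
# assumptions, not part of this commit.
from generate_appwrapper import generateAppwrapper

# Writes appwrapper-<uuid>.yaml to the current directory: the AppWrapper and
# RayCluster names are regenerated, worker replicas are set to workers - 1
# (the head counts as the first worker), and the head/worker requests and
# limits are set to the given cpu, memory (in G), and gpu values.
generateAppwrapper(cpu=2, memory=12, gpu=1, workers=5,
                   template="aw-kuberay-glue.template.yaml")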
