From 403c3bbe97ddb31e79bd2d4b897ef3b911ee0859 Mon Sep 17 00:00:00 2001 From: SandraGH5 <80421934+SandraGH5@users.noreply.github.com> Date: Fri, 21 May 2021 00:34:03 -0700 Subject: [PATCH] Update config_flyte_deploy.py (#225) * Update config_flyte_deploy.py * update config-flyte-deploy (#232) Signed-off-by: Samhita Alla * Fix links & add flytectl references (#239) * update config-flyte-deploy Signed-off-by: Samhita Alla * fix links Signed-off-by: Samhita Alla Co-authored-by: Samhita Alla --- cookbook/deployment/cluster/README.rst | 9 + .../deployment/cluster/config_flyte_deploy.py | 8 - .../cluster/config_flyte_deploy.rst | 192 ++++++++++++++++++ cookbook/docs/conf.py | 6 + 4 files changed, 207 insertions(+), 8 deletions(-) delete mode 100644 cookbook/deployment/cluster/config_flyte_deploy.py create mode 100644 cookbook/deployment/cluster/config_flyte_deploy.rst diff --git a/cookbook/deployment/cluster/README.rst b/cookbook/deployment/cluster/README.rst index 7b658f6589..7bf7cde606 100644 --- a/cookbook/deployment/cluster/README.rst +++ b/cookbook/deployment/cluster/README.rst @@ -132,3 +132,12 @@ Using remote Flyte gives you the ability to: - Use caching to avoid calling the same task with the same inputs (for the same version) - Portability: You can reference pre-registered entities under any domain or project within your workflow code - Sharable executions: you can easily share links to your executions with your teammates + +.. toctree:: + :caption: Cluster Deployment + :hidden: + + config_flyte_deploy + auth_setup + monitoring + access_cloud_resources \ No newline at end of file diff --git a/cookbook/deployment/cluster/config_flyte_deploy.py b/cookbook/deployment/cluster/config_flyte_deploy.py deleted file mode 100644 index a932610b77..0000000000 --- a/cookbook/deployment/cluster/config_flyte_deploy.py +++ /dev/null @@ -1,8 +0,0 @@ -""" -Configuring Your Flyte Deployment --------------------------------------------- - -.. 
NOTE:: - - Coming soon 🛠 -""" diff --git a/cookbook/deployment/cluster/config_flyte_deploy.rst b/cookbook/deployment/cluster/config_flyte_deploy.rst new file mode 100644 index 0000000000..760d3e33fa --- /dev/null +++ b/cookbook/deployment/cluster/config_flyte_deploy.rst @@ -0,0 +1,192 @@ +################################# +Configuring Your Flyte Deployment +################################# + +As the complexity of your user base grows, you may find yourself tweaking resource assignments based on specific projects, domains, and workflows. This document walks through how and in what ways you can configure your Flyte deployment. + +.. _config_resource_types: + +*************************** +Configurable Resource Types +*************************** +Flyte allows these custom settings along the following combinations of dimensions: + +- domain +- project and domain +- project, domain, and name (must be either the name of a workflow or a launch plan) + +Please see the :doc:`Control Plane ` document to get to know about projects and domains. +Along these dimensions, the following settings are configurable. + +.. admonition:: Alert + Not all three of the combinations mentioned above are valid for each of these settings. + +- Defaults are used for task resource requests and limits (when not specified by the author of the task). +- Settings for project-namespaced cluster resource configuration that feeds into admin's cluster resource manager. +- Execution queues that are used for dynamic workflows. Effectively, they're meant to be used with constructs like AWS Batch. + +.. note:: + Execution queues are used to determine where tasks yielded by a :py:func:`flytekit:flytekit.dynamic` workflow or ``map task`` run. + +- Determining how workflow executions are assigned to clusters in a multi-cluster Flyte deployment. + +.. tip:: + The proto definition is the definitive source encapsulating which :ref:`Matchable Resource ` attributes can be customized. 
+ +Each of the four above settings is discussed below. + +Task Resources +============== +Configuring task resources includes setting default values for the requests and limits for the following resources: + +- cpu +- gpu +- memory +- storage + +In the absence of an override, the global +`default values `__ +in the FlyteAdmin config are used. + +The override values from the database are assigned at execution time. + +To update individual project-domain attributes, use the following command for your reference. + +.. prompt:: bash + + curl --request PUT 'https://flyte.company.net/api/v1/project_domain_attributes/projectname/staging' \ + --header 'Content-Type: application/json' --data-raw \ + '{"attributes":{"matchingAttributes":{"taskResourceAttributes":{"defaults":{"cpu": "1000", "memory": "5000Gi"}, "limits": {"cpu": "4000"}}}}}' + +.. tip:: + The equivalent ``flytectl`` command is: + + .. prompt:: bash + flytectl update task-resource-attribute + + Refer to the :ref:`docs ` to learn more about the command and its supported flag(s). + +Cluster Resources +================= +These are free-form key-value pairs that are used when filling in the templates that the admin feeds into its cluster manager. The keys represent templatized variables in `cluster resource template YAML `__ and the values are what you want to see filled in. + +In the absence of custom override values, ``templateData`` from the `FlyteAdmin config `__ is used as a default. + +.. note:: + The above-referenced settings can only take on domain, or project and domain, specificity. Since Flyte has not tied in the notion of a workflow or a launch plan to any Kubernetes constructs, specifying a workflow or launch plan name doesn't make any sense. + +Running the following will ensure that when the admin fills in cluster resource templates, the Kubernetes namespace ``flyteexamples-development`` will have a resource quota of 1000 CPU cores and 5TB of memory. + +.. 
prompt:: bash + + flyte-cli -h localhost:30081 -p flyteexamples -d development update-cluster-resource-attributes \ + --attributes projectQuotaCpu 1000 --attributes projectQuotaMemory 5000Gi + +.. tip:: + The equivalent ``flytectl`` command is: + + .. prompt:: bash + flytectl update cluster-resource-attribute + + Refer to the :ref:`docs ` to learn more about the command and its supported flag(s). + +The above-updated values will, in turn, be used to fill in the template fields. + +.. rli:: https://raw.githubusercontent.com/flyteorg/flyte/master/kustomize/base/single_cluster/headless/config/clusterresource-templates/ab_project-resource-quota.yaml + +The values can now be copied from the base of this repository to the ``flyteexamples-development`` namespace only. + +For other namespaces, the `platform defaults `__ apply. + +.. note:: + The template values, e.g. ``projectQuotaCpu`` or ``projectQuotaMemory`` are freeform strings. You must ensure that they match the template placeholders in your `template file `__ + for your changes to take effect. + +Execution Queues +================ +Execution queues themselves are currently defined in the +`flyteadmin config `__. + +The **attributes** associated with an execution queue must match the **tags** for workflow executions. The tags are associated with configurable resources +stored in the admin database. + +.. prompt:: bash + + flyte-cli -h localhost:30081 -p flyteexamples -d development update-execution-queue-attributes \ + --tags critical --tags gpu_intensive + +.. tip:: + The equivalent command in ``flytectl`` is: + + .. prompt:: bash + flytectl update execution-queue-attribute + + Refer to the :ref:`docs ` to learn more about the command and its supported flag(s). + +You can view existing attributes for which tags can be assigned by visiting ``protocol:///api/v1/matchable_attributes?resource_type=3``. 
+ +Execution Cluster Label +======================= +This allows forcing a matching execution to consistently execute on a specific Kubernetes cluster. + +You can set this using flyte-cli: + +.. prompt:: bash + + flyte-cli -h localhost:30081 -p flyteexamples -d development update-execution-cluster-label --value mycluster + +.. tip:: + The equivalent command in ``flytectl`` is: + + .. prompt:: bash + flytectl update execution-cluster-label + + Refer to the :ref:`docs ` to learn more about the command and its supported flag(s). + +********* +Hierarchy +********* +Increasing specificity defines how matchable resource attributes get applied. The available configurations, in order of decreasing specificity, are: + +#. Domain, project, workflow name, and launch plan. + +#. Domain, project, and workflow name + +#. Domain and project + +#. Domain + +Default values for all and per-domain attributes may be specified in the FlyteAdmin config as documented in the :ref:`config_resource_types`. + +Example +======= +If the database includes the following: + ++------------+--------------+----------+-------------+-----------+ +| Domain | Project | Workflow | Launch Plan | Tags | ++============+==============+==========+=============+===========+ +| production | widgetmodels | | | critical | ++------------+--------------+----------+-------------+-----------+ +| production | widgetmodels | Demand | | supply | ++------------+--------------+----------+-------------+-----------+ + +Any inbound ``CreateExecution`` requests with **[Domain: Production, Project: widgetmodels, Workflow: Demand]** for any launch plan will have a tag value of "supply". + +Any inbound ``CreateExecution`` requests with **[Domain: Production, Project: widgetmodels]** for any workflow other than ``Demand`` and any launch plan will have a tag value of "critical". + +All other inbound ``CreateExecution`` requests will use the default values specified in the FlyteAdmin config (if any). 
+ +********* +Debugging +********* +To get the matchable resources of :ref:`execution queue attributes `, run the command: + +.. prompt:: bash + flytectl get execution-queue-attribute + +.. note:: + Alternatively, you can also hit the URL: ``protocol://``. + +To get the global state of the world, list all endpoints. For example, visit ``protocol:///api/v1/matchable_attributes?resource_type=2``. + +The resource type enum (int) is defined in the :ref:`Matchable Resource `. diff --git a/cookbook/docs/conf.py b/cookbook/docs/conf.py index 768e580604..705835aef3 100644 --- a/cookbook/docs/conf.py +++ b/cookbook/docs/conf.py @@ -17,6 +17,7 @@ import shutil import sys +from sphinx.errors import ConfigError from sphinx_gallery.sorting import FileNameSortKey sys.path.insert(0, os.path.abspath("../")) @@ -145,6 +146,7 @@ def __call__(self, filename): "sphinx-prompt", "sphinx_copybutton", "sphinx_search.extension", + "sphinxext.remoteliteralinclude", ] # Add any paths that contain templates here, relative to this directory. @@ -310,6 +312,9 @@ def __call__(self, filename): # }, } +if len(examples_dirs) != len(gallery_dirs): + raise ConfigError("examples_dirs and gallery_dirs aren't of the same length") + for i in range(len(sphinx_gallery_conf["examples_dirs"])): gallery_dir = sphinx_gallery_conf["gallery_dirs"][i] source_dir = sphinx_gallery_conf["examples_dirs"][i] @@ -338,4 +343,5 @@ def __call__(self, filename): # Uncomment for local development and change to your username # "flytekit": ("/Users/ytong/go/src/github.com/lyft/flytekit/docs/build/html", None), "flyteidl": ("https://docs.flyte.org/projects/flyteidl/en/latest", None), + "flytectl": ("https://docs.flyte.org/projects/flytectl/en/latest/", None), }