Separate out the distributed tuning doc, and make sure client_id is unique.

xingyousong · copybara-github · commit e0d923e0196e · 2025-01-06T09:57:38.000-08:00
User didn't realize `client_id` was supposed to be unique: #1215 (comment) PiperOrigin-RevId: 712563313
diff --git a/demos/run_vizier_client.py b/demos/run_vizier_client.py
@@ -36,7 +36,6 @@
 from absl import app
 from absl import flags
 from absl import logging
-
 from vizier import service
 from vizier.service import clients
 from vizier.service import pyvizier as vz
@@ -72,6 +71,12 @@
         ' and API.'
     ),
 )
+flags.DEFINE_string(
+    'client_id',
+    clients.UNUSED_CLIENT_ID,
+    'The client id to use for the study. NOTE: For distributed cases, this'
+    ' needs to be unique for every client.',
+)
 
 FLAGS = flags.FLAGS
 
@@ -138,7 +143,9 @@ def main(argv: Sequence[str]) -> None:
 
   # Evaluate the suggestion(s) and report the results to Vizier.
   for _ in range(FLAGS.max_num_iterations):
-    trials = study.suggest(count=FLAGS.suggestion_count)
+    trials = study.suggest(
+        count=FLAGS.suggestion_count, client_id=FLAGS.client_id
+    )
     for trial in trials:
       materialized_trial = trial.materialize()
       measurement = evaluate_trial(materialized_trial)
diff --git a/docs/guides/index.rst b/docs/guides/index.rst
@@ -8,6 +8,7 @@ For Users
     :maxdepth: 1
 
     user/running_vizier
+    user/distributed
     user/search_spaces
     user/converters
     Switching to Vertex <https://github.com/GoogleCloudPlatform/vertex-ai-samples/blob/main/notebooks/community/vizier/conversions_vertex_vizier_and_open_source_vizier.ipynb>
diff --git a/docs/guides/user/distributed.ipynb b/docs/guides/user/distributed.ipynb
@@ -0,0 +1,204 @@
+{
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "Xgqk7eHswDpB"
+      },
+      "source": [
+        "[![Open in Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/google/vizier/blob/main/docs/guides/user/distributed.ipynb)\n",
+        "\n",
+        "# Distributed Vizier\n",
+        "This documentation shows how to perform distributed optimization over multiple clients."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "O5RnMytPR8Aw"
+      },
+      "source": [
+        "## Installation and reference imports"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "id": "kSG8XlxLvCJO"
+      },
+      "outputs": [],
+      "source": [
+        "!pip install google-vizier[jax]"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "id": "fzYr0bPYSHfQ"
+      },
+      "outputs": [],
+      "source": [
+        "import multiprocessing\n",
+        "\n",
+        "from vizier import service\n",
+        "from vizier.service import clients\n",
+        "from vizier.service import pyvizier as vz\n",
+        "from vizier.service import servers"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "qJ1kRiHaKOVt"
+      },
+      "source": [
+        "## Regular setup\n",
+        "We set up a regular study configuration below."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "id": "zX2G3_pcKYdG"
+      },
+      "outputs": [],
+      "source": [
+        "study_config = vz.StudyConfig()\n",
+        "study_config.search_space.root.add_float_param('x', 0.0, 1.0)\n",
+        "study_config.metric_information.append(vz.MetricInformation(name='metric', goal=vz.ObjectiveMetricGoal.MAXIMIZE))\n",
+        "study_config.algorithm = 'DEFAULT'\n",
+        "\n",
+        "\n",
+        "def evaluate(x: float) -\u003e float:\n",
+        "  return 2*x - x**2"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "w3m48cPsXcxD"
+      },
+      "source": [
+        "## Server creation\n",
+        "Unlike the single-client case, in the distributed case, we require a single explicit server to accept requests from all other client processes. Details such as the `host`, `port`, `database_url`, `policy_factory`, etc. can be configured in the server's initializer."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "id": "V6ef6OfMXdpz"
+      },
+      "outputs": [],
+      "source": [
+        "server = servers.DefaultVizierServer()  # Ideally created on a separate process such as a server machine."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "ktExEiS0xlH_"
+      },
+      "source": [
+        "## Client parallelization\n",
+        "We may simultaneously create multiple clients to work on the same study, which is useful for parallelizing the evaluation workload. All client processes (on a single machine or over multiple machines) will connect to this server via a globally specified `endpoint`."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "id": "EQR1_u-VxEwn"
+      },
+      "outputs": [],
+      "source": [
+        "clients.environment_variables.server_endpoint = server.endpoint  # Server address.\n",
+        "study_client = clients.Study.from_study_config(study_config, owner='owner', study_id = 'example_study_id')  # Now connects to the explicitly created server.\n",
+        "another_study_client = clients.Study.from_resource_name(study_client.resource_name)  # Another way to fork clients."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "Vh3eNsrAdaMJ"
+      },
+      "source": [
+        "## Distributed suggestions\n",
+        "We may now distribute our workflow, with each worker/client using the same loop below. However, each client requires a unique `client_id` so that the server can identify client workers and distribute workloads properly."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "id": "BnFKc7FadkJV"
+      },
+      "outputs": [],
+      "source": [
+        "def tuning_loop(client_id: str):\n",
+        "  for i in range(10):\n",
+        "    suggestions = study_client.suggest(count=1, client_id=client_id)\n",
+        "    for suggestion in suggestions:\n",
+        "      objective = evaluate(suggestion.parameters['x'])\n",
+        "      final_measurement = vz.Measurement({'metric': objective})\n",
+        "      suggestion.complete(final_measurement)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "NVGcVEzb0Gxe"
+      },
+      "source": [
+        "For example, we may create a thread pool and run multiple clients to parallelize evaluations on a single machine."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "id": "R0pcPViUz9zC"
+      },
+      "outputs": [],
+      "source": [
+        "NUM_CLIENTS = 10\n",
+        "NUM_TRIALS_PER_CLIENT = 50\n",
+        "\n",
+        "pool = multiprocessing.pool.ThreadPool(NUM_CLIENTS)\n",
+        "pool.map(tuning_loop, range(NUM_CLIENTS))"
+      ]
+    }
+  ],
+  "metadata": {
+    "colab": {
+      "last_runtime": {
+        "build_target": "//ads/thresholds/kumamon/colab:notebook",
+        "kind": "shared"
+      },
+      "name": "Distributed.ipynb",
+      "private_outputs": true,
+      "provenance": [
+        {
+          "file_id": "/piper/depot/http://github.com/google/vizier/tree/main/vizier/docs/guides/user/running_vizier.ipynb",
+          "timestamp": 1673247218127
+        },
+        {
+          "file_id": "1q87rsDDUJLHci3o9Gv-sU0g7H3O3lAbU",
+          "timestamp": 1659555396142
+        }
+      ]
+    },
+    "kernelspec": {
+      "display_name": "Python 3",
+      "name": "python3"
+    },
+    "language_info": {
+      "name": "python"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 0
+}
diff --git a/docs/guides/user/running_vizier.ipynb b/docs/guides/user/running_vizier.ipynb
@@ -80,9 +80,7 @@
         "problem = vz.ProblemStatement()\n",
         "problem.search_space.root.add_float_param('x', 0.0, 1.0)\n",
         "problem.search_space.root.add_float_param('y', 0.0, 1.0)\n",
-        "problem.metric_information.append(\n",
-        "    vz.MetricInformation(\n",
-        "        name='maximize_metric', goal=vz.ObjectiveMetricGoal.MAXIMIZE))\n",
+        "problem.metric_information.append(vz.MetricInformation(name='maximize_metric', goal=vz.ObjectiveMetricGoal.MAXIMIZE))\n",
         "\n",
         "\n",
         "def evaluate(x: float, y: float) -\u003e float:\n",
@@ -118,9 +116,7 @@
       },
       "source": [
         "## Setting up the client\n",
-        "Starts a `study_client`, which can be either in **local mode (default)** or **distributed mode.**\n",
-        "\n",
-        "**Local Mode:** The client has no `endpoint` set, and will implicitly create a local Vizier Service which will be shared across other clients in the same Python process. Studies will then be stored locally in a SQL database file located at `service.VIZIER_DB_PATH`."
+        "Starts a `study_client`, which implicitly creates a local Vizier Service that is shared across other clients in the same Python process. Studies will then be stored locally in a SQL database file located at `service.VIZIER_DB_PATH`."
       ]
     },
     {
@@ -135,51 +131,6 @@
         "print('Local SQL database file located at: ', service.VIZIER_DB_PATH)"
       ]
     },
-    {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "w3m48cPsXcxD"
-      },
-      "source": [
-        "**Distributed mode:** The service may be explicitly created, wrapped as a server in a separate process to accept requests from all other client processses. Details such as the `database_url`, `port`, `policy_factory`, etc. can be configured in the server's initializer.\n",
-        "\n",
-        "All client processes (on a single machine or over multiple machines) will connect to this server via a globally specified `endpoint`."
-      ]
-    },
-    {
-      "cell_type": "code",
-      "execution_count": null,
-      "metadata": {
-        "id": "V6ef6OfMXdpz"
-      },
-      "outputs": [],
-      "source": [
-        "server = servers.DefaultVizierServer()  # Ideally created on a separate process such as a server machine.\n",
-        "clients.environment_variables.server_endpoint = server.endpoint  # Server address.\n",
-        "study_client = clients.Study.from_study_config(study_config, owner='owner', study_id = 'example_study_id')  # Now connects to the explicitly created server."
-      ]
-    },
-    {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "Z0Ycmc-exzqm"
-      },
-      "source": [
-        "## Client Parallelization\n",
-        "Regardless of whether the setup is local or distributed, we may simultaneously create multiple clients to work on the same study, useful for parallelizing evaluation workload."
-      ]
-    },
-    {
-      "cell_type": "code",
-      "execution_count": null,
-      "metadata": {
-        "id": "VlfFb5t3yILl"
-      },
-      "outputs": [],
-      "source": [
-        "another_study_client = clients.Study.from_resource_name(study_client.resource_name)"
-      ]
-    },
     {
       "cell_type": "markdown",
       "metadata": {
diff --git a/vizier/_src/benchmarks/experimenters/infeasible_experimenter_test.py b/vizier/_src/benchmarks/experimenters/infeasible_experimenter_test.py
@@ -38,9 +38,6 @@ def test_consistency(self):
 
       for t in trials:
         self.assertEqual(t.infeasible, trials[0].infeasible)
-        self.assertEqual(
-            t.final_measurement_or_die, trials[0].final_measurement_or_die
-        )
 
 
 class ParamRegionInfeasibleExperimenterTest(absltest.TestCase):
diff --git a/vizier/_src/service/clients.py b/vizier/_src/service/clients.py
@@ -32,6 +32,8 @@
 # Redeclared since clients.py is the user-facing client API.
 environment_variables = vizier_client.environment_variables
 
+UNUSED_CLIENT_ID = constants.UNUSED_CLIENT_ID
+
 
 @attr.define
 class Trial(client_abc.TrialInterface):
@@ -204,7 +206,7 @@ def materialize_state(self) -> vz.StudyState:
 
   @classmethod
   def from_resource_name(cls: Type['Study'], name: str) -> 'Study':
-    client = vizier_client.VizierClient(name, constants.UNUSED_CLIENT_ID)
+    client = vizier_client.VizierClient(name, UNUSED_CLIENT_ID)
     try:
       _ = client.get_study_config()  # Make sure study exists.
     except Exception as err:
@@ -251,7 +253,7 @@ def from_study_config(
     # expected to provide a client_id in the suggest() call.
     client = vizier_client.create_or_load_study(
         owner_id=owner,
-        client_id=constants.UNUSED_CLIENT_ID,
+        client_id=UNUSED_CLIENT_ID,
         study_id=study_id,
         study_config=config,
     )
diff --git a/vizier/service/clients/__init__.py b/vizier/service/clients/__init__.py
@@ -21,3 +21,4 @@
 from vizier._src.service.clients import Study
 from vizier._src.service.clients import Trial
 from vizier._src.service.clients import TrialIterable
+from vizier._src.service.clients import UNUSED_CLIENT_ID