Skip to content

Commit

Permalink
Adds comet-ml plugin (#2550)
Browse files Browse the repository at this point in the history
* Adds comet-ml plugin

Signed-off-by: Thomas J. Fan <thomasjpfan@gmail.com>

* For local execution, do not set experiment_key if it is none

Signed-off-by: Thomas J. Fan <thomasjpfan@gmail.com>

* Use correct comet-ml links

Signed-off-by: Thomas J. Fan <thomasjpfan@gmail.com>

* Allow host to be adjustable

Signed-off-by: Thomas J. Fan <thomasjpfan@gmail.com>

* Adds comet-ml plugin

Signed-off-by: Thomas J. Fan <thomasjpfan@gmail.com>

* Use new comet-ml login name

Signed-off-by: Thomas J. Fan <thomasjpfan@gmail.com>

* Require the project_name workspace and secrets

Signed-off-by: Thomas J. Fan <thomasjpfan@gmail.com>

---------

Signed-off-by: Thomas J. Fan <thomasjpfan@gmail.com>
  • Loading branch information
thomasjpfan authored Jul 17, 2024
1 parent 262f6d6 commit 5a4ba2f
Show file tree
Hide file tree
Showing 6 changed files with 395 additions and 0 deletions.
1 change: 1 addition & 0 deletions .github/workflows/pythonbuild.yml
Original file line number Diff line number Diff line change
Expand Up @@ -316,6 +316,7 @@ jobs:
- flytekit-aws-batch
- flytekit-aws-sagemaker
- flytekit-bigquery
- flytekit-comet-ml
- flytekit-dask
- flytekit-data-fsspec
- flytekit-dbt
Expand Down
26 changes: 26 additions & 0 deletions plugins/flytekit-comet-ml/README.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,26 @@
# Flytekit Comet Plugin

Comet’s machine learning platform integrates with your existing infrastructure and tools so you can manage, visualize, and optimize models—from training runs to production monitoring. This plugin integrates Flyte with Comet.ml by configuring links between the two platforms.

To install the plugin, run:

```bash
pip install flytekitplugins-comet-ml
```

Comet requires an API key to authenticate with their platform. In the above example, a secret is created using
[Flyte's Secrets manager](https://docs.flyte.org/en/latest/user_guide/productionizing/secrets.html).

To enable linking from the Flyte side panel to Comet.ml, add the following to Flyte's configuration:

```yaml
plugins:
logs:
dynamic-log-links:
- comet-ml-execution-id:
displayName: Comet
templateUris: "{{ .taskConfig.host }}/{{ .taskConfig.workspace }}/{{ .taskConfig.project_name }}/{{ .executionName }}{{ .nodeId }}{{ .taskRetryAttempt }}{{ .taskConfig.link_suffix }}"
- comet-ml-custom-id:
displayName: Comet
templateUris: "{{ .taskConfig.host }}/{{ .taskConfig.workspace }}/{{ .taskConfig.project_name }}/{{ .taskConfig.experiment_key }}"
```
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
from .tracking import comet_ml_login

__all__ = ["comet_ml_login"]
173 changes: 173 additions & 0 deletions plugins/flytekit-comet-ml/flytekitplugins/comet_ml/tracking.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,173 @@
import os
from functools import partial
from hashlib import shake_256
from typing import Callable, Optional, Union

import comet_ml
from flytekit import Secret
from flytekit.core.context_manager import FlyteContextManager
from flytekit.core.utils import ClassDecorator

COMET_ML_EXECUTION_TYPE_VALUE = "comet-ml-execution-id"
COMET_ML_CUSTOM_TYPE_VALUE = "comet-ml-custom-id"


def _generate_suffix_with_length_10(project_name: str, workspace: str) -> str:
"""Generate suffix from project_name + workspace."""
h = shake_256(f"{project_name}-{workspace}".encode("utf-8"))
# Using 5 generates a suffix with length 10
return h.hexdigest(5)


def _generate_experiment_key(hostname: str, project_name: str, workspace: str) -> str:
"""Generate experiment key that comet_ml can use:
1. Is alphanumeric
2. 32 <= len(experiment_key) <= 50
"""
# In Flyte, then hostname is set to {.executionName}-{.nodeID}-{.taskRetryAttempt}, where
# - len(executionName) == 20
# - 2 <= len(nodeId) <= 8
# - 1 <= len(taskRetryAttempt)) <= 2 (In practice, retries does not go above 99)
# Removing the `-` because it is not alphanumeric, the 23 <= len(hostname) <= 30
# On the low end we need to add 10 characters to stay in the range acceptable to comet_ml
hostname = hostname.replace("-", "")
suffix = _generate_suffix_with_length_10(project_name, workspace)
return f"{hostname}{suffix}"


def comet_ml_login(
project_name: str,
workspace: str,
secret: Union[Secret, Callable],
experiment_key: Optional[str] = None,
host: str = "https://www.comet.com",
**login_kwargs: dict,
):
"""Comet plugin.
Args:
project_name (str): Send your experiment to a specific project. (Required)
workspace (str): Attach an experiment to a project that belongs to this workspace. (Required)
secret (Secret or Callable): Secret with your `COMET_API_KEY` or a callable that returns the API key.
The callable takes no arguments and returns a string. (Required)
experiment_key (str): Experiment key.
host (str): URL to your Comet service. Defaults to "https://www.comet.com"
**login_kwargs (dict): The rest of the arguments are passed directly to `comet_ml.login`.
"""
return partial(
_comet_ml_login_class,
project_name=project_name,
workspace=workspace,
secret=secret,
experiment_key=experiment_key,
host=host,
**login_kwargs,
)


class _comet_ml_login_class(ClassDecorator):
COMET_ML_PROJECT_NAME_KEY = "project_name"
COMET_ML_WORKSPACE_KEY = "workspace"
COMET_ML_EXPERIMENT_KEY_KEY = "experiment_key"
COMET_ML_URL_SUFFIX_KEY = "link_suffix"
COMET_ML_HOST_KEY = "host"

def __init__(
self,
task_function: Callable,
project_name: str,
workspace: str,
secret: Union[Secret, Callable],
experiment_key: Optional[str] = None,
host: str = "https://www.comet.com",
**login_kwargs: dict,
):
"""Comet plugin.
Args:
project_name (str): Send your experiment to a specific project. (Required)
workspace (str): Attach an experiment to a project that belongs to this workspace. (Required)
secret (Secret or Callable): Secret with your `COMET_API_KEY` or a callable that returns the API key.
The callable takes no arguments and returns a string. (Required)
experiment_key (str): Experiment key.
host (str): URL to your Comet service. Defaults to "https://www.comet.com"
**login_kwargs (dict): The rest of the arguments are passed directly to `comet_ml.login`.
"""

self.project_name = project_name
self.workspace = workspace
self.experiment_key = experiment_key
self.secret = secret
self.host = host
self.login_kwargs = login_kwargs

super().__init__(
task_function,
project_name=project_name,
workspace=workspace,
experiment_key=experiment_key,
secret=secret,
host=host,
**login_kwargs,
)

def execute(self, *args, **kwargs):
ctx = FlyteContextManager.current_context()
is_local_execution = ctx.execution_state.is_local_execution()

default_kwargs = self.login_kwargs
login_kwargs = {
"project_name": self.project_name,
"workspace": self.workspace,
**default_kwargs,
}

if is_local_execution:
# For local execution, always use the experiment_key. If `self.experiment_key` is `None`, comet_ml
# will generate it's own key
if self.experiment_key is not None:
login_kwargs["experiment_key"] = self.experiment_key
else:
# Get api key for remote execution
if isinstance(self.secret, Secret):
secrets = ctx.user_space_params.secrets
comet_ml_api_key = secrets.get(key=self.secret.key, group=self.secret.group)
else:
comet_ml_api_key = self.secret()

login_kwargs["api_key"] = comet_ml_api_key

if self.experiment_key is None:
# The HOSTNAME is set to {.executionName}-{.nodeID}-{.taskRetryAttempt}
# If HOSTNAME is not defined, use the execution name as a fallback
hostname = os.environ.get("HOSTNAME", ctx.user_space_params.execution_id.name)
experiment_key = _generate_experiment_key(hostname, self.project_name, self.workspace)
else:
experiment_key = self.experiment_key

login_kwargs["experiment_key"] = experiment_key

if hasattr(comet_ml, "login"):
comet_ml.login(**login_kwargs)
else:
comet_ml.init(**login_kwargs)

output = self.task_function(*args, **kwargs)
return output

def get_extra_config(self):
extra_config = {
self.COMET_ML_PROJECT_NAME_KEY: self.project_name,
self.COMET_ML_WORKSPACE_KEY: self.workspace,
self.COMET_ML_HOST_KEY: self.host,
}

if self.experiment_key is None:
comet_ml_value = COMET_ML_EXECUTION_TYPE_VALUE
suffix = _generate_suffix_with_length_10(self.project_name, self.workspace)
extra_config[self.COMET_ML_URL_SUFFIX_KEY] = suffix
else:
comet_ml_value = COMET_ML_CUSTOM_TYPE_VALUE
extra_config[self.COMET_ML_EXPERIMENT_KEY_KEY] = self.experiment_key

extra_config[self.LINK_TYPE_KEY] = comet_ml_value
return extra_config
39 changes: 39 additions & 0 deletions plugins/flytekit-comet-ml/setup.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,39 @@
from setuptools import setup

PLUGIN_NAME = "comet-ml"
MODULE_NAME = "comet_ml"


microlib_name = f"flytekitplugins-{PLUGIN_NAME}"

plugin_requires = ["flytekit>=1.12.3", "comet-ml>=3.43.2"]

__version__ = "0.0.0+develop"

setup(
name=microlib_name,
version=__version__,
author="flyteorg",
author_email="admin@flyte.org",
description="This package enables seamless use of Comet within Flyte",
namespace_packages=["flytekitplugins"],
packages=[f"flytekitplugins.{MODULE_NAME}"],
install_requires=plugin_requires,
license="apache2",
python_requires=">=3.8",
classifiers=[
"Intended Audience :: Science/Research",
"Intended Audience :: Developers",
"License :: OSI Approved :: Apache Software License",
"Programming Language :: Python :: 3.8",
"Programming Language :: Python :: 3.9",
"Programming Language :: Python :: 3.10",
"Programming Language :: Python :: 3.11",
"Programming Language :: Python :: 3.12",
"Topic :: Scientific/Engineering",
"Topic :: Scientific/Engineering :: Artificial Intelligence",
"Topic :: Software Development",
"Topic :: Software Development :: Libraries",
"Topic :: Software Development :: Libraries :: Python Modules",
],
)
Loading

0 comments on commit 5a4ba2f

Please sign in to comment.