From 35681aaf950d627ae948a5499a94d50ac24f4b03 Mon Sep 17 00:00:00 2001 From: Graham Neubig Date: Mon, 12 Feb 2024 14:39:44 -0500 Subject: [PATCH 1/6] Fixed continuous integration --- .github/workflows/ci.yml | 3 ++- .github/workflows/release.yml | 5 ++--- .gitignore | 2 +- .pre-commit-config.yaml | 3 ++- README.md | 7 ++++++- llments/distance/distance.py | 4 +--- llments/distance/norm.py | 1 - llments/eval/eval.py | 5 ++--- llments/lm/lm.py | 4 ++-- llments/lm/lm_loader.py | 2 -- llments/lm/lm_loader_test.py | 1 - 11 files changed, 18 insertions(+), 19 deletions(-) diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index d319354..1028414 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -1,5 +1,6 @@ +--- name: Continuous Integration -on: # yamllint disable-line rule:truthy +on: # yamllint disable-line rule:truthy push: branches: - main diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml index 168d102..36cd252 100644 --- a/.github/workflows/release.yml +++ b/.github/workflows/release.yml @@ -1,10 +1,9 @@ +--- name: Release workflow - -on: +on: # yamllint disable-line rule:truthy push: tags: - "v[0123456789].*" - jobs: release: runs-on: ubuntu-latest diff --git a/.gitignore b/.gitignore index 477bb4f..b148a3e 100644 --- a/.gitignore +++ b/.gitignore @@ -2,4 +2,4 @@ __pycache__ build llments.egg-info .vscode -.pytest_cache \ No newline at end of file +.pytest_cache diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml index 053b197..4d692be 100644 --- a/.pre-commit-config.yaml +++ b/.pre-commit-config.yaml @@ -1,3 +1,4 @@ +--- repos: - repo: https://github.com/astral-sh/ruff-pre-commit rev: v0.1.5 @@ -7,7 +8,7 @@ repos: - repo: https://github.com/pre-commit/mirrors-mypy rev: 'v1.6.1' hooks: - - id: mypy + - id: mypy - repo: https://github.com/DavidAnson/markdownlint-cli2 rev: v0.10.0 hooks: diff --git a/README.md b/README.md index b31b564..eaaf4f1 100644 --- a/README.md +++ b/README.md @@ -2,7 +2,12 @@ ## Development Information +To start developing, install the development dependencies and pre-commit hooks: + ```bash -pip install . +pip install ".[dev]" pre-commit install ``` + +There are several [pre-commit hooks](https://pre-commit.com/) that will run on every +commit to perform formatting, typing, and linting. diff --git a/llments/distance/distance.py b/llments/distance/distance.py index f327d9b..54466bd 100644 --- a/llments/distance/distance.py +++ b/llments/distance/distance.py @@ -1,12 +1,10 @@ - import abc from llments.lm.lm import LanguageModel class Distance: - - @abc.abstractclassmethod + @abc.abstractmethod def distance(self, lm1: LanguageModel, lm2: LanguageModel) -> float: """Returns a distance between two language models.""" ... diff --git a/llments/distance/norm.py b/llments/distance/norm.py index 1000731..0257821 100644 --- a/llments/distance/norm.py +++ b/llments/distance/norm.py @@ -1,4 +1,3 @@ - from llments.lm.lm import LanguageModel diff --git a/llments/eval/eval.py b/llments/eval/eval.py index 00eddb7..2e9acfa 100644 --- a/llments/eval/eval.py +++ b/llments/eval/eval.py @@ -1,4 +1,3 @@ - import abc import dataclasses @@ -6,7 +5,7 @@ class PairwiseEvaluator: """A class that defines an evaluation function, assessing a hypothesized string.""" - @abc.abstractclassmethod + @abc.abstractmethod def evaluate(self, hyp: str, ref: str) -> float: """Returns an evaluation score between 0 and 1 for two strings. @@ -25,7 +24,7 @@ class EvaluatorMetadata: class GeneralEvaluator: """A class that defines an evaluation function, assessing a hypothesized string.""" - @abc.abstractclassmethod + @abc.abstractmethod def evaluate(self, hyp: str, ref: EvaluatorMetadata) -> float: """Returns an evaluation score between 0 and 1 for two strings. diff --git a/llments/lm/lm.py b/llments/lm/lm.py index 54ff1eb..ead0ebb 100644 --- a/llments/lm/lm.py +++ b/llments/lm/lm.py @@ -2,7 +2,7 @@ class LanguageModel: - @abc.abstractclassmethod + @abc.abstractmethod def generate( self, condition: str | None, @@ -11,7 +11,7 @@ def generate( """Generate from the language model, possibly conditioned on a prefix.""" ... - @abc.abstractclassmethod + @abc.abstractmethod def fit( self, target: "LanguageModel", task_description: str | None = None ) -> "LanguageModel": diff --git a/llments/lm/lm_loader.py b/llments/lm/lm_loader.py index ef588c6..d15e476 100644 --- a/llments/lm/lm_loader.py +++ b/llments/lm/lm_loader.py @@ -1,5 +1,3 @@ - - from llments.lm.lm import LanguageModel diff --git a/llments/lm/lm_loader_test.py b/llments/lm/lm_loader_test.py index dd8fbf4..ee9b38b 100644 --- a/llments/lm/lm_loader_test.py +++ b/llments/lm/lm_loader_test.py @@ -1,4 +1,3 @@ - def test_load_from_spec_file(): """Test that load_from_specification_file() loads a language model.""" raise NotImplementedError From 5362d98beb2607ac3efcdfedcb8eb9fcad591c2f Mon Sep 17 00:00:00 2001 From: Graham Neubig Date: Mon, 12 Feb 2024 14:42:10 -0500 Subject: [PATCH 2/6] Update readme --- README.md | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/README.md b/README.md index eaaf4f1..ecb4f15 100644 --- a/README.md +++ b/README.md @@ -11,3 +11,8 @@ pre-commit install There are several [pre-commit hooks](https://pre-commit.com/) that will run on every commit to perform formatting, typing, and linting. + +* `ruff` - Runs formatting, import sorting, and linting. +* `mypy` - Runs type checking. +* `markdownlint` - Runs markdown linting. +* `yamllint` - Runs YAML linting. From 4ff1be334d402f4d7eca15ddef1361d62c91578a Mon Sep 17 00:00:00 2001 From: Graham Neubig Date: Mon, 12 Feb 2024 14:51:31 -0500 Subject: [PATCH 3/6] Fix config --- .pre-commit-config.yaml | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml index 4d692be..53334c9 100644 --- a/.pre-commit-config.yaml +++ b/.pre-commit-config.yaml @@ -1,20 +1,20 @@ --- repos: - repo: https://github.com/astral-sh/ruff-pre-commit - rev: v0.1.5 + rev: v0.2.1 hooks: - id: ruff - id: ruff-format - repo: https://github.com/pre-commit/mirrors-mypy - rev: 'v1.6.1' + rev: v1.8.0 hooks: - id: mypy - repo: https://github.com/DavidAnson/markdownlint-cli2 - rev: v0.10.0 + rev: v0.12.1 hooks: - id: markdownlint-cli2 - repo: https://github.com/adrienverge/yamllint - rev: v1.33.0 + rev: v1.34.0 hooks: - id: yamllint - repo: https://github.com/koalaman/shellcheck-precommit From 94f104cbc64501fa042735e945db846cd3590bb7 Mon Sep 17 00:00:00 2001 From: Graham Neubig Date: Mon, 12 Feb 2024 14:58:31 -0500 Subject: [PATCH 4/6] Fix --- llments/lm/empirical.py | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/llments/lm/empirical.py b/llments/lm/empirical.py index 5b10c00..417fed8 100644 --- a/llments/lm/empirical.py +++ b/llments/lm/empirical.py @@ -1,3 +1,4 @@ +from typing import Any from llments.lm.lm import LanguageModel import random import json @@ -10,10 +11,10 @@ def __init__(self, data: list[str], probs: list[float] | None = None): probs = [1 / len(data)] * len(data) self.data = pd.DataFrame({"text": data, "prob": probs}) - def sample(self, condition: str | None): + def generate(self, condition: str | None, **kwargs: Any) -> str: """Sample from the language model, possibly conditioned on a prefix.""" if condition is None: - return random.choice(self.data["text"], p=self.data["probs"]) + return random.choices(self.data["text"], weights=self.data["probs"])[0] else: # Filter to only those that start with the condition filtered_df = self.data[self.data["text"].str.startswith(condition)] @@ -24,9 +25,9 @@ def sample(self, condition: str | None): ) # Normalize the probabilities filtered_df["prob"] = filtered_df["prob"] / filtered_df["prob"].sum() - return random.choice(filtered_df["text"], p=filtered_df["probs"]) + return random.choices(filtered_df["text"], weights=filtered_df["probs"])[0] - def fit(self, target: LanguageModel): + def fit(self, target: LanguageModel, task_description: str | None = None): raise ValueError( "Cannot fit an empirical distribution to another distribution." ) From f8be9382ff56aa13c06f171d4d572e061d8e3c2a Mon Sep 17 00:00:00 2001 From: Graham Neubig Date: Mon, 12 Feb 2024 15:04:11 -0500 Subject: [PATCH 5/6] Fix CI --- .github/workflows/ci.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index 1028414..4081247 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -19,7 +19,7 @@ jobs: - name: Install ruff run: pip install ruff - name: Run ruff - run: ruff --check . + run: ruff check . python-mypy: runs-on: ubuntu-latest steps: From da85e10090c0a8393b409ab95ec32652963a7bd6 Mon Sep 17 00:00:00 2001 From: Graham Neubig Date: Mon, 12 Feb 2024 15:05:41 -0500 Subject: [PATCH 6/6] Update CI to remove some extra things --- .github/workflows/ci.yml | 24 ------------------------ 1 file changed, 24 deletions(-) diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index 4081247..b3f6b74 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -32,14 +32,6 @@ jobs: uses: pre-commit/action@v3.0.0 with: extra_args: mypy --all-files - lint-requirements-txt: - runs-on: ubuntu-latest - steps: - - uses: actions/checkout@v3 - - name: lint - uses: pre-commit/action@v3.0.0 - with: - extra_args: requirements-txt-fixer --all-files lint-markdown: runs-on: ubuntu-latest steps: @@ -76,19 +68,3 @@ jobs: uses: pre-commit/action@v3.0.0 with: extra_args: shellcheck --all-files - lint-trailing-whitespace: - runs-on: ubuntu-latest - steps: - - uses: actions/checkout@v3 - - name: lint - uses: pre-commit/action@v3.0.0 - with: - extra_args: trailing-whitespace --all-files - lint-eof-newline: - runs-on: ubuntu-latest - steps: - - uses: actions/checkout@v3 - - name: lint - uses: pre-commit/action@v3.0.0 - with: - extra_args: end-of-file-fixer --all-files