Skip to content

Commit

Permalink
Change the GRU to a BiGRU in the SA Task. Also now we use the IMDb da…
Browse files Browse the repository at this point in the history
…taset, as we were using the AG_NEWs dataset by mistake.
  • Loading branch information
AlArgente committed Jan 22, 2024
1 parent 547c063 commit d84e321
Show file tree
Hide file tree
Showing 4 changed files with 124 additions and 10 deletions.
35 changes: 35 additions & 0 deletions .github/workflows/pytest.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,35 @@
# This workflow installs dependencies, runs the test suite with coverage and
# publishes the result through the Pytest Coverage Comment action.
# For more information see: https://github.com/MishaKav/pytest-coverage-comment/
name: Tests
on:
  # Runs for pull requests that target main, when they are opened or updated.
  pull_request:
    branches:
      - main
    types: [synchronize, opened]
jobs:
  build:
    runs-on: ubuntu-20.04
    steps:
      - uses: actions/checkout@v2

      - name: Set up Python 3.8.10
        uses: actions/setup-python@v4
        with:
          # Quoted so the version is always handed over as a string.
          python-version: "3.8.10"

      - name: Install dependencies
        run: |
          python -m pip install --upgrade pip
          pip install flake8 pytest pytest-cov
          pip install ".[develop]"

      - name: Build coverage file
        # An explicit `shell: bash` makes the runner start bash with
        # `-eo pipefail`. With the implicit default shell (`bash -e`), the exit
        # status of the pipeline below is that of `tee`, so failing tests would
        # not fail this job.
        shell: bash
        # NOTE(review): `-n 2` needs pytest-xdist; presumably it is provided by
        # the `develop` extra installed above - confirm.
        run: |
          pytest -n 2 --junitxml=pytest.xml --cov-report=term-missing:skip-covered --cov=flex tests/ | tee pytest-coverage.txt

      - name: Pytest coverage comment
        # Publish the report even when the test step above failed, so the
        # failures are visible in the generated comment.
        if: ${{ !cancelled() }}
        uses: MishaKav/pytest-coverage-comment@main
        with:
          report-only-changed-files: false
          pytest-coverage-path: ./pytest-coverage.txt
          junitxml-path: ./pytest.xml
27 changes: 27 additions & 0 deletions .github/workflows/trunk.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,27 @@
# Lint workflow: checks the repository with Trunk Check.

name: Linter

on:
  # Pull requests that target main, when they are opened or receive new commits.
  pull_request:
    branches: ['main']
    types:
      - synchronize
      - opened

  # Lets the workflow be started by hand from the Actions tab.
  workflow_dispatch:

# Jobs of a workflow run may execute sequentially or in parallel; this workflow
# defines exactly one, called "build".
jobs:
  build:
    # Runner type used for the job.
    runs-on: ubuntu-latest

    # Tasks executed, in order, as part of the job.
    steps:
      # Check out the repository under $GITHUB_WORKSPACE so the job can access it.
      - uses: actions/checkout@v3

      - name: Trunk Check
        uses: trunk-io/trunk-action@v1.0.3
47 changes: 47 additions & 0 deletions .github/workflows/update-coverage.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,47 @@
# This workflow runs the test suite with coverage on every push to main, feeds
# the report to the Pytest Coverage Comment action and writes the generated
# coverage HTML into README.md, which is then committed and pushed.
# For more information see: https://github.com/MishaKav/pytest-coverage-comment/
name: Update README
on:
  push:
    branches: ['main']

jobs:
  build:
    runs-on: ubuntu-latest
    steps:
      - uses: actions/checkout@v2

      - name: Set up Python 3.9
        uses: actions/setup-python@v2
        with:
          # Quoted on purpose: an unquoted version is parsed as a float, which
          # would silently turn e.g. 3.10 into 3.1.
          python-version: "3.9"

      - name: Install dependencies
        run: |
          python -m pip install --upgrade pip
          pip install flake8 pytest pytest-cov
          pip install .

      - name: Build coverage file
        # NOTE(review): with the implicit default shell the pipeline's exit
        # status is that of `tee`, so failing tests do not fail this job.
        # Left unchanged here; confirm that this is intended.
        run: |
          pytest --cov-report=term-missing:skip-covered --cov=flex tests/ | tee pytest-coverage.txt

      # The `if:` guards below repeat the trigger's branch filter.
      - name: Pytest coverage comment
        if: ${{ github.ref == 'refs/heads/main' }}
        id: coverageComment
        uses: MishaKav/pytest-coverage-comment@main
        with:
          hide-comment: true
          pytest-coverage-path: ./pytest-coverage.txt

      - name: Update Readme with Coverage Html
        if: ${{ github.ref == 'refs/heads/main' }}
        # Replaces everything between the Begin/End marker comments in
        # README.md with the HTML output of the coverageComment step.
        run: |
          sed -i '/<!-- Pytest Coverage Comment:Begin -->/,/<!-- Pytest Coverage Comment:End -->/c\<!-- Pytest Coverage Comment:Begin -->\n\${{ steps.coverageComment.outputs.coverageHtml }}\n<!-- Pytest Coverage Comment:End -->' ./README.md

      - name: Commit & Push changes to Readme
        if: ${{ github.ref == 'refs/heads/main' }}
        uses: actions-js/push@master
        with:
          message: Update coverage on Readme
          github_token: ${{ secrets.CI_GITHUB_TOKEN }}
25 changes: 15 additions & 10 deletions flexnlp/notebooks/Federated IMDb PT using FLExible with a GRU.ipynb
Original file line number Diff line number Diff line change
Expand Up @@ -53,7 +53,7 @@
"outputs": [],
"source": [
"# imdb_dataset = load_dataset('imdb', split=['train', 'test']) # Get the dataset from huggingface library\n",
"train_dataset, test_dataset = torchtext.datasets.AG_NEWS() # Get the dataset from torchtext library\n",
"train_dataset, test_dataset = torchtext.datasets.IMDB() # Get the dataset from torchtext library\n",
"unique_classes = set([label for (label, text) in train_dataset])\n",
"num_classes = len(unique_classes)"
]
Expand Down Expand Up @@ -284,20 +284,25 @@
" )\n",
" # Take the embeddings size from the embeddings vector.\n",
" self.embedding_size = embeddings.shape[1]\n",
" #Create the GRU layer with just one layer.\n",
" # Create the GRU layer with just one layer.\n",
" self.gru = nn.GRU(self.embedding_size,\n",
" hidden_size,\n",
" batch_first=True,\n",
" num_layers=1\n",
" bidirectional=True,\n",
" dropout=0.5\n",
" )\n",
" # Create a dropout layer for the BiGRU\n",
" self.dropout = nn.Dropout(0.2)\n",
" # Create the prediction layer.\n",
" self.fc = nn.Linear(hidden_size, num_classes)\n",
" self.fc = nn.Linear(hidden_size*2, num_classes)\n",
"\n",
" def forward(self, x):\n",
" # x.shape = [batch_size, len]\n",
" x = self.emb(x)\n",
" # x.shape = [batch_size, len, emb_dim]\n",
" _, x = self.gru(x)\n",
" x = self.dropout(torch.cat((x[-2,:,:], x[-1,:,:]), dim=1))\n",
" # x.shape = [1, batch_size, hid_dim]\n",
" x = self.fc(x)\n",
" return x\n",
Expand Down Expand Up @@ -452,7 +457,7 @@
" #  batch_sampler=batch_sampler_v2(BATCH_SIZE, train_indices))\n",
" model = client_flex_model[\"model\"]\n",
" # lr = 0.001\n",
" optimizer = client_flex_model['optimizer_func'](model.parameters(), lr=0.1, **client_flex_model[\"optimizer_kwargs\"])\n",
" optimizer = client_flex_model['optimizer_func'](model.parameters(), lr=0.01, **client_flex_model[\"optimizer_kwargs\"])\n",
" model = model.train()\n",
" model = model.to(device)\n",
" criterion = client_flex_model[\"criterion\"]\n",
Expand Down Expand Up @@ -657,20 +662,20 @@
]
},
{
"cell_type": "code",
"execution_count": null,
"cell_type": "markdown",
"metadata": {},
"outputs": [],
"source": [
"# train_n_rounds(5)"
"Run the following cell in order to train the model for multiple rounds."
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
"source": [
"train_n_rounds(n_rounds=5)"
]
}
],
"metadata": {
Expand All @@ -689,7 +694,7 @@
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.11.3"
"version": "3.11.4"
},
"orig_nbformat": 4
},
Expand Down

0 comments on commit d84e321

Please sign in to comment.