Merge pull request #19 from sign-language-processing/dgs_sentences

AmitMY · web-flow · commit a5a178903378 · 2022-09-12T13:39:02.000+02:00
feat(dgs_corpus): add sentence level loading
diff --git a/examples/load.ipynb b/examples/load.ipynb
@@ -20,7 +20,10 @@
    "cell_type": "markdown",
    "metadata": {
     "id": "view-in-github",
-    "colab_type": "text"
+    "colab_type": "text",
+    "pycharm": {
+     "name": "#%% md\n"
+    }
    },
    "source": [
     "<a href=\"https://colab.research.google.com/github/sign-language-processing/datasets/blob/master/examples/load.ipynb\" target=\"_parent\"><img src=\"https://colab.research.google.com/assets/colab-badge.svg\" alt=\"Open In Colab\"/></a>"
@@ -29,7 +32,10 @@
   {
    "cell_type": "code",
    "metadata": {
-    "id": "ov6fuFwGjlsy"
+    "id": "ov6fuFwGjlsy",
+    "pycharm": {
+     "name": "#%%\n"
+    }
    },
    "source": [
     "%%capture\n",
@@ -41,7 +47,10 @@
   {
    "cell_type": "code",
    "metadata": {
-    "id": "C4PZsi6pPp9j"
+    "id": "C4PZsi6pPp9j",
+    "pycharm": {
+     "name": "#%%\n"
+    }
    },
    "source": [
     "import tensorflow_datasets as tfds\n",
@@ -56,7 +65,10 @@
   {
    "cell_type": "markdown",
    "metadata": {
-    "id": "PKGZ4JXCZmSE"
+    "id": "PKGZ4JXCZmSE",
+    "pycharm": {
+     "name": "#%% md\n"
+    }
    },
    "source": [
     "# RWTH Phoenix 2014 T"
@@ -65,7 +77,10 @@
   {
    "cell_type": "code",
    "metadata": {
-    "id": "8wU1Q4URqRBE"
+    "id": "8wU1Q4URqRBE",
+    "pycharm": {
+     "name": "#%%\n"
+    }
    },
    "source": [
     "config = SignDatasetConfig(name=\"only-annotations\", version=\"3.0.0\", include_video=False)\n",
@@ -82,7 +97,10 @@
   {
    "cell_type": "markdown",
    "metadata": {
-    "id": "v6iBwM9lTzS6"
+    "id": "v6iBwM9lTzS6",
+    "pycharm": {
+     "name": "#%% md\n"
+    }
    },
    "source": [
     "# Dicta Sign"
@@ -91,7 +109,10 @@
   {
    "cell_type": "code",
    "metadata": {
-    "id": "EQWUAgpVT0bK"
+    "id": "EQWUAgpVT0bK",
+    "pycharm": {
+     "name": "#%%\n"
+    }
    },
    "source": [
     "config = SignDatasetConfig(name=\"only-annotations\", version=\"1.0.0\", include_video=False, include_pose=None)\n",
@@ -106,7 +127,10 @@
   {
    "cell_type": "markdown",
    "metadata": {
-    "id": "OcIs13W6TfWz"
+    "id": "OcIs13W6TfWz",
+    "pycharm": {
+     "name": "#%% md\n"
+    }
    },
    "source": [
     "# ChicagoFSWild+"
@@ -115,7 +139,10 @@
   {
    "cell_type": "code",
    "metadata": {
-    "id": "o1X1kIgoTfec"
+    "id": "o1X1kIgoTfec",
+    "pycharm": {
+     "name": "#%%\n"
+    }
    },
    "source": [
     "# Version 2.0.0 is ChicagoFSWild+, 1.0.0 is ChicagoFSWild\n",
@@ -131,7 +158,10 @@
   {
    "cell_type": "markdown",
    "metadata": {
-    "id": "XK7jyOOtYv_P"
+    "id": "XK7jyOOtYv_P",
+    "pycharm": {
+     "name": "#%% md\n"
+    }
    },
    "source": [
     "# AUTSL"
@@ -140,7 +170,10 @@
   {
    "cell_type": "code",
    "metadata": {
-    "id": "dfZnI9K8YxfJ"
+    "id": "dfZnI9K8YxfJ",
+    "pycharm": {
+     "name": "#%%\n"
+    }
    },
    "source": [
     "config = SignDatasetConfig(name=\"only-annotations\", version=\"1.0.0\", include_video=False)\n",
@@ -155,7 +188,10 @@
   {
    "cell_type": "markdown",
    "metadata": {
-    "id": "rykmI68x3E07"
+    "id": "rykmI68x3E07",
+    "pycharm": {
+     "name": "#%% md\n"
+    }
    },
    "source": [
     "# SignBank"
@@ -164,7 +200,10 @@
   {
    "cell_type": "code",
    "metadata": {
-    "id": "12XcWfeg21kE"
+    "id": "12XcWfeg21kE",
+    "pycharm": {
+     "name": "#%%\n"
+    }
    },
    "source": [
     "signbank = tfds.load(name='sign_bank')\n",
@@ -178,7 +217,10 @@
   {
    "cell_type": "markdown",
    "metadata": {
-    "id": "biXjC80j17n1"
+    "id": "biXjC80j17n1",
+    "pycharm": {
+     "name": "#%% md\n"
+    }
    },
    "source": [
     "# SignTyp (https://signtyp.uconn.edu/signpuddle/index.php?ui=1&sgn=9032)\n"
@@ -187,7 +229,10 @@
   {
    "cell_type": "code",
    "metadata": {
-    "id": "dVgbyUIg165c"
+    "id": "dVgbyUIg165c",
+    "pycharm": {
+     "name": "#%%\n"
+    }
    },
    "source": [
     "config = SignDatasetConfig(name=\"only-annotations\", version=\"1.0.0\", include_video=False, extra={\"PHPSESSID\": \"hj9co07ct7f5noq529no9u09l4\"})\n",
@@ -202,7 +247,10 @@
   {
    "cell_type": "markdown",
    "metadata": {
-    "id": "yOLfw9-z2qK7"
+    "id": "yOLfw9-z2qK7",
+    "pycharm": {
+     "name": "#%% md\n"
+    }
    },
    "source": [
     "# Sign2Mint"
@@ -211,7 +259,10 @@
   {
    "cell_type": "code",
    "metadata": {
-    "id": "X96ogmu_22zv"
+    "id": "X96ogmu_22zv",
+    "pycharm": {
+     "name": "#%%\n"
+    }
    },
    "source": [
     "config = SignDatasetConfig(name=\"only-annotations\", version=\"1.0.0\", include_video=False)\n",
@@ -226,7 +277,10 @@
   {
    "cell_type": "markdown",
    "metadata": {
-    "id": "jnf4AaX936w4"
+    "id": "jnf4AaX936w4",
+    "pycharm": {
+     "name": "#%% md\n"
+    }
    },
    "source": [
     "# SWOJS Glossário"
@@ -235,7 +289,10 @@
   {
    "cell_type": "code",
    "metadata": {
-    "id": "shQxQtQP359y"
+    "id": "shQxQtQP359y",
+    "pycharm": {
+     "name": "#%%\n"
+    }
    },
    "source": [
     "config = SignDatasetConfig(name=\"only-annotations\", version=\"1.0.0\", include_video=False)\n",
@@ -253,7 +310,10 @@
   {
    "cell_type": "markdown",
    "metadata": {
-    "id": "pNJdG7ExZugh"
+    "id": "pNJdG7ExZugh",
+    "pycharm": {
+     "name": "#%% md\n"
+    }
    },
    "source": [
     "# DGS Corpus"
@@ -262,7 +322,10 @@
   {
    "cell_type": "code",
    "metadata": {
-    "id": "TVjrhsbtbWbX"
+    "id": "TVjrhsbtbWbX",
+    "pycharm": {
+     "name": "#%%\n"
+    }
    },
    "source": [
     "%%capture\n",
@@ -271,6 +334,18 @@
    "execution_count": null,
    "outputs": []
   },
+  {
+   "cell_type": "markdown",
+   "source": [
+    "## Document Level example (Long videos)"
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%% md\n"
+    }
+   }
+  },
   {
    "cell_type": "code",
    "metadata": {
@@ -300,6 +375,40 @@
    "execution_count": null,
    "outputs": []
   },
+  {
+   "cell_type": "markdown",
+   "source": [
+    "## Sentence level example (Videos are broken down into sentences)"
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%% md\n"
+    }
+   }
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "outputs": [],
+   "source": [
+    "from sign_language_datasets.datasets.dgs_corpus import DgsCorpusConfig\n",
+    "\n",
+    "config = DgsCorpusConfig(name=\"only-annotations-sentence-level\", version=\"1.0.0\", include_video=False, include_pose=None, data_type=\"sentence\")\n",
+    "dgs_corpus = tfds.load('dgs_corpus', builder_kwargs=dict(config=config))\n",
+    "\n",
+    "for datum in itertools.islice(dgs_corpus[\"train\"], 0, 5):\n",
+    "  sentence = datum[\"sentence\"][\"german\"].numpy().decode('utf-8')\n",
+    "  print(sentence)\n",
+    "  print(datum)"
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   }
+  },
   {
    "cell_type": "markdown",
    "source": [
diff --git a/requirements.txt b/requirements.txt
@@ -1,3 +1,4 @@
+typing-extensions
 python-dotenv
 tqdm
 pose-format>=0.0.3
diff --git a/setup.py b/setup.py
@@ -11,14 +11,14 @@
 setup(
     name="sign-language-datasets",
     packages=packages,
-    version="0.1.1",
+    version="0.1.2",
     description="TFDS Datasets for sign language",
     author="Amit Moryossef",
     author_email="amitmoryossef@gmail.com",
     url="https://github.com/sign-language-processing/datasets",
     keywords=[],
-    install_requires=["python-dotenv", "tqdm", "pose-format", "tfds-nightly", "tensorflow", "numpy", "pympi-ling",
-                      "Pillow", "opencv-python==4.5.5.64"],
+    install_requires=["typing-extensions", "python-dotenv", "tqdm", "pose-format", "tfds-nightly", "tensorflow",
+                      "numpy", "pympi-ling", "Pillow", "opencv-python==4.5.5.64"],
     tests_require=['pytest', 'pytest-cov'],
     long_description=long_description,
     long_description_content_type="text/markdown",
diff --git a/sign_language_datasets/datasets/config.py b/sign_language_datasets/datasets/config.py
@@ -14,7 +14,6 @@ def __init__(
         include_pose: Optional[str] = None,
         fps: Optional[float] = None,
         resolution: Optional[Tuple[int, int]] = None,
-        split: Optional[str] = None,
         extra: dict = {},
         **kwargs,
     ):
@@ -35,7 +34,6 @@ def __init__(
 
         self.fps = fps
         self.resolution = resolution
-        self.split = split
         self.extra = extra
 
     def ffmpeg_args(self):
@@ -69,4 +67,12 @@ def encode_example(self, video_or_path_or_fobj):
             _, h, w, _ = self.shape
             video_or_path_or_fobj = [cv2.resize(cv2.imread(f), (w, h)) for f in video_or_path_or_fobj]
 
+        # Handle the case where additional ffmpeg parameters are needed
+        if isinstance(video_or_path_or_fobj, dict) and "video" in video_or_path_or_fobj and isinstance(video_or_path_or_fobj["video"], str):
+            old_args = list(self._extra_ffmpeg_args)
+            self._extra_ffmpeg_args += video_or_path_or_fobj["ffmpeg_args"]
+            result = super(VideoFeature, self).encode_example(video_or_path_or_fobj["video"])
+            self._extra_ffmpeg_args = old_args
+            return result
+
         return super(VideoFeature, self).encode_example(video_or_path_or_fobj)
diff --git a/sign_language_datasets/datasets/dgs_corpus/__init__.py b/sign_language_datasets/datasets/dgs_corpus/__init__.py
@@ -1,3 +1,3 @@
 """dgs_corpus dataset."""
 
-from .dgs_corpus import DgsCorpus
+from .dgs_corpus import DgsCorpus, DgsCorpusConfig
diff --git a/sign_language_datasets/datasets/dgs_corpus/dgs_corpus.py b/sign_language_datasets/datasets/dgs_corpus/dgs_corpus.py
diff --git a/sign_language_datasets/datasets/dgs_corpus/dgs_utils.py b/sign_language_datasets/datasets/dgs_corpus/dgs_utils.py

Original file line number	Diff line number	Diff line change
`@@ -1,3 +1,4 @@`
	`1`	`+typing-extensions`
`1`	`2`	`python-dotenv`
`2`	`3`	`tqdm`
`3`	`4`	`pose-format>=0.0.3`
Original file line number	Diff line number	Diff line change
`@@ -1,3 +1,3 @@`
`1`	`1`	`"""dgs_corpus dataset."""`
`2`	`2`
`3`		`-from .dgs_corpus import DgsCorpus`
	`3`	`+from .dgs_corpus import DgsCorpus, DgsCorpusConfig`