Skip to content

Commit 9118144

Browse files
authored
Merge pull request #22 from bricksdont/add_dgs_sentence_split
Add dgs sentence split
2 parents a5a1789 + 6c53d26 commit 9118144

File tree

3 files changed

+65557
-2
lines changed

3 files changed

+65557
-2
lines changed

setup.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -11,7 +11,7 @@
1111
setup(
1212
name="sign-language-datasets",
1313
packages=packages,
14-
version="0.1.2",
14+
version="0.1.3",
1515
description="TFDS Datasets for sign language",
1616
author="Amit Moryossef",
1717
author_email="amitmoryossef@gmail.com",

sign_language_datasets/datasets/dgs_corpus/dgs_corpus.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -58,6 +58,7 @@
5858

5959
_KNOWN_SPLITS = {
6060
"3.0.0-uzh-document": path.join(path.dirname(path.realpath(__file__)), "splits", "split.3.0.0-uzh-document.json"),
61+
"3.0.0-uzh-sentence": path.join(path.dirname(path.realpath(__file__)), "splits", "split.3.0.0-uzh-sentence.json")
6162
}
6263

6364

@@ -377,7 +378,7 @@ def _generate_examples(self, data, split: List[str] | Dict[str, List[str]] = Non
377378
else:
378379
sentences = list(get_elan_sentences(datum["eaf"]))
379380
for sentence in sentences:
380-
if split is not None and sentence["id"] not in split[_id]:
381+
if split is not None and sentence["id"] not in split[document_id]:
381382
continue
382383

383384
if sentence["english"] is None:

0 commit comments

Comments
 (0)