From 2b7711e7c817e5fc47a3fbe556dcd084db245b10 Mon Sep 17 00:00:00 2001 From: Amit Moryossef Date: Tue, 28 Apr 2026 09:18:41 +0000 Subject: [PATCH 1/2] Add Langer et al. 2024 DW-DGS dictionary citation Cites the corpus-based Digital Dictionary of DGS in the bilingual dictionaries section, since it is a notable corpus-based DGS lexical resource relevant to that discussion. Co-Authored-By: Claude Opus 4.7 (1M context) --- src/index.md | 1 + src/references.bib | 54 ++++++++++++++++++++++++++++++++++++++++++++++ 2 files changed, 55 insertions(+) diff --git a/src/index.md b/src/index.md index 8d9a518..556b441 100644 --- a/src/index.md +++ b/src/index.md @@ -1150,6 +1150,7 @@ or by the confidence score of the signer inference." --> ###### Bilingual dictionaries {-} for signed language [@dataset:mesch2012meaning;@fenlon2015building;@crasborn2016ngt;@dataset:gutierrez2016lse] map a spoken language word or short phrase to a signed language video. One notable dictionary, SpreadTheSign\footnote{\url{https://www.spreadthesign.com/}} is a parallel dictionary containing around 25,000 words with up to 42 different spoken-signed language pairs and more than 600,000 videos in total. Unfortunately, while dictionaries may help create lexical rules between languages, they do not demonstrate the grammar or the usage of signs in context. +@langer-etal-2024-introducing introduce the DW-DGS, the first corpus-based digital dictionary of German Sign Language, providing 1876 entries grounded in the DGS Corpus with senses, authentic example clips, regional distribution maps, and synonym/antonym cross-references via thumbnail "micons" instead of glosses. ###### Fingerspelling corpora {-} usually consist of videos of words borrowed from spoken languages that are signed letter-by-letter. They can be synthetically created [@dataset:dreuw2006modeling] or mined from online resources [@dataset:fs18slt;@dataset:fs18iccv]. However, they only capture one aspect of signed languages. diff --git a/src/references.bib b/src/references.bib index 6ffb2f7..e0b8c13 100644 --- a/src/references.bib +++ b/src/references.bib @@ -4663,3 +4663,57 @@ @inproceedings{klomp-etal-2024-extension url = {https://aclanthology.org/2024.signlang-1.19}, year = {2024} } +} + + + title = "An Extension of the {NGT} Dataset in {G}lobal {S}ignbank", + author = "Klomp, Ulrika and + Gierman, Lisa and + Manders, Pieter and + Nauta, Ellen and + Otterspeer, Gom{\`e}r and + Pelupessy, Ray and + Stern, Galya and + Venter, Dalene and + Wubbolts, Casper and + Oomen, Marloes and + Roelofsen, Floris", +} + +@inproceedings{sharma-etal-2024-facial, + title = "Facial Expressions for Sign Language Synthesis using {FACSH}uman and {AZ}ee", + author = "Sharma, Paritosh and + Challant, Camille and + Filhol, Michael", +} + +@inproceedings{langer-etal-2024-introducing, + title = "Introducing the {DW}-{DGS} {--} The Digital Dictionary of {DGS}", + author = {Langer, Gabriele and + M{\"u}ller, Anke and + W{\"a}hl, Sabrina and + Otte, Felicitas and + Sepke, Lea and + Hanke, Thomas}, + editor = "Efthimiou, Eleni and + Fotinea, Stavroula-Evita and + Hanke, Thomas and + Hochgesang, Julie A. and + Mesch, Johanna and + Schulder, Marc", + booktitle = "Proceedings of the LREC-COLING 2024 11th Workshop on the Representation and Processing of Sign Languages: Evaluation of Sign Language Resources", + month = may, + year = "2024", + address = "Torino, Italia", + publisher = "ELRA and ICCL", + url = "https://aclanthology.org/2024.signlang-1.19/", + pages = "178--183" +} + + url = "https://aclanthology.org/2024.signlang-1.39/", + pages = "354--360" +} + + url = "https://aclanthology.org/2024.signlang-1.21/", + pages = "194--203" +} From d36e8ac080dd9a6897216e0ecf1dc73d7313e89e Mon Sep 17 00:00:00 2001 From: AmitMY Date: Tue, 28 Apr 2026 09:49:43 +0000 Subject: [PATCH 2/2] Move langer-etal entry to Dataset Papers section (review feedback) --- src/index.md | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/src/index.md b/src/index.md index 556b441..119a1b0 100644 --- a/src/index.md +++ b/src/index.md @@ -1139,7 +1139,7 @@ Research papers which do not necessarily contribute new theory or architectures @hall-etal-2024-phonological digitized and phonologically transcribed the Canadian Dictionary of ASL using the Sign Language Phonetic Annotator-Analyzer software, producing a searchable resource that captured handshape, movement, location, and relation parameters for roughly 2000 signs to enable phonologically based queries that paper-based dictionaries cannot support. -The Public DGS Corpus also saw multiple SignLang 2024 contributions: @konrad-etal-2024-corpus describe its fourth release, expanding it to 52.4 hours, adding a new iLex-based portal alongside MY DGS, MY DGS – annotated and MY DGS – ANNIS, and providing additional MediaPipe and Apple Vision Framework pose representations including 3D keypoint estimates; @isard-2024-building introduced a web-based Query Wizard that guided users through the construction of valid ANNIS Query Language expressions over the corpus by composing context-sensitive blocks for annotation tiers, metadata, and inter-tier connections. +The Public DGS Corpus also saw multiple SignLang 2024 contributions: @konrad-etal-2024-corpus describe its fourth release, expanding it to 52.4 hours, adding a new iLex-based portal alongside MY DGS, MY DGS – annotated and MY DGS – ANNIS, and providing additional MediaPipe and Apple Vision Framework pose representations including 3D keypoint estimates; @isard-2024-building introduced a web-based Query Wizard that guided users through the construction of valid ANNIS Query Language expressions over the corpus by composing context-sensitive blocks for annotation tiers, metadata, and inter-tier connections; and @langer-etal-2024-introducing introduce the DW-DGS, the first corpus-based digital dictionary of German Sign Language, providing 1876 entries grounded in the DGS Corpus with senses, authentic example clips, regional distribution maps, and synonym/antonym cross-references via thumbnail "micons" instead of glosses. @klomp-etal-2024-extension describe an ongoing extension of the Sign Language of the Netherlands (NGT) dataset in Global Signbank, aiming to add approximately 11,000 new glosses, 3,000 example sentences, multi-angle videos with non-manual expressions, phonological annotations, and motion capture data to support both linguistic research and automatic recognition. @@ -1150,7 +1150,6 @@ or by the confidence score of the signer inference." --> ###### Bilingual dictionaries {-} for signed language [@dataset:mesch2012meaning;@fenlon2015building;@crasborn2016ngt;@dataset:gutierrez2016lse] map a spoken language word or short phrase to a signed language video. One notable dictionary, SpreadTheSign\footnote{\url{https://www.spreadthesign.com/}} is a parallel dictionary containing around 25,000 words with up to 42 different spoken-signed language pairs and more than 600,000 videos in total. Unfortunately, while dictionaries may help create lexical rules between languages, they do not demonstrate the grammar or the usage of signs in context. -@langer-etal-2024-introducing introduce the DW-DGS, the first corpus-based digital dictionary of German Sign Language, providing 1876 entries grounded in the DGS Corpus with senses, authentic example clips, regional distribution maps, and synonym/antonym cross-references via thumbnail "micons" instead of glosses. ###### Fingerspelling corpora {-} usually consist of videos of words borrowed from spoken languages that are signed letter-by-letter. They can be synthetically created [@dataset:dreuw2006modeling] or mined from online resources [@dataset:fs18slt;@dataset:fs18iccv]. However, they only capture one aspect of signed languages.