@inproceedings{khan:26047:sign-lang:lrec,
  author    = {Khan, Sarmad and McLoughlin, Simon D. and Murtagh, Irene},
  title     = {A Comparative Analysis of Traditional and Contemporary Visual Features for Computational Annotation of {Irish} {Sign} {Language}},
  pages     = {239--247},
  editor    = {Efthimiou, Eleni and Fotinea, Stavroula-Evita and Hanke, Thomas and Hochgesang, Julie A. and Mesch, Johanna and Schulder, Marc},
  booktitle = {Proceedings of the {LREC2026} 12th Workshop on the Representation and Processing of Sign Languages: Language in Motion},
  maintitle = {15th International Conference on Language Resources and Evaluation ({LREC} 2026)},
  publisher = {{European Language Resources Association (ELRA)}},
  address   = {Palma, Mallorca, Spain},
  day       = {16},
  month     = may,
  year      = {2026},
  isbn      = {978-2-493814-82-1},
  language  = {english},
  url       = {https://www.sign-lang.uni-hamburg.de/lrec/pub/26047.html},
  abstract  = {Automatic annotation of sign language data is critical for advancing linguistic research and developing sign language technologies, yet it remains a major bottleneck due to the inherently motion-based and multi-modal nature of signing. Irish Sign Language, like many sign languages, presents challenges for computational annotation and sign language processing due to limited annotated corpora and the inherent difficulty of reliably annotating movement, trajectories, and coarticulation across manual and non-manual articulators. This paper presents an automated computational framework for gloss-level annotation support in Irish Sign Language, designed to assist scalable corpus annotation by learning motion-related cues directly from sign language videos. Using ELAN-aligned segments from the Signs of Ireland Corpus, we compare contemporary self-supervised visual representations with traditional pose-based features derived from explicit skeletal tracking, evaluating three feature configurations: DINOv2, MediaPipe, and multi-modal fusion. Our results show that self-supervised visual embeddings achieve the highest average accuracy 86.12{\%}, outperforming both multi-modal fusion 84.28{\%} and pose-based representations 76.74{\%}. This indicates that recent visual models can implicitly encode linguistically relevant motion information, including articulator movement and transitional dynamics, reducing the need for explicit landmark extraction in practical annotation pipelines. Overall, this work provides empirical guidance and a deployable computational framework to support computational annotation and enrichment of sign language corpora.}
}

@inproceedings{khan:24043:sign-lang:lrec,
  author    = {Khan, Sarmad and Murtagh, Irene and McLoughlin, Simon D.},
  title     = {Investigating Motion History Images and Convolutional Neural Networks for Isolated {Irish} {Sign} {Language} Fingerspelling Recognition},
  pages     = {140--146},
  editor    = {Efthimiou, Eleni and Fotinea, Stavroula-Evita and Hanke, Thomas and Hochgesang, Julie A. and Mesch, Johanna and Schulder, Marc},
  booktitle = {Proceedings of the {LREC-COLING} 2024 11th Workshop on the Representation and Processing of Sign Languages: Evaluation of Sign Language Resources},
  maintitle = {2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation ({LREC-COLING} 2024)},
  publisher = {{ELRA Language Resources Association (ELRA) and the International Committee on Computational Linguistics (ICCL)}},
  address   = {Torino, Italy},
  day       = {25},
  month     = may,
  year      = {2024},
  isbn      = {978-2-493814-30-2},
  language  = {english},
  url       = {https://www.sign-lang.uni-hamburg.de/lrec/pub/24043.html},
  abstract  = {The limited global competency in sign language makes the objective of improving communication for the deaf and hard-of-hearing community through computational processing both vital and necessary. In an effort to address this problem, our research leverages the Irish Sign Language hand shape (ISL-HS) dataset and state-of-the-art deep learning architectures to recognize the Irish Sign Language alphabet. We streamline the feature extraction methodology and pave the way for the efficient use of Convolutional Neural Networks (CNNs) by using Motion History Images (MHIs) for monitoring the sign language motions. The effectiveness of numerous powerful CNN architectures in deciphering the intricate patterns of motion captured in MHIs is investigated in this research. The process includes generating MHIs from the ISL dataset and then using these images to train several CNN neural network models and evaluate their ability to recognize the Irish Sign Language alphabet. The results demonstrate the possibility of investigating MHIs with advanced CNNs to enhance sign language recognition, with a noteworthy accuracy percentage. By contributing to the development of language processing tools and technologies for Irish Sign Language, this research has the potential to address the lack of technological communicative accessibility and inclusion for the deaf and hard-of-hearing community in Ireland.}
}

