@inproceedings{48e1669606af4ddf8ce981c9102c0bbf,
title = "Knowledge-Infused Retrieval Boosts Few-Shot Hand Gesture Recognition on HaGRID with Vision-Language Model",
abstract = "Hand gesture recognition remains challenging, primarily due to its reliance on large-scale annotated datasets and the limited adaptability of existing models when encountering novel gesture classes. In this work, we propose to apply Adaptive Vision-Language Model (Adaptive-VLM). This lightweight, training-free framework utilizes only one image per class to recognize gestures on the HaGRID benchmark. Built upon the CLIP backbone, our approach incorporates symbolic knowledge-infused prompts, multi-prompt contextualization, and semantic exemplar ranking to improve few-shot generalization. Adaptive-VLM achieves a macro F1-score of 65.75\% on the HaGRID test set (540 images) without any parameter fine-tuning, using 18 example images. It significantly outperforms the Random-VLM baseline (59.95\%) and a ResNet-18 model fine-tuned for 10 epochs (4.09\%) under the same data constraints. These findings highlight the effectiveness of combining structured domain knowledge and guided exemplar selection to overcome data scarcity in low-resource gesture recognition. Adaptive-VLM offers a promising direction for building adaptive and efficient HGR systems, especially in real-world human-computer interaction scenarios requiring rapid deployment with minimal data.",
keywords = "Adaptive Learning, Few-Shot Learning, HaGRID Dataset, Hand Gesture Recognition, Human-Computer Interaction, Knowledge Injection, Prompt Engineering, Vision-Language Models",
author = "Enny Indasyah and Kaori Yoshida",
note = "Publisher Copyright: {\textcopyright} 2025 The Authors.; 24th International Conference on New Trends in Intelligent Software Methodologies, Tools and Techniques, SoMeT 2025 ; Conference date: 23-09-2025 Through 26-09-2025",
year = "2025",
month = sep,
day = "16",
doi = "10.3233/FAIA250540",
language = "English",
series = "Frontiers in Artificial Intelligence and Applications",
publisher = "IOS Press BV",
pages = "396--413",
editor = "Hamido Fujita and Andres Hernandez-Matamoros and Yutaka Watanobe",
booktitle = "New Trends in Intelligent Software Methodologies, Tools and Techniques - Proceedings of the 24th International Conference on New Trends in Intelligent Software Methodologies, Tools and Techniques, SoMeT 2025",
address = "Netherlands",
}