% Conference paper in the IHCI 2023 proceedings (LNCS series).
% The opaque hash-style citation key is kept unchanged so existing citations keep resolving.
% The percent sign in the abstract is escaped: an unescaped one starts a TeX comment once the field is typeset.
@inproceedings{8e7e40c4358742ec84d1074653d95bdf,
  title     = {Deep Learning Approach for Enhanced Object Recognition and Assembly Guidance with Augmented Reality},
  abstract  = {In an effort to enhance the efficiency and precision of manual part assembly in industrial settings, the development of software for assembly guidance becomes imperative. Augmented reality (AR) technology offers a means to provide visual instructions for assembly tasks, rendering the guidance more comprehensible. Nevertheless, a significant challenge lies in the technology{\textquoteright}s limited object detection capabilities, especially when distinguishing between similar assembled parts. This project proposes the utilization of deep learning neural networks to enhance the accuracy of object recognition within the AR guided assembly application. To achieve this objective, a dataset of assembly parts, known as the Visual Object Classes (VOC) dataset, was created. Data augmentation techniques were employed to expand this dataset, incorporating scale HSV (hue saturation value) transformations. Subsequently, deep learning models for the recognition of assembly parts were developed which were based on the Single Shot Multibox Detector (SSD) and the YOLOv7 detector. The models were trained and fine-tuned, targeting on the variations of the positions of detected parts. The effectiveness of this approach was evaluated using a case study involving an educational electronic blocks circuit science kit. The results demonstrated a high assembly part recognition accuracy of over 99\% in mean average precision (MAP), along with favorable user testing outcomes. Consequently, the AR application was capable of offering high-quality guidance to users which holds promise for application in diverse scenarios and the resolution of real-world challenges.},
  keywords  = {Assembly Tasks, Augmented Reality, Object Detection, Object Recognition},
  author    = {Lee, {Boon Giin} and Wang, Xiaoying and Han, Renzhi and Sun, Linjing and Pike, Matthew and Chung, {Wan Young}},
  note      = {Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Switzerland AG 2024.; 15th International Conference on Intelligent Human Computer Interaction, IHCI 2023 ; Conference date: 08-11-2023 Through 10-11-2023},
  year      = {2024},
  doi       = {10.1007/978-3-031-53830-8_11},
  language  = {English},
  isbn      = {9783031538292},
  series    = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
  publisher = {Springer Science and Business Media Deutschland GmbH},
  pages     = {105--114},
  editor    = {Choi, {Bong Jun} and Singh, Dhananjay and Tiwary, {Uma Shanker} and Chung, Wan-Young},
  booktitle = {Intelligent Human Computer Interaction - 15th International Conference, IHCI 2023, Revised Selected Papers},
  address   = {Germany},
}