% Journal article describing the WLRI-HRC thermal image dataset and a CNN evaluation on it.
% Review notes:
%   - The citation key is now plain ASCII. The former key embedded a LaTeX
%     umlaut escape (braces, backslash, double quote), which ends the key early
%     in a brace-delimited entry. Documents citing the old key must be updated.
%   - "institution" is not a standard field for this entry type and is normally
%     ignored by styles; it is kept as repository metadata.
@article{SumePonomarjovaWendtetal.2025,
  author      = {S{\"u}me, Sinan and Ponomarjova, Katrin-Misel and Wendt, Thomas and Rupitsch, Stefan},
  title       = {Enhancing human-robot collaboration with thermal images and deep neural networks: the unique thermal industrial dataset {WLRI-HRC} and evaluation of convolutional neural networks},
  journal     = {Journal of Sensors and Sensor Systems},
  volume      = {14},
  number      = {1},
  pages       = {37--46},
  year        = {2025},
  issn        = {2194-8771},
  doi         = {10.5194/jsss-14-37-2025},
  institution = {Fakult{\"a}t Wirtschaft (W)},
  language    = {en},
  abstract    = {This contribution introduces the use of convolutional neural networks to detect humans and collaborative robots (cobots) in human-robot collaboration (HRC) workspaces based on their thermal radiation fingerprint. The unique data acquisition includes an infrared camera, two cobots, and up to two persons walking and interacting with the cobots in real industrial settings. The dataset also includes different thermal distortions from other heat sources. In contrast to data from the public environment, this data collection addresses the challenges of indoor manufacturing, such as heat distortions from the environment, and allows for it to be applicable in indoor manufacturing. The Work-Life Robotics Institute HRC (WLRI-HRC) dataset contains 6485 images with over 20 000 instances to detect. In this research, the dataset is evaluated for implementation by different convolutional neural networks: first, one-stage methods, i.e., You Only Look Once (YOLO v5, v8, v9 and v10) in different model sizes and, secondly, two-stage methods with Faster R-CNN with three variants of backbone structures (ResNet18, ResNet50 and VGG16). The results indicate promising results with the best mean average precision at an intersection over union (IoU) of 50 (mAP50) value achieved by YOLOv9s (99.4 \%), the best mAP50-95 value achieved by YOLOv9s and YOLOv8m (90.2 \%), and the fastest prediction time of 2.2 ms achieved by the YOLOv10n model.
    Further differences in detection precision and time between the one-stage and multi-stage methods are discussed. Finally, this paper examines the possibility of the Clever Hans phenomenon to verify the validity of the training data and the models' prediction capabilities.},
}