% Conference paper in the I3DA 2025 proceedings (IEEE); cleaned-up database export.
% - month follows the conference date recorded by the export
%   (10-09-2025 through 12-09-2025); the exported jan / day 1 predates the event.
% - booktitle carries the full proceedings title, which the export had split
%   between a truncated booktitle and a duplicate series field.
% - note keeps only the conference date; the copyright statement lives in the
%   non-standard copyright field, which standard styles do not print.
% - NOTE(review): address holds a country, not a publisher city; value kept
%   as exported -- confirm the publisher location before relying on it.
% - NOTE(review): author order is kept exactly as exported -- confirm against the paper.
@inproceedings{06c4d2f5702f42a9a10a5a68a05d3eca,
  author    = {Rafaely, Boaz and Weinzierl, Stefan and Berebi, Or and Brinkmann, Fabian},
  title     = {Loss functions incorporating auditory spatial perception in deep learning -- a review},
  booktitle = {2025 Immersive and {3D} Audio: from Architecture to Automotive, {I3DA} 2025},
  publisher = {Institute of Electrical and Electronics Engineers},
  address   = {United States},
  year      = {2025},
  month     = sep,
  doi       = {10.1109/I3DA65421.2025.11202063},
  language  = {English},
  keywords  = {Spatial audio, audio signal processing, deep learning, machine learning, perceptual loss, spatial perception},
  abstract  = {Binaural reproduction aims to deliver immersive spatial audio with high perceptual realism over headphones. Loss functions play a central role in optimizing and evaluating algorithms that generate binaural signals. However, traditional signal-related difference measures often fail to capture the perceptual properties that are essential to spatial audio quality. This review paper surveys recent loss functions that incorporate spatial perception cues relevant to binaural reproduction. It focuses on losses applied to binaural signals, which are often derived from microphone recordings or Ambisonics signals, while excluding those based on room impulse responses. Guided by the Spatial Audio Quality Inventory (SAQI), the review emphasizes perceptual dimensions related to source localization and room response, while excluding general spectral–temporal attributes. The literature survey reveals a strong focus on localization cues, such as interaural time and level differences (ITDs, ILDs), while reverberation and other room acoustic attributes remain less explored in loss function design. Recent works that estimate room acoustic parameters and develop embeddings that capture room characteristics indicate their potential for future integration into neural network training. The paper concludes by highlighting future research directions toward more perceptually grounded loss functions that better capture the listener's spatial experience.},
  note      = {Conference date: 10--12 September 2025},
  copyright = {{\textcopyright} 2025 IEEE},
}