% Conference paper (WASPAA 2023) by Zurale and Dubnov on learning compact HRTF representations.
% The month field follows the conference dates recorded in the note field (22--25 Oct 2023);
% the export's placeholder "1 January" date has been removed.
% NOTE(review): address holds a country rather than a publisher city -- confirm and replace.
@inproceedings{6b0974dc458042f490b4ede06b756f8b,
  author    = {Zurale, Devansh and Dubnov, Shlomo},
  title     = {Learning Sub-Dimensional {HRTF} Representations Towards Individualization Applications - Traditional and Deep Learning Approaches},
  booktitle = {Proceedings of the 2023 {IEEE} Workshop on Applications of Signal Processing to Audio and Acoustics, {WASPAA} 2023},
  series    = {{IEEE} Workshop on Applications of Signal Processing to Audio and Acoustics},
  publisher = {Institute of Electrical and Electronics Engineers},
  address   = {United States},
  year      = {2023},
  month     = oct,
  doi       = {10.1109/WASPAA58266.2023.10248076},
  language  = {English},
  keywords  = {Generative AI, HRTF Modeling, PCA, Representation Learning, VQVAE},
  abstract  = {Individualized Head Related Transfer Functions (HRTFs) are indispensable in order to accurately reproduce spatial audio over headphones. Encoding the high-dimensional HRTFs to a sub-dimensional space has proven to be useful in many previous research efforts in predicting individualized HRTFs. In this work, we provide a comparative study of some traditional methods such as Principal Component Analysis (PCA) or Multi-Layer Perceptron (MLP) based Autoencoders and the more recent generative deep learning approaches such as a Convolutional Neural Network (CNN) based Vector Quantized Variational Autoencoder (VQ-VAE) for learning HRTF representations. We further demonstrate the benefits of using 3D-CNNs for this task to learn correlations between neighboring HRTFs, along both spatial and frequency dimensions. To this end, we provide evidence suggesting that such a 3D-CNN based approach enables the derived latent space to encode features more representative of the individuality of the HRTFs while also allowing for the representations to be significantly more compact. Finally, we also explore the advantages of such robust representations towards downstream applications of predicting Individualized HRTFs.},
  note      = {Publisher Copyright: {\textcopyright} 2023 IEEE.; 2023 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics, WASPAA 2023 ; Conference date: 22-10-2023 Through 25-10-2023},
}