% Workshop paper record, exported from refbase (record 3648).
% - Author names use the unambiguous "Last, First" form so that the compound
%   surname "Jacques Junior" is not split by the name parser.
% - Words in the title that must keep their capitals under sentence-casing
%   styles are brace-protected.
% - A field name may appear only once per entry, so the group/project tags stay
%   in optnote and the refbase export note lives in optexportnote; both are
%   ignored by standard styles.
@inproceedings{DavidCurto2021,
  author        = {Curto, David
                   and Clapes, Albert
                   and Selva, Javier
                   and Smeureanu, Sorina
                   and Jacques Junior, Julio C. S.
                   and Gallardo-Pujol, David
                   and Guilera, Georgina
                   and Leiva, David
                   and Moeslund, Thomas B.
                   and Escalera, Sergio
                   and Palmero, Cristina},
  title         = {{Dyadformer}: A Multi-Modal {Transformer} for Long-Range Modeling of Dyadic Interactions},
  booktitle     = {{IEEE/CVF} International Conference on Computer Vision Workshops},
  year          = {2021},
  pages         = {2177--2188},
  abstract      = {Personality computing has become an emerging topic in computer vision, due to the wide range of applications it can be used for. However, most works on the topic have focused on analyzing the individual, even when applied to interaction scenarios, and for short periods of time. To address these limitations, we present the Dyadformer, a novel multi-modal multi-subject Transformer architecture to model individual and interpersonal features in dyadic interactions using variable time windows, thus allowing the capture of long-term interdependencies. Our proposed cross-subject layer allows the network to explicitly model interactions among subjects through attentional operations. This proof-of-concept approach shows how multi-modality and joint modeling of both interactants for longer periods of time helps to predict individual attributes. With Dyadformer, we improve state-of-the-art self-reported personality inference results on individual subjects on the UDIVA v0.5 dataset.},
  optnote       = {HUPBA; no proj;MILAB},
  optexportnote = {exported from refbase (http://refbase.cvc.uab.es/show.php?record=3648), last updated on Mon, 24 Oct 2022 13:44:59 +0200},
  doi           = {10.1109/ICCVW54120.2021.00247},
  file          = {:http://refbase.cvc.uab.es/files/CCS2021.pdf:PDF},
}