Dept of Computer Science
Centre Universitaire d'Informatique (CUI)
Université de Genève
% arXiv preprint (CoRR abs/2008.05231). Recorded as @misc with eprint fields:
% the arXiv identifier is not an institution, so @techreport/institution would
% render it as a "Technical Report" issued by "CoRR abs/2008.05231".
% The citation key is unchanged, so existing \cite commands keep working.
@misc{messina:arxiv2008.05231,
  author        = {Messina, Nicola and Amato, Giuseppe and Esuli, Andrea and Falchi, Fabrizio and Gennaro, Claudio and Marchand-Maillet, St{\'e}phane},
  title         = {Fine-grained Visual Textual Alignment for Cross-Modal Retrieval using Transformer Encoders},
  year          = {2020},
  eprint        = {2008.05231},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2008.05231},
}