@inproceedings{e2300b8b074c484296676eade158c5bb,
title = "Having Your Cake and Eating it Too: Training Neural Retrieval for Language Inference without Losing Lexical Match",
abstract = "We present a study on the importance of information retrieval (IR) techniques for both the interpretability and the performance of neural question answering (QA) methods. We show that the current state-of-the-art transformer methods (like RoBERTa) encode poorly simple information retrieval (IR) concepts such as lexical overlap between query and the document. To mitigate this limitation, we introduce a supervised RoBERTa QA method that is trained to mimic the behavior of BM25 and the soft-matching idea behind embedding-based alignment methods. We show that fusing the simple lexical-matching IR concepts in transformer techniques results in improvement a) of their (lexical-matching) interpretability, b) retrieval performance, and c) the QA performance on two multi-hop QA datasets. We further highlight the lexical-chasm gap bridging capabilities of transformer methods by analyzing the attention distributions of the supervised RoBERTa classifier over the context versus lexically-matched token pairs.",
keywords = "interpretability, question answering, semantic alignment, transformers",
author = "Vikas Yadav and Steven Bethard and Mihai Surdeanu",
note = "Publisher Copyright: {\textcopyright} 2020 ACM.; 43rd Annual International ACM SIGIR Conference on Research and Development in Information Retrieval, SIGIR 2020 ; Conference date: 25-07-2020 Through 30-07-2020",
year = "2020",
month = jul,
day = "25",
doi = "10.1145/3397271.3401311",
language = "English (US)",
series = "SIGIR 2020 - Proceedings of the 43rd International ACM SIGIR Conference on Research and Development in Information Retrieval",
publisher = "Association for Computing Machinery, Inc",
pages = "1625--1628",
booktitle = "SIGIR 2020 - Proceedings of the 43rd International ACM SIGIR Conference on Research and Development in Information Retrieval",
}