% Technical report entry for "INK: Intensive Neural Knowledge" (report number MSR-TR-2022-38).
% The report number is stored only in the number field; institution holds just the organisation name.
% NOTE(review): the url host below looks like a proxy/mirror rewrite rather than the
% publisher's own domain -- confirm and replace with the canonical address if so.
@techreport{park2022ink,
  author      = {Park, James and Huang, Qiuyuan and Bisk, Yonatan and Yang, Jianwei and Som, Subhojit and Farhadi, Ali and Choi, Yejin and Gao, Jianfeng},
  title       = {{INK}: Intensive Neural Knowledge},
  institution = {Microsoft},
  number      = {MSR-TR-2022-38},
  year        = {2022},
  month       = jul,
  url         = {http://approjects.co.za/?big=en-us/research/publication/ink-intensive-neural-knowledge-aligned-image-text-retrieval/},
  abstract    = {Knowledge-based vision language systems are increasingly ubiquitous in our everyday lives. However, despite the introduction of numerous benchmarks, the community has siloed models of different types of knowledge rather than building general knowledge-intensive models that encompass both commonsense and factoid knowledge. We introduce INK -- Intensive Neural Knowledge -- a new task that involves extracting the necessary knowledge to accurately perform image and text retrieval. In particular, INK leverages existing resources to require understanding of factoid, object-commonsense, or social-consciousness knowledge to successfully perform retrieval. Finally, we provide a set of competitive baseline models whose weak performance motivates the need to develop new knowledge understanding models and systems.},
}