% Conference paper "Visually Precise Query", MM 2020 proceedings, pp. 3550--3558.
% NOTE(review): the exported address read "USA United States" (garbled); it is
% replaced here with the publisher's location -- confirm against the publisher record.
% The exported "series" field duplicated "booktitle" verbatim and was dropped.
@inproceedings{7d73a2f9c9d14c148deeb64c15b3295c,
  author    = {Dasgupta, Riddhiman and Tom, Francis and Kumar, Sudhir and {Das Gupta}, Mithun and Kumar, Yokesh and Patro, Badri N. and Namboodiri, Vinay P.},
  title     = {Visually Precise Query},
  booktitle = {{MM} 2020 - Proceedings of the 28th {ACM} International Conference on Multimedia},
  publisher = {Association for Computing Machinery},
  address   = {New York, NY, USA},
  pages     = {3550--3558},
  year      = {2020},
  month     = oct,
  day       = {12},
  doi       = {10.1145/3394171.3413558},
  language  = {English},
  keywords  = {e-commerce, hybrid fusion, multi-modal information retrieval, visual attributes},
  note      = {28th {ACM} International Conference on Multimedia, {MM} 2020; Conference date: 2020-10-12 through 2020-10-16},
  abstract  = {We present the problem of Visually Precise Query (VPQ) generation which enables a more intuitive match between a user's information need and an e-commerce site's product description. Given an image of a fashion item, what is the most optimum search query that will retrieve the exact same or closely related product(s) with high probability. In this paper we introduce the task of VPQ generation which takes a product image and its title as its input and provides a word level extractive summary of the title, containing a list of salient attributes, which can now be used as a query to search for similar products. We collect a large dataset of fashion images and their titles and merge it with an existing research dataset which was created for a different task. Given the image and title pair, VPQ problem is posed as identifying a non-contiguous collection of spans within the title. We provide a dataset of around 400K image, title and corresponding VPQ entries and release it to the research community. We provide a detailed description of the data collection process as well as discuss the future direction of research for the problem introduced in this work. We provide the standard text as well as visual domain baseline comparisons and also provide multi-modal baseline models to analyze the task introduced in this work. Finally, we propose a hybrid fusion model which promises to be the direction of research in the multi-modal community.},
}