% Conference paper: Tangent-V (Davila et al.), in the ECIR 2019 proceedings (LNCS).
% The citation key looks like an exporter-generated hash; it is kept unchanged so
% existing \cite commands keep resolving.
% The DOI is stored bare (no LaTeX escaping) so url-aware styles can link it.
% eventtitle/eventdate/copyright hold data that used to sit in the note field;
% classic BibTeX styles ignore fields they do not know, biblatex uses the event fields.
% NOTE(review): address is the publisher's city (Cham for Springer Nature
% Switzerland AG), not the conference venue -- confirm against the volume.
@inproceedings{76935a69aa154eba94e4af72b399f519,
  author     = {Davila, Kenny and Joshi, Ritvik and Setlur, Srirangaraj and Govindaraju, Venu and Zanibbi, Richard},
  title      = {{Tangent-V}: Math formula image search using line-of-sight graphs},
  booktitle  = {Advances in Information Retrieval -- 41st European Conference on {IR} Research, {ECIR} 2019, Proceedings},
  editor     = {Hiemstra, Djoerd and Mayr, Philipp and Fuhr, Norbert and Hauff, Claudia and Stein, Benno and Azzopardi, Leif},
  series     = {Lecture Notes in Computer Science},
  publisher  = {Springer},
  address    = {Cham},
  year       = {2019},
  pages      = {681--695},
  doi        = {10.1007/978-3-030-15712-8_44},
  isbn       = {9783030157111},
  language   = {English},
  keywords   = {Graphics search, Image search, Mathematical Information Retrieval (MIR), PDF symbol extraction},
  abstract   = {We present a visual search engine for graphics such as math, chemical diagrams, and figures. Graphics are represented using Line-of-Sight (LOS) graphs, with symbols connected only when they can {\textquoteleft}see{\textquoteright} each other along an unobstructed line. Symbol identities may be provided (e.g., in PDF) or taken from Optical Character Recognition applied to images. Graphics are indexed by pairs of symbols that {\textquoteleft}see{\textquoteright} each other using their labels, spatial displacement, and size ratio. Retrieval has two layers: the first matches query symbol pairs in an inverted index, while the second aligns candidates with the query and scores the resulting matches using the identity and relative position of symbols. For PDFs, we also introduce a new tool that quickly extracts characters and their locations. We have applied our model to the NTCIR-12 Wikipedia Formula Browsing Task, and found that the method can locate relevant matches without unification of symbols or using a math expression grammar. In the future, one might index LOS graphs for entire pages and search for text and graphics. Our source code has been made publicly available.},
  eventtitle = {41st European Conference on Information Retrieval, {ECIR} 2019},
  eventdate  = {2019-04-14/2019-04-18},
  copyright  = {{\textcopyright} Springer Nature Switzerland AG 2019},
}