@InProceedings{SODA2001b,
AUTHOR = {Erik D. Demaine and Alejandro L\'opez-Ortiz},
TITLE = {A Linear Lower Bound on Index Size for Text Retrieval},
BOOKTITLE = {Proceedings of the 12th Annual ACM-SIAM Symposium on
Discrete Algorithms (SODA 2001)},
bookurl = {http://www.siam.org/meetings/da01/},
ADDRESS = {Washington, DC},
MONTH = {January 7--9},
YEAR = 2001,
PAGES = {289--294},
award = {Invited to special issue of \emph{Journal of Algorithms}.},
length = {6 pages},
ee = {http://dl.acm.org/citation.cfm?id=365411.365460},
papers = {TextSearchLB_JAlgorithms},
dblp = {https://dblp.org/rec/conf/soda/DemaineL01},
}
In this work we prove a linear lower bound on the size of any index that reports the location (if any) of a substring in the text in time proportional to the length of the pattern. In other words, an index supporting linear-time substring searches requires about as much space as the original text. Here “time” is measured in the number of bit probes to the text; an arbitrary amount of computation may be done on an arbitrary amount of the index. Our lower bound applies to inverted word indices as well.