% Bibliography database: keyword and phrase query processing, peer-to-peer
% keyword search, and the tools and data sets referenced alongside them.
%
% Conventions used in this file:
%   - one field per line, brace-delimited values;
%   - names are written "Last, First" and separated by " and ";
%   - doi holds the bare identifier (no resolver prefix);
%   - page ranges use "--";
%   - journal names are shared through the string macros defined below, so
%     every entry citing the same journal spells it the same way.

@string{TOIS = {ACM Transactions on Information Systems}}
@string{IPM  = {Information Processing \& Management}}
@string{DKE  = {Data \& Knowledge Engineering}}

@inproceedings{mkq,
  author    = {Chaudhuri, Surajit and Church, Kenneth and K{\"o}nig, Arnd Christian and Sui, Liying},
  title     = {Heavy-tailed distributions and multi-keyword queries},
  booktitle = {{SIGIR} '07: Proceedings of the 30th annual international {ACM} {SIGIR} conference on Research and development in information retrieval},
  year      = {2007},
  isbn      = {978-1-59593-597-7},
  pages     = {663--670},
  location  = {Amsterdam, The Netherlands},
  doi       = {10.1145/1277741.1277855},
  publisher = {ACM},
  address   = {New York, NY, USA},
}

% Conference paper: the symposium name belongs in booktitle, not journal.
@inproceedings{mkp2p,
  author    = {Liu, Lintao and Ryu, Kyung Dong and Lee, Kang-Won},
  title     = {Keyword fusion to support efficient keyword-based search in peer-to-peer file sharing},
  booktitle = {{IEEE} International Symposium on Cluster Computing and the Grid ({CCGrid} 2004)},
  year      = {2004},
  month     = apr,
  pages     = {269--276},
  keywords  = {Internet, client-server systems, file organisation, query formulation DHT, Internet, P2P computing, distributed computing, distributed hash table, keyword fusion, keyword-based search, network bandwidth consumption, peer-to-peer file sharing, storage consumption, trace-driven simulations},
  doi       = {10.1109/CCGrid.2004.1336577},
}

@article{combined,
  author    = {Williams, Hugh E. and Zobel, Justin and Bahle, Dirk},
  title     = {Fast phrase querying with combined indexes},
  journal   = TOIS,
  volume    = {22},
  number    = {4},
  year      = {2004},
  issn      = {1046-8188},
  pages     = {573--594},
  doi       = {10.1145/1028099.1028102},
  publisher = {ACM},
  address   = {New York, NY, USA},
}

@article{common,
  author    = {Chang, Matthew and Poon, Chung Keung},
  title     = {Efficient phrase querying with common phrase index},
  journal   = IPM,
  volume    = {44},
  number    = {2},
  year      = {2008},
  issn      = {0306-4573},
  pages     = {756--769},
  doi       = {10.1016/j.ipm.2007.06.003},
  publisher = {Pergamon Press, Inc.},
  address   = {Tarrytown, NY, USA},
}

@article{medical,
  author    = {Mao, Wenlei and Chu, Wesley W.},
  title     = {The phrase-based vector space model for automatic retrieval of free-text medical documents},
  journal   = DKE,
  volume    = {61},
  number    = {1},
  year      = {2007},
  issn      = {0169-023X},
  pages     = {76--92},
  doi       = {10.1016/j.datak.2006.02.008},
  publisher = {Elsevier Science Publishers B. V.},
  address   = {Amsterdam, The Netherlands},
}

@inproceedings{auxil,
  author    = {Bahle, Dirk and Williams, Hugh E. and Zobel, Justin},
  title     = {Efficient phrase querying with an auxiliary index},
  booktitle = {{SIGIR} '02: Proceedings of the 25th annual international {ACM} {SIGIR} conference on Research and development in information retrieval},
  year      = {2002},
  isbn      = {1-58113-561-0},
  pages     = {215--221},
  location  = {Tampere, Finland},
  doi       = {10.1145/564376.564415},
  publisher = {ACM},
  address   = {New York, NY, USA},
}

@inproceedings{nouns,
  author    = {Zhang, Wei and Liu, Shuang and Yu, Clement and Sun, Chaojing and Liu, Fang and Meng, Weiyi},
  title     = {Recognition and classification of noun phrases in queries for effective retrieval},
  booktitle = {{CIKM} '07: Proceedings of the sixteenth {ACM} conference on information and knowledge management},
  year      = {2007},
  isbn      = {978-1-59593-803-9},
  pages     = {711--720},
  location  = {Lisbon, Portugal},
  doi       = {10.1145/1321440.1321540},
  publisher = {ACM},
  address   = {New York, NY, USA},
}

% NOTE(review): only author, title and year are recorded for this work;
% confirm the venue or report type and add it.
@misc{kss,
  author = {Kaashoek, Frans and Gnawali, Omprakash D.},
  title  = {A Keyword Set Search System for Peer-to-Peer Networks},
  year   = {2002},
}

% NOTE(review): exported while the article was still in press (see posted-at),
% so no year, volume or pages are recorded. The in-press status is kept in
% note; add the final year/volume/pages once confirmed with the publisher.
@article{short,
  author               = {Kumaran, Giridhar and Allan, James},
  title                = {Adapting information retrieval systems to user queries},
  journal              = IPM,
  note                 = {In Press, Corrected Proof},
  doi                  = {10.1016/j.ipm.2007.12.006},
  url                  = {http://dx.doi.org/10.1016/j.ipm.2007.12.006},
  keywords             = {context, information\_retrieval},
  citeulike-article-id = {2813349},
  posted-at            = {2008-10-22 13:27:30},
  priority             = {2},
}

@book{ricardo,
  author    = {Baeza-Yates, Ricardo A. and Ribeiro-Neto, Berthier},
  title     = {Modern Information Retrieval},
  year      = {1999},
  isbn      = {020139829X},
  publisher = {Addison-Wesley Longman Publishing Co., Inc.},
  address   = {Boston, MA, USA},
}

% Web resource without an author. Acronyms and proper nouns in the title are
% braced so sentence-casing styles do not lowercase them.
@misc{21578,
  title        = {Machine Learning for Natural Language Processing - {ESSLLI} 2007 - {Reuters} 21578 {XML}},
  howpublished = {\url{http://ronaldo.cs.tcd.ie/esslli07/data/reuters21578-xml/}},
  url          = {http://ronaldo.cs.tcd.ie/esslli07/data/reuters21578-xml/},
}

% Research report (no journal): recorded as a technical report with the
% issuing body as institution and the report series as type.
@techreport{porter,
  author      = {van Rijsbergen, C. J. and Robertson, S. E. and Porter, M. F.},
  title       = {New models in probabilistic information retrieval},
  type        = {British Library Research and Development Report},
  number      = {5587},
  institution = {British Library},
  address     = {London},
  year        = {1980},
  keywords    = {da porter stemmer},
}

@misc{dbmbench,
  author       = {Hirabayashi, Mikio},
  title        = {Benchmark {Test} of {DBM} {Brothers}},
  howpublished = {\url{http://tokyocabinet.sourceforge.net/benchmark.pdf}},
}

@misc{tc,
  author       = {Hirabayashi, Mikio},
  title        = {Introduction to {Tokyo} {Products}},
  howpublished = {\url{http://tokyocabinet.sourceforge.net/tokyoproducts.pdf}},
}

% Underscores are left unescaped inside \url{...}: the url package typesets
% its argument verbatim, so a backslash-escaped underscore would print the
% backslash as part of the address.
@misc{stopw,
  title        = {Linguistic Utils: Stop word list},
  howpublished = {\url{http://www.dcs.gla.ac.uk/idom/ir_resources/linguistic_utils/stop_words}},
}