@inproceedings{Hashemi2020Antique,
  author    = {Helia Hashemi and Mohammad Aliannejadi and Hamed Zamani and Bruce Croft},
  title     = {{ANTIQUE}: A Non-Factoid Question Answering Benchmark},
  booktitle = {ECIR},
  year      = {2020},
}

@misc{Graff2002Aquaint,
  author    = {David Graff},
  title     = {The {AQUAINT} Corpus of {English} News Text},
  publisher = {Linguistic Data Consortium},
  year      = {2002},
  url       = {https://catalog.ldc.upenn.edu/LDC2002T31},
}

@inproceedings{Voorhees2005Robust,
  author    = {Ellen M. Voorhees},
  title     = {Overview of the {TREC} 2005 Robust Retrieval Track},
  booktitle = {TREC},
  year      = {2005},
}

@inproceedings{Dalton2019Cast,
  author    = {Jeffrey Dalton and Chenyan Xiong and Jamie Callan},
  title     = {{CAsT} 2019: The Conversational Assistance Track Overview},
  booktitle = {TREC},
  year      = {2019},
}

@inproceedings{Dalton2020Cast,
  author    = {Jeffrey Dalton and Chenyan Xiong and Jamie Callan},
  title     = {{CAsT} 2020: The Conversational Assistance Track Overview},
  booktitle = {TREC},
  year      = {2020},
}

% "Heterogenous" is kept exactly as spelled in the entry's title.
@article{Thakur2021Beir,
  author  = {Thakur, Nandan and Reimers, Nils and R{\"u}ckl{\'e}, Andreas and Srivastava, Abhishek and Gurevych, Iryna},
  title   = {{BEIR}: A Heterogenous Benchmark for Zero-shot Evaluation of Information Retrieval Models},
  journal = {arXiv preprint arXiv:2104.08663},
  month   = apr,
  year    = {2021},
  url     = {https://arxiv.org/abs/2104.08663},
}

@inproceedings{Wachsmuth2018Arguana,
  author    = {Wachsmuth, Henning and Syed, Shahbaz and Stein, Benno},
  title     = {Retrieval of the Best Counterargument without Prior Topic Knowledge},
  booktitle = {Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)},
  publisher = {Association for Computational Linguistics},
  location  = {Melbourne, Australia},
  pages     = {241--251},
  year      = {2018},
  url       = {http://aclweb.org/anthology/P18-1023},
}

@article{Diggelmann2020CLIMATEFEVERAD,
  author  = {Thomas Diggelmann and Jordan L. Boyd-Graber and Jannis Bulian and Massimiliano Ciaramita and Markus Leippold},
  title   = {{CLIMATE-FEVER}: A Dataset for Verification of Real-World Climate Claims},
  journal = {ArXiv},
  volume  = {abs/2012.00614},
  year    = {2020},
}

@inproceedings{Hasibi2017DBpediaEntityVA,
  author    = {Faegheh Hasibi and Fedor Nikolaev and Chenyan Xiong and Krisztian Balog and Svein Erik Bratsberg and Alexander Kotov and Jamie Callan},
  title     = {{DBpedia-Entity} v2: A Test Collection for Entity Search},
  booktitle = {Proceedings of the 40th International {ACM} {SIGIR} Conference on Research and Development in Information Retrieval},
  year      = {2017},
}

@inproceedings{Thorne2018Fever,
  author    = {Thorne, James and Vlachos, Andreas and Christodoulopoulos, Christos and Mittal, Arpit},
  title     = {{FEVER}: a Large-scale Dataset for Fact Extraction and {VER}ification},
  booktitle = {Proceedings of the 2018 Conference of the North {A}merican Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long Papers)},
  publisher = {Association for Computational Linguistics},
  address   = {New Orleans, Louisiana},
  month     = jun,
  year      = {2018},
  pages     = {809--819},
  doi       = {10.18653/v1/N18-1074},
  url       = {https://www.aclweb.org/anthology/N18-1074},
}

% The doubled "the The" in the proceedings title is kept as given in the entry.
@inproceedings{Maia2018Fiqa,
  author    = {Macedo Maia and Siegfried Handschuh and Andr{\'e} Freitas and Brian Davis and Ross McDermott and Manel Zarrouk and Alexandra Balahur},
  title     = {{WWW'18} Open Challenge: Financial Opinion Mining and Question Answering},
  booktitle = {Companion Proceedings of the The Web Conference 2018},
  year      = {2018},
}

@inproceedings{Yang2018Hotpotqa,
  author    = {Yang, Zhilin and Qi, Peng and Zhang, Saizheng and Bengio, Yoshua and Cohen, William and Salakhutdinov, Ruslan and Manning, Christopher D.},
  title     = {{H}otpot{QA}: A Dataset for Diverse, Explainable Multi-hop Question Answering},
  booktitle = {Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing},
  publisher = {Association for Computational Linguistics},
  address   = {Brussels, Belgium},
  month     = oct # "-" # nov,
  year      = {2018},
  pages     = {2369--2380},
  doi       = {10.18653/v1/D18-1259},
  url       = {https://www.aclweb.org/anthology/D18-1259},
}

@inproceedings{Bajaj2016Msmarco,
  author    = {Payal Bajaj and Daniel Campos and Nick Craswell and Li Deng and Jianfeng Gao and Xiaodong Liu and Rangan Majumder and Andrew McNamara and Bhaskar Mitra and Tri Nguyen and Mir Rosenberg and Xia Song and Alina Stoica and Saurabh Tiwary and Tong Wang},
  title     = {{MS MARCO}: A Human Generated {MAchine} Reading {COmprehension} Dataset},
  booktitle = {CoCo@NIPS},
  year      = {2016},
}

@inproceedings{Craswell2019TrecDl,
  author    = {Nick Craswell and Bhaskar Mitra and Emine Yilmaz and Daniel Campos and Ellen Voorhees},
  title     = {Overview of the {TREC} 2019 Deep Learning Track},
  booktitle = {TREC},
  year      = {2019},
}

@inproceedings{Boteva2016Nfcorpus,
  author    = {Vera Boteva and Demian Gholipour and Artem Sokolov and Stefan Riezler},
  title     = {A Full-Text Learning to Rank Dataset for Medical Information Retrieval},
  booktitle = {Proceedings of the European Conference on Information Retrieval ({ECIR})},
  publisher = {Springer},
  location  = {Padova, Italy},
  year      = 2016,
}

@article{Kwiatkowski2019Nq,
  author  = {Tom Kwiatkowski and Jennimaria Palomaki and Olivia Redfield and Michael Collins and Ankur Parikh and Chris Alberti and Danielle Epstein and Illia Polosukhin and Matthew Kelcey and Jacob Devlin and Kenton Lee and Kristina N. Toutanova and Llion Jones and Ming-Wei Chang and Andrew Dai and Jakob Uszkoreit and Quoc Le and Slav Petrov},
  title   = {{Natural Questions}: a Benchmark for Question Answering Research},
  journal = {Transactions of the Association for Computational Linguistics},
  year    = {2019},
}

@inproceedings{Cohan2020Scidocs,
  author    = {Cohan, Arman and Feldman, Sergey and Beltagy, Iz and Downey, Doug and Weld, Daniel},
  title     = {{SPECTER}: Document-level Representation Learning using Citation-informed Transformers},
  booktitle = {Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics},
  publisher = {Association for Computational Linguistics},
  address   = {Online},
  month     = jul,
  year      = {2020},
  pages     = {2270--2282},
  doi       = {10.18653/v1/2020.acl-main.207},
  url       = {https://www.aclweb.org/anthology/2020.acl-main.207},
}

@inproceedings{Wadden2020Scifact,
  author    = {Wadden, David and Lin, Shanchuan and Lo, Kyle and Wang, Lucy Lu and van Zuylen, Madeleine and Cohan, Arman and Hajishirzi, Hannaneh},
  title     = {Fact or Fiction: Verifying Scientific Claims},
  booktitle = {Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP)},
  publisher = {Association for Computational Linguistics},
  address   = {Online},
  month     = nov,
  year      = {2020},
  pages     = {7534--7550},
  doi       = {10.18653/v1/2020.emnlp-main.609},
  url       = {https://www.aclweb.org/anthology/2020.emnlp-main.609},
}

@article{Wang2020Cord19,
  author  = {Lucy Lu Wang and Kyle Lo and Yoganand Chandrasekhar and Russell Reas and Jiangjiang Yang and Darrin Eide and K. Funk and Rodney Michael Kinney and Ziyang Liu and W. Merrill and P. Mooney and D. Murdick and Devvret Rishi and Jerry Sheehan and Zhihong Shen and B. Stilson and A. Wade and K. Wang and Christopher Wilhelm and Boya Xie and D. Raymond and Daniel S. Weld and Oren Etzioni and Sebastian Kohlmeier},
  title   = {{CORD-19}: The {Covid-19} Open Research Dataset},
  journal = {ArXiv},
  volume  = {abs/2004.10706},
  year    = {2020},
}

@article{Voorhees2020TrecCovid,
  author  = {Ellen Voorhees and Tasmeer Alam and Steven Bedrick and Dina Demner-Fushman and William Hersh and Kyle Lo and Kirk Roberts and Ian Soboroff and Lucy Lu Wang},
  title   = {{TREC-COVID}: Constructing a Pandemic Information Retrieval Test Collection},
  journal = {ArXiv},
  volume  = {abs/2005.04474},
  year    = {2020},
}

% Short-form duplicate of Bondarenko2020Touche; the key is kept so existing citations resolve.
@inproceedings{Bondarenko2020Tuche,
  author    = {Alexander Bondarenko and Maik Fr{\"o}be and Meriem Beloucif and Lukas Gienapp and Yamen Ajjour and Alexander Panchenko and Chris Biemann and Benno Stein and Henning Wachsmuth and Martin Potthast and Matthias Hagen},
  title     = {Overview of {Touch{\'e}} 2020: Argument Retrieval},
  booktitle = {CLEF},
  year      = {2020},
}

@inproceedings{Hoogeveen2015CqaDupStack,
  author    = {Doris Hoogeveen and Karin M. Verspoor and Timothy Baldwin},
  title     = {{CQADupStack}: A Benchmark Data Set for Community Question-Answering Research},
  booktitle = {Proceedings of the 20th Australasian Document Computing Symposium},
  year      = {2015},
}

@misc{Dietz2017Car,
  author = {Laura Dietz and Ben Gamari},
  title  = {{TREC CAR}: A Data Set for Complex Answer Retrieval},
  year   = {2017},
  note   = {Version 1.5},
  url    = {http://trec-car.cs.unh.edu},
}

@inproceedings{Dietz2017TrecCar,
  author    = {Dietz, Laura and Verma, Manisha and Radlinski, Filip and Craswell, Nick},
  title     = {{TREC} Complex Answer Retrieval Overview},
  booktitle = {TREC},
  year      = {2017},
}

@inproceedings{Nanni2017BenchmarkCar,
  author    = {Nanni, Federico and Mitra, Bhaskar and Magnusson, Matt and Dietz, Laura},
  title     = {Benchmark for complex answer retrieval},
  booktitle = {ICTIR},
  year      = {2017},
}

@inproceedings{Roberts2017TrecPm,
  author    = {Kirk Roberts and Dina Demner-Fushman and Ellen Voorhees and William R. Hersh and Steven Bedrick and Alexander J. Lazar and Shubham Pant},
  title     = {Overview of the {TREC} 2017 Precision Medicine Track},
  booktitle = {TREC},
  year      = {2017},
}

@inproceedings{Roberts2018TrecPm,
  author    = {Kirk Roberts and Dina Demner-Fushman and Ellen Voorhees and William R. Hersh and Steven Bedrick and Alexander J. Lazar},
  title     = {Overview of the {TREC} 2018 Precision Medicine Track},
  booktitle = {TREC},
  year      = {2018},
}

@inproceedings{Roberts2019TrecPm,
  author    = {Kirk Roberts and Dina Demner-Fushman and Ellen Voorhees and William R. Hersh and Steven Bedrick and Alexander J. Lazar and Shubham Pant and Funda Meric-Bernstam},
  title     = {Overview of the {TREC} 2019 Precision Medicine Track},
  booktitle = {TREC},
  year      = {2019},
}

@inproceedings{Sun2020Clirmatrix,
  author    = {Sun, Shuo and Duh, Kevin},
  title     = {{CLIRM}atrix: A massively large collection of bilingual and multilingual datasets for Cross-Lingual Information Retrieval},
  booktitle = {Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP)},
  publisher = {Association for Computational Linguistics},
  address   = {Online},
  month     = nov,
  year      = {2020},
  pages     = {4160--4170},
  doi       = {10.18653/v1/2020.emnlp-main.340},
  url       = {https://www.aclweb.org/anthology/2020.emnlp-main.340},
}

@inproceedings{Clarke2009TrecWeb,
  author    = {Charles L. A. Clarke and Nick Craswell and Ian Soboroff},
  title     = {Overview of the {TREC} 2009 Web Track},
  booktitle = {TREC},
  year      = {2009},
}

@inproceedings{Clarke2010TrecWeb,
  author    = {Charles L. A. Clarke and Nick Craswell and Ian Soboroff and Gordon V. Cormack},
  title     = {Overview of the {TREC} 2010 Web Track},
  booktitle = {TREC},
  year      = {2010},
}

@inproceedings{Clarke2011TrecWeb,
  author    = {Charles L. A. Clarke and Nick Craswell and Ian Soboroff and Ellen M. Voorhees},
  title     = {Overview of the {TREC} 2011 Web Track},
  booktitle = {TREC},
  year      = {2011},
}

@inproceedings{Clarke2012TrecWeb,
  author    = {Charles L. A. Clarke and Nick Craswell and Ellen M. Voorhees},
  title     = {Overview of the {TREC} 2012 Web Track},
  booktitle = {TREC},
  year      = {2012},
}

@inproceedings{Carterette2009MQ,
  author    = {Ben Carterette and Virgil Pavlu and Hui Fang and Evangelos Kanoulas},
  title     = {Million Query Track 2009 Overview},
  booktitle = {TREC},
  year      = {2009},
}

@inproceedings{Zuccon2016ClefEhealth,
  author    = {Guido Zuccon and Joao Palotti and Lorraine Goeuriot and Liadh Kelly and Mihai Lupu and Pavel Pecina and Henning M{\"u}ller and Julie Budaher and Anthony Deacon},
  title     = {The {IR} Task at the {CLEF} {eHealth} Evaluation Lab 2016: User-centred Health Information Retrieval},
  booktitle = {CLEF},
  year      = {2016},
}

% "Jimmy" is a single-word author name in this entry; it is braced so tools treat it as one indivisible name.
@inproceedings{Palotti2017ClefEhealth,
  author    = {Joao Palotti and Guido Zuccon and {Jimmy} and Pavel Pecina and Mihai Lupu and Lorraine Goeuriot and Liadh Kelly and Allan Hanbury},
  title     = {{CLEF} 2017 Task Overview: The {IR} Task at the {eHealth} Evaluation Lab - Evaluating Retrieval Methods for Consumer Health Search},
  booktitle = {CLEF},
  year      = {2017},
}

@inproceedings{Abualsaud2019TrecDecision,
  author    = {Mustafa Abualsaud and Christina Lioma and Maria Maistro and Mark D. Smucker and Guido Zuccon},
  title     = {Overview of the {TREC} 2019 Decision Track},
  booktitle = {TREC},
  year      = {2019},
}

@inproceedings{Mao2018OWww2,
  author    = {Jiaxin Mao and Tetsuya Sakai and Cheng Luo and Peng Xiao and Yiqun Liu and Zhicheng Dou},
  title     = {Overview of the {NTCIR-14} {We Want Web} Task},
  booktitle = {NTCIR},
  year      = {2018},
}

@inproceedings{Luo2017Www1,
  author    = {Cheng Luo and Tetsuya Sakai and Yiqun Liu and Zhicheng Dou and Chenyan Xiong and Jingfang Xu},
  title     = {Overview of the {NTCIR-13} {We Want Web} Task},
  booktitle = {NTCIR},
  year      = {2017},
}

@inproceedings{CollinsThompson2014TrecWeb,
  author    = {Kevyn Collins-Thompson and Craig Macdonald and Paul Bennett and Fernando Diaz and Ellen M. Voorhees},
  title     = {{TREC} 2014 Web Track Overview},
  booktitle = {TREC},
  year      = {2014},
}

@inproceedings{CollinsThompson2013TrecWeb,
  author    = {Kevyn Collins-Thompson and Paul Bennett and Fernando Diaz and Charles L. A. Clarke and Ellen M. Voorhees},
  title     = {{TREC} 2013 Web Track Overview},
  booktitle = {TREC},
  year      = {2013},
}

@article{Husain2019CodeSearchNet,
  author  = {Hamel Husain and Ho-Hsiang Wu and Tiferet Gazit and Miltiadis Allamanis and Marc Brockschmidt},
  title   = {{CodeSearchNet} Challenge: Evaluating the State of Semantic Code Search},
  journal = {ArXiv},
  volume  = {abs/1909.09436},
  year    = {2019},
}

@misc{Karpukhin2020Dpr,
  author        = {Vladimir Karpukhin and Barlas O{\u{g}}uz and Sewon Min and Patrick Lewis and Ledell Wu and Sergey Edunov and Danqi Chen and Wen-tau Yih},
  title         = {Dense Passage Retrieval for Open-Domain Question Answering},
  year          = {2020},
  eprint        = {2004.04906},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
}

@inproceedings{Joshi2017TriviaQA,
  author    = {Mandar Joshi and Eunsol Choi and Daniel S. Weld and Luke Zettlemoyer},
  title     = {{TriviaQA}: A Large Scale Distantly Supervised Challenge Dataset for Reading Comprehension},
  booktitle = {ACL},
  year      = {2017},
}

@inproceedings{Craswell2002TrecWeb,
  author    = {Nick Craswell and David Hawking},
  title     = {Overview of the {TREC-2002} Web Track},
  booktitle = {TREC},
  year      = {2002},
}

@inproceedings{Craswell2003TrecWeb,
  author    = {Nick Craswell and David Hawking and Ross Wilkinson and Mingfang Wu},
  title     = {Overview of the {TREC} 2003 Web Track},
  booktitle = {TREC},
  year      = {2003},
}

@inproceedings{Craswell2004TrecWeb,
  author    = {Nick Craswell and David Hawking},
  title     = {Overview of the {TREC-2004} Web Track},
  booktitle = {TREC},
  year      = {2004},
}

@inproceedings{Clarke2004TrecTerabyte,
  author    = {Charles Clarke and Nick Craswell and Ian Soboroff},
  title     = {Overview of the {TREC} 2004 Terabyte Track},
  booktitle = {TREC},
  year      = {2004},
}

@inproceedings{Clarke2005TrecTerabyte,
  author    = {Charles L. A. Clarke and Falk Scholer and Ian Soboroff},
  title     = {The {TREC} 2005 Terabyte Track},
  booktitle = {TREC},
  year      = {2005},
}

@inproceedings{Buttcher2006TrecTerabyte,
  author    = {Stefan B{\"u}ttcher and Charles L. A. Clarke and Ian Soboroff},
  title     = {The {TREC} 2006 Terabyte Track},
  booktitle = {TREC},
  year      = {2006},
}

% The key is spelled "Allen" although the first author is James Allan; the key is left as is so existing citations resolve.
@inproceedings{Allen2007MQ,
  author    = {James Allan and Ben Carterette and Javed A. Aslam and Virgil Pavlu and Blagovest Dachev and Evangelos Kanoulas},
  title     = {Million Query Track 2007 Overview},
  booktitle = {TREC},
  year      = {2007},
}

% The key is spelled "Allen" although the first author is James Allan; the key is left as is so existing citations resolve.
@inproceedings{Allen2008MQ,
  author    = {James Allan and Javed A. Aslam and Ben Carterette and Virgil Pavlu and Evangelos Kanoulas},
  title     = {Million Query Track 2008 Overview},
  booktitle = {TREC},
  year      = {2008},
}

@inproceedings{Hersh2006TrecGenomics,
  author    = {William Hersh and Aaron M. Cohen and Phoebe Roberts and Hari Krishna Rekapalli},
  title     = {{TREC} 2006 Genomics Track Overview},
  booktitle = {TREC},
  year      = {2006},
}

@inproceedings{Hersh2007TrecGenomics,
  author    = {William Hersh and Aaron Cohen and Lynn Ruslen and Phoebe Roberts},
  title     = {{TREC} 2007 Genomics Track Overview},
  booktitle = {TREC},
  year      = {2007},
}

% NOTE(review): surname aligned with the "Bhupatiraju" spelling used in Hersh2005TrecGenomics; confirm against the paper.
@inproceedings{Hersh2004TrecGenomics,
  author    = {William R. Hersh and Ravi Teja Bhupatiraju and Laura Ross and Phoebe Johnson and Aaron M. Cohen and Dale F. Kraemer},
  title     = {{TREC} 2004 Genomics Track Overview},
  booktitle = {TREC},
  year      = {2004},
}

@inproceedings{Hersh2005TrecGenomics,
  author    = {William Hersh and Aaron Cohen and Jianji Yang and Ravi Teja Bhupatiraju and Phoebe Roberts and Marti Hearst},
  title     = {{TREC} 2005 Genomics Track Overview},
  booktitle = {TREC},
  year      = {2005},
}

@article{Craswell2020Orcas,
  author  = {Craswell, Nick and Campos, Daniel and Mitra, Bhaskar and Yilmaz, Emine and Billerbeck, Bodo},
  title   = {{ORCAS}: 18 Million Clicked Query-Document Pairs for Analyzing Search},
  journal = {arXiv preprint arXiv:2006.05324},
  year    = {2020},
}

@inproceedings{Craswell2020TrecDl,
  author    = {Nick Craswell and Bhaskar Mitra and Emine Yilmaz and Daniel Campos},
  title     = {Overview of the {TREC} 2020 Deep Learning Track},
  booktitle = {TREC},
  year      = {2020},
}

@article{Mackie2021DlHard,
  author  = {Iain Mackie and Jeffrey Dalton and Andrew Yates},
  title   = {How Deep is your Learning: the {DL-HARD} Annotated Deep Learning Dataset},
  journal = {ArXiv},
  volume  = {abs/2105.07975},
  year    = {2021},
}

@inproceedings{MacAvaney2020MedMarco,
  author    = {MacAvaney, Sean and Cohan, Arman and Goharian, Nazli},
  title     = {{SLEDGE-Zero}: A Zero-Shot Baseline for {COVID-19} Literature Search},
  booktitle = {EMNLP},
  year      = {2020},
}

% Catalogued like the other Linguistic Data Consortium corpora in this file (misc + publisher + url).
% NOTE(review): the previous volume/number/pages values looked like scraper artefacts and were dropped; confirm the catalog id.
@misc{Sandhaus2008Nyt,
  author    = {Sandhaus, Evan},
  title     = {The {New York Times} Annotated Corpus},
  publisher = {Linguistic Data Consortium},
  year      = {2008},
  url       = {https://catalog.ldc.upenn.edu/LDC2008T19},
}

@inproceedings{Allan2017TrecCore,
  author    = {James Allan and Donna Harman and Evangelos Kanoulas and Dan Li and Christophe Van Gysel and Ellen Voorhees},
  title     = {{TREC} 2017 Common Core Track Overview},
  booktitle = {TREC},
  year      = {2017},
}

@inproceedings{MacAvaney2019Wksup,
  title     = {Content-Based Weak Supervision for Ad-Hoc Re-Ranking},
  author    = {MacAvaney, Sean and Yates, Andrew and Hui, Kai and Frieder, Ophir},
  year      = {2019},
  booktitle = {SIGIR},
}

@inproceedings{Simpson2014TrecCds,
  author    = {Matthew S. Simpson and Ellen M. Voorhees and William Hersh},
  title     = {Overview of the {TREC} 2014 Clinical Decision Support Track},
  booktitle = {TREC},
  year      = {2014},
}

@inproceedings{Roberts2015TrecCds,
  author    = {Kirk Roberts and Matthew S. Simpson and Ellen Voorhees and William R. Hersh},
  title     = {Overview of the {TREC} 2015 Clinical Decision Support Track},
  booktitle = {TREC},
  year      = {2015},
}

@inproceedings{Roberts2016TrecCds,
  author    = {Kirk Roberts and Dina Demner-Fushman and Ellen M. Voorhees and William R. Hersh},
  title     = {Overview of the {TREC} 2016 Clinical Decision Support Track},
  booktitle = {TREC},
  year      = {2016},
}

@misc{Graff2001Arabic,
  author    = {Graff, David and Walker, Kevin},
  title     = {{Arabic} Newswire Part 1 {LDC2001T55}},
  publisher = {Linguistic Data Consortium},
  year      = {2001},
  url       = {https://catalog.ldc.upenn.edu/LDC2001T55},
}

@inproceedings{Gey2001Arabic,
  author    = {Fredric Gey and Douglas Oard},
  title     = {The {TREC-2001} Cross-Language Information Retrieval Track: Searching {Arabic} using {English}, {French} or {Arabic} Queries},
  booktitle = {TREC},
  year      = {2001},
}

@inproceedings{Gey2002Arabic,
  author    = {Fredric Gey and Douglas Oard},
  title     = {The {TREC-2002} {Arabic/English} {CLIR} Track},
  booktitle = {TREC},
  year      = {2002},
}

@misc{Rogers2000Mandarin,
  author    = {Rogers, Willie},
  title     = {{TREC} {Mandarin} {LDC2000T52}},
  publisher = {Linguistic Data Consortium},
  year      = {2000},
  url       = {https://catalog.ldc.upenn.edu/LDC2000T52},
}

% NOTE(review): the key says Harman 1997, but the fields list Smeaton and Wilkinson with year 1996; confirm which is intended.
@inproceedings{Harman1997Chinese,
  author    = {Alan Smeaton and Ross Wilkinson},
  title     = {{Spanish} and {Chinese} Document Retrieval in {TREC-5}},
  booktitle = {TREC},
  year      = {1996},
}

@inproceedings{Wilkinson1998Chinese,
  author    = {Ross Wilkinson},
  title     = {{Chinese} Document Retrieval at {TREC-6}},
  booktitle = {TREC},
  year      = {1997},
}

@inproceedings{Voorhees2004Robust,
  author    = {Ellen Voorhees},
  title     = {Overview of the {TREC} 2004 Robust Retrieval Track},
  booktitle = {TREC},
  year      = {2004},
}

@inproceedings{Huston2014ACO,
  author    = {Samuel Huston and W. Bruce Croft},
  title     = {A Comparison of Retrieval Models using Term Dependencies},
  booktitle = {CIKM},
  year      = {2014},
}

@misc{Rogers2000Spanish,
  author    = {Rogers, Willie},
  title     = {{TREC} {Spanish} {LDC2000T51}},
  publisher = {Linguistic Data Consortium},
  year      = {2000},
  url       = {https://catalog.ldc.upenn.edu/LDC2000T51},
}

@inproceedings{Harman1994Trec3,
  author    = {Donna Harman},
  title     = {Overview of the Third {Text REtrieval Conference} ({TREC-3})},
  booktitle = {TREC},
  year      = {1994},
}

@inproceedings{Harman1995Trec4,
  author    = {Donna Harman},
  title     = {Overview of the Fourth {Text REtrieval Conference} ({TREC-4})},
  booktitle = {TREC},
  year      = {1995},
}

@inproceedings{Rekabsaz2021TripClick,
  author    = {Navid Rekabsaz and Oleg Lesota and Markus Schedl and Jon Brassey and Carsten Eickhoff},
  title     = {{TripClick}: The Log Files of a Large Health Web Search Engine},
  booktitle = {SIGIR},
  year      = {2021},
}

@inproceedings{Hofstaetter2022TripClick,
  author    = {Sebastian Hofst{\"a}tter and Sophia Althammer and Mete Sertkan and Allan Hanbury},
  title     = {Establishing Strong Baselines for {TripClick} Health Retrieval},
  booktitle = {ECIR},
  year      = {2022},
}

@inproceedings{Sequiera2017TweetsIA,
  author    = {Royal Sequiera and Jimmy Lin},
  title     = {Finally, a Downloadable Test Collection of Tweets},
  booktitle = {SIGIR},
  year      = {2017},
}

@inproceedings{Lin2013Microblog,
  author    = {Jimmy Lin and Miles Efron},
  title     = {Overview of the {TREC-2013} Microblog Track},
  booktitle = {TREC},
  year      = {2013},
}

@inproceedings{Lin2014Microblog,
  author    = {Jimmy Lin and Miles Efron and Yulu Wang and Garrick Sherman},
  title     = {Overview of the {TREC-2014} Microblog Track},
  booktitle = {TREC},
  year      = {2014},
}

@inproceedings{Soboroff2018News,
  author    = {Ian Soboroff and Shudong Huang and Donna Harman},
  title     = {{TREC} 2018 News Track Overview},
  booktitle = {TREC},
  year      = {2018},
}

@inproceedings{Soboroff2019News,
  author    = {Ian Soboroff and Shudong Huang and Donna Harman},
  title     = {{TREC} 2019 News Track Overview},
  booktitle = {TREC},
  year      = {2019},
}

@inproceedings{Frej2020Wikir,
  author    = {Jibril Frej and Didier Schwab and Jean-Pierre Chevallet},
  title     = {{WIKIR}: A {Python} toolkit for building a large-scale {Wikipedia-based} {English} Information Retrieval Dataset},
  booktitle = {LREC},
  year      = {2020},
}

@inproceedings{Frej2020MlWikir,
  author    = {Jibril Frej and Didier Schwab and Jean-Pierre Chevallet},
  title     = {{MLWIKIR}: A {Python} Toolkit for Building Large-scale {Wikipedia-based} Information Retrieval Datasets in {Chinese}, {English}, {French}, {Italian}, {Japanese}, {Spanish} and More},
  booktitle = {CIRCLE},
  year      = {2020},
}

@article{Zhang2021MrTyDi,
  author  = {Xinyu Zhang and Xueguang Ma and Peng Shi and Jimmy Lin},
  title   = {{Mr. TyDi}: A Multi-lingual Benchmark for Dense Retrieval},
  journal = {arXiv:2108.08787},
  year    = {2021}
}

@article{Clark2020TyDiQa,
  author  = {Jonathan H. Clark and Eunsol Choi and Michael Collins and Dan Garrette and Tom Kwiatkowski and Vitaly Nikolaev and Jennimaria Palomaki},
  title   = {{TyDi QA}: A Benchmark for Information-Seeking Question Answering in Typologically Diverse Languages},
  journal = {Transactions of the Association for Computational Linguistics},
  year    = {2020},
}

@article{Bonifacio2021MMarco,
  author  = {Luiz Henrique Bonifacio and Israel Campiotti and Roberto Lotufo and Rodrigo Nogueira},
  title   = {{mMARCO}: A Multilingual Version of {MS MARCO} Passage Ranking Dataset},
  journal = {arXiv:2108.13897},
  year    = {2021},
}

@inproceedings{Pass2006Picture,
  author    = {Pass, Greg and Chowdhury, Abdur and Torgeson, Cayley},
  title     = {A picture of search},
  booktitle = {InfoScale},
  year      = {2006},
}

@inproceedings{MacAvaney2022Reproducing,
  author    = {MacAvaney, Sean and Macdonald, Craig and Ounis, Iadh},
  title     = {Reproducing Personalised Session Search over the {AOL} Query Log},
  booktitle = {ECIR},
  year      = {2022},
}

@inproceedings{Wachsmuth2017Argument,
  author    = {Henning Wachsmuth and Martin Potthast and Khalid Al-Khatib and Yamen Ajjour and Jana Puschmann and Jiani Qu and Jonas Dorsch and Viorel Morari and Janek Bevendorff and Benno Stein},
  title     = {Building an Argument Search Engine for the {Web}},
  booktitle = {4th Workshop on Argument Mining (ArgMining 2017) at EMNLP},
  editor    = {Kevin Ashley and Claire Cardie and Nancy Green and Iryna Gurevych and Ivan Habernal and Diane Litman and Georgios Petasis and Chris Reed and Noam Slonim and Vern Walker},
  publisher = {Association for Computational Linguistics},
  site      = {Copenhagen, Denmark},
  month     = sep,
  year      = 2017,
  pages     = {49--59},
  url       = {https://www.aclweb.org/anthology/W17-5106},
}

@inproceedings{Ajjour2019Acquisition,
  author    = {Yamen Ajjour and Henning Wachsmuth and Johannes Kiesel and Martin Potthast and Matthias Hagen and Benno Stein},
  title     = {Data Acquisition for Argument Search: The {args.me} corpus},
  booktitle = {42nd German Conference on Artificial Intelligence (KI 2019)},
  editor    = {Christoph Benzm{\"u}ller and Heiner Stuckenschmidt},
  publisher = {Springer},
  address   = {Berlin Heidelberg New York},
  site      = {Kassel, Germany},
  month     = sep,
  year      = 2019,
  pages     = {48--59},
  doi       = {10.1007/978-3-030-30179-8\_4},
}

@inproceedings{Bondarenko2020Touche,
  author    = {Alexander Bondarenko and Maik Fr{\"o}be and Meriem Beloucif and Lukas Gienapp and Yamen Ajjour and Alexander Panchenko and Chris Biemann and Benno Stein and Henning Wachsmuth and Martin Potthast and Matthias Hagen},
  title     = {Overview of {Touch{\'e}} 2020: Argument Retrieval},
  booktitle = {Experimental IR Meets Multilinguality, Multimodality, and Interaction. 11th International Conference of the CLEF Association (CLEF 2020)},
  editor    = {Avi Arampatzis and Evangelos Kanoulas and Theodora Tsikrika and Stefanos Vrochidis and Hideo Joho and Christina Lioma and Carsten Eickhoff and Aur{\'e}lie N{\'e}v{\'e}ol and Linda Cappellato and Nicola Ferro},
  series    = {Lecture Notes in Computer Science},
  volume    = 12260,
  publisher = {Springer},
  address   = {Berlin Heidelberg New York},
  site      = {Thessaloniki, Greece},
  month     = sep,
  year      = 2020,
  pages     = {384--395},
  doi       = {10.1007/978-3-030-58219-7\_26},
  url       = {https://link.springer.com/chapter/10.1007/978-3-030-58219-7_26},
}

@inproceedings{Wachsmuth2017Quality,
  author    = {Henning Wachsmuth and Nona Naderi and Yufang Hou and Yonatan Bilu and Vinodkumar Prabhakaran and Tim Alberdingk Thijm and Graeme Hirst and Benno Stein},
  title     = {Computational Argumentation Quality Assessment in Natural Language},
  booktitle = {15th Conference of the European Chapter of the Association for Computational Linguistics (EACL 2017)},
  editor    = {Phil Blunsom and Alexander Koller and Mirella Lapata},
  site      = {Valencia, Spain},
  month     = apr,
  year      = 2017,
  pages     = {176--187},
  url       = {http://aclweb.org/anthology/E17-1017},
}

@inproceedings{Braunstain2016Support,
  title     = {Supporting Human Answers for Advice-Seeking Questions in {CQA} Sites},
  author    = {Liora Braunstain and Oren Kurland and David Carmel and Idan Szpektor and Anna Shtok},
  booktitle = {Advances in Information Retrieval - 38th European Conference on {IR} Research, {ECIR} 2016, Padua, Italy, March 20-23, 2016. Proceedings},
  editor    = {Nicola Ferro and Fabio Crestani and Marie{-}Francine Moens and Josiane Mothe and Fabrizio Silvestri and Giorgio Maria Di Nunzio and Claudia Hauff and Gianmaria Silvello},
  publisher = {Springer},
  series    = {Lecture Notes in Computer Science},
  volume    = {9626},
  year      = {2016},
  pages     = {129--141},
  doi       = {10.1007/978-3-319-30671-1\_10}
}

@inproceedings{Rafalak2014Credibility,
  title     = {Incredible: is (almost) all web content trustworthy? analysis of psychological factors related to website credibility evaluation},
  author    = {Maria Rafalak and Katarzyna Abramczuk and Adam Wierzbicki},
  booktitle = {23rd International World Wide Web Conference, {WWW} '14, Seoul, Republic of Korea, April 7-11, 2014, Companion Volume},
  editor    = {Chin{-}Wan Chung and Andrei Z. Broder and Kyuseok Shim and Torsten Suel},
  publisher = {{ACM}},
  year      = {2014},
  pages     = {1117--1122},
  doi       = {10.1145/2567948.2578997}
}

@inproceedings{Bondarenko2021Touche,
  author    = {Alexander Bondarenko and Lukas Gienapp and Maik Fr{\"o}be and Meriem Beloucif and Yamen Ajjour and Alexander Panchenko and Chris Biemann and Benno Stein and Henning Wachsmuth and Martin Potthast and Matthias Hagen},
  title     = {Overview of {Touch{\'e}} 2021: Argument Retrieval},
  booktitle = {Experimental IR Meets Multilinguality, Multimodality, and Interaction. 12th International Conference of the CLEF Association (CLEF 2021)},
  editor    = {{K. Sel{\c{c}}uk} Candan and Bogdan Ionescu and Lorraine Goeuriot and Henning M{\"u}ller and Alexis Joly and Maria Maistro and Florina Piroi and Guglielmo Faggioli and Nicola Ferro},
  series    = {Lecture Notes in Computer Science},
  volume    = 12880,
  publisher = {Springer},
  address   = {Berlin Heidelberg New York},
  site      = {Bucharest, Romania},
  month     = sep,
  year      = 2021,
  pages     = {450--467},
  doi       = {10.1007/978-3-030-85251-1\_28},
  url       = {https://link.springer.com/chapter/10.1007/978-3-030-85251-1_28},
}

@inproceedings{Froebe2022Anchors,
  author    = {Maik Fr{\"o}be and Sebastian G{\"u}nther and Maximilian Probst and Martin Potthast and Matthias Hagen},
  title     = {The Power of Anchor Text in the Neural Retrieval Era},
  booktitle = {Advances in Information Retrieval. 44th European Conference on IR Research (ECIR 2022)},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer},
  address   = {Berlin Heidelberg New York},
  site      = {Stavanger, Norway},
  month     = apr,
  year      = 2022,
}

@article{Santhanam2021ColBERTv2,
  author  = {Keshav Santhanam and Omar Khattab and Jon Saad-Falcon and Christopher Potts and Matei Zaharia},
  title   = {{ColBERTv2}: Effective and Efficient Retrieval via Lightweight Late Interaction},
  journal = {arXiv preprint arXiv:2112.01488},
  year    = {2021},
  url     = {https://arxiv.org/abs/2112.01488},
}

@inproceedings{petroni-etal-2021-kilt,
  author    = {Petroni, Fabio and Piktus, Aleksandra and Fan, Angela and Lewis, Patrick and Yazdani, Majid and De Cao, Nicola and Thorne, James and Jernite, Yacine and Karpukhin, Vladimir and Maillard, Jean and Plachouras, Vassilis and Rockt{\"a}schel, Tim and Riedel, Sebastian},
  title     = {{KILT}: a Benchmark for Knowledge Intensive Language Tasks},
  booktitle = {Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies},
  publisher = {Association for Computational Linguistics},
  address   = {Online},
  month     = jun,
  year      = {2021},
  pages     = {2523--2544},
  doi       = {10.18653/v1/2021.naacl-main.200},
  url       = {https://aclanthology.org/2021.naacl-main.200},
}

@misc{Voorhees1996Disks45,
  author    = {Ellen M. Voorhees},
  title     = {{NIST} {TREC} Disks 4 and 5: Retrieval Test Collections Document Set},
  publisher = {National Institute of Standards and Technology},
  year      = {1996},
  doi       = {10.18434/t47g6m},
}

@inproceedings{Voorhees1998Trec7,
  author    = {Ellen M. Voorhees and Donna Harman},
  title     = {Overview of the Seventh {Text Retrieval Conference} ({TREC-7})},
  booktitle = {TREC},
  year      = {1998},
}

@inproceedings{Voorhees1999Trec8,
  author    = {Ellen M. Voorhees and Donna Harman},
  title     = {Overview of the Eighth {Text Retrieval Conference} ({TREC-8})},
  booktitle = {TREC},
  year      = {1999},
}

% Cross-lingual learning-to-rank paper (NAACL-HLT 2018, short papers volume).
@inproceedings{sasaki-etal-2018-cross,
    author    = {Sasaki, Shota and Sun, Shuo and Schamoni, Shigehiko and Duh, Kevin and Inui, Kentaro},
    title     = {Cross-Lingual Learning-to-Rank with Shared Representations},
    booktitle = {Proceedings of the 2018 Conference of the North {A}merican Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 2 (Short Papers)},
    publisher = {Association for Computational Linguistics},
    address   = {New Orleans, Louisiana},
    month     = jun,
    year      = {2018},
    pages     = {458--463},
    doi       = {10.18653/v1/N18-2073},
    url       = {https://aclanthology.org/N18-2073}
}

% CODEC document and entity collection paper (SIGIR 2022).
@inproceedings{mackie2022codec,
   title={CODEC: Complex Document and Entity Collection},
   author={Mackie, Iain and Owoicho, Paul and Gemmell, Carlos and Fischer, Sophie and MacAvaney, Sean and Dalton, Jeffrey},
   booktitle={Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval},
   year={2022}
}

% Istella22 learning-to-rank dataset paper (SIGIR 2022).
% Authors are joined with " and ", the only name separator BibTeX recognises.
@inproceedings{Dato2022Istella,
  title={The Istella22 Dataset: Bridging Traditional and Neural Learning to Rank Evaluation},
  author={Domenico Dato and Sean MacAvaney and Franco Maria Nardini and Raffaele Perego and Nicola Tonellotto},
  booktitle={Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval},
  year={2022}
}

% Overview paper of the Touche 2022 argument retrieval lab (CLEF 2022, Springer LNCS).
@inproceedings{Bondarenko2022Touche,
  author    = {Alexander Bondarenko and Maik Fr{\"o}be and Johannes Kiesel and Shahbaz Syed and Timon Gurcke and Meriem Beloucif and Alexander Panchenko and Chris Biemann and Benno Stein and Henning Wachsmuth and Martin Potthast and Matthias Hagen},
  title     = {{Overview of Touch{\'e} 2022: Argument Retrieval}},
  booktitle = {Experimental IR Meets Multilinguality, Multimodality, and Interaction. 13th International Conference of the CLEF Association (CLEF 2022)},
  editor    = {Alberto Barr{\'o}n-Cede{\~n}o and Giovanni Da San Martino and Mirko Degli Esposti and Fabrizio Sebastiani and Craig Macdonald and Gabriella Pasi and Allan Hanbury and Martin Potthast and Guglielmo Faggioli and Nicola Ferro},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer},
  address   = {Berlin Heidelberg New York},
  site      = {Bologna, Italy},
  month     = sep,
  year      = {2022},
  numpages  = {29}
}

% Image retrieval for arguments paper (ArgMining 2021 workshop at EMNLP).
% The page range uses the double-hyphen form that BibTeX styles expect.
@inproceedings{Kiesel2021Image,
  author = {Johannes Kiesel and Nico Reichenbach and Benno Stein and Martin Potthast},
  booktitle = {8th Workshop on Argument Mining (ArgMining 2021) at EMNLP},
  doi = {10.18653/v1/2021.argmining-1.4},
  editor = {Khalid Al-Khatib and Yufang Hou and Manfred Stede},
  month = nov,
  pages = {36--45},
  publisher = {Association for Computational Linguistics},
  site = {Punta Cana, Dominican Republic},
  title = {{Image Retrieval for Arguments Using Stance-Aware Query Expansion}},
  url = {https://aclanthology.org/2021.argmining-1.4/},
  year = 2021
}

% SemEval-2021 Task 6 overview paper (persuasion techniques in texts and images).
@inproceedings{Dimitrov2021SemEval,
  title     = "SemEval-2021 Task 6: Detection of Persuasion Techniques in Texts and Images",
  author    = "Dimitar Dimitrov and Bishr Bin Ali and Shaden Shaar and Firoj Alam and Fabrizio Silvestri and Hamed Firooz and Preslav Nakov and Giovanni Da San Martino",
  booktitle = "Proceedings of the 15th International Workshop on Semantic Evaluation, SemEval@ACL/IJCNLP 2021, Virtual Event / Bangkok, Thailand, August 5-6, 2021",
  editor    = "Alexis Palmer and Nathan Schneider and Natalie Schluter and Guy Emerson and Aur{\'{e}}lie Herbelot and Xiaodan Zhu",
  publisher = "Association for Computational Linguistics",
  year      = 2021,
  pages     = "70--98",
  doi       = "10.18653/v1/2021.semeval-1.7"
}

% Image Collector III web image-gathering system paper (WWW 2007).
@inproceedings{Yanai2007Image,
  title     = "Image collector {III:} a web image-gathering system with bag-of-keypoints",
  author    = "Keiji Yanai",
  booktitle = "Proceedings of the 16th International Conference on World Wide Web, {WWW} 2007, Banff, Alberta, Canada, May 8-12, 2007",
  editor    = "Carey L. Williamson and Mary Ellen Zurko and Peter F. Patel{-}Schneider and Prashant J. Shenoy",
  publisher = "{ACM}",
  year      = 2007,
  pages     = "1295--1296",
  doi       = "10.1145/1242572.1242816"
}

% MIRACL multilingual retrieval paper, cited as an arXiv preprint (arXiv:2210.09984).
@article{Zhang2022Miracl,
  author  = "Zhang, Xinyu and
             Thakur, Nandan and
             Ogundepo, Odunayo and
             Kamalloo, Ehsan and
             Alfonso-Hermelo, David and
             Li, Xiaoguang and
             Liu, Qun and
             Rezagholizadeh, Mehdi and
             Lin, Jimmy",
  title   = "Making a MIRACL: Multilingual information retrieval across a continuum of languages",
  journal = "arXiv preprint arXiv:2210.09984",
  year    = 2022
}

% HC4 test collections for ad hoc CLIR (ECIR 2022).
% Typed as inproceedings because the record carries a booktitle and no journal.
@inproceedings{Lawrie2022HC4,
  author = {Dawn Lawrie and James Mayfield and Douglas W. Oard and Eugene Yang},
  title = {HC4: A New Suite of Test Collections for Ad Hoc CLIR},
  booktitle = {{Advances in Information Retrieval. 44th European Conference on IR Research (ECIR 2022)}},
  year = {2022},
  month = apr,
  publisher = {Springer},
  series = {Lecture Notes in Computer Science},
  site = {Stavanger, Norway},
  url = {https://arxiv.org/abs/2201.09992}
}

% BRIGHT benchmark paper (ICLR 2025); record exported from dblp (see biburl / bibsource).
@inproceedings{DBLP:conf/iclr/SuYXSMWLSST0YA025,
  title = {{BRIGHT:} {A} Realistic and Challenging Benchmark for Reasoning-Intensive Retrieval},
  author = {Hongjin Su and Howard Yen and Mengzhou Xia and Weijia Shi and Niklas Muennighoff and Han{-}yu Wang and Haisu Liu and Quan Shi and Zachary S. Siegel and Michael Tang and Ruoxi Sun and Jinsung Yoon and Sercan {\"{O}}. Arik and Danqi Chen and Tao Yu},
  booktitle = {The Thirteenth International Conference on Learning Representations, {ICLR} 2025, Singapore, April 24-28, 2025},
  year = {2025},
  publisher = {OpenReview.net},
  url = {https://openreview.net/forum?id=ykuc5q381b},
  biburl = {https://dblp.org/rec/conf/iclr/SuYXSMWLSST0YA025.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  timestamp = {Thu, 15 May 2025 17:19:05 +0200}
}