%Aigaion2 BibTeX export from Idiap Publications
%Thursday 17 April 2025 07:32:06 PM

% Shared-task overview paper for the TextGraphs-16 workshop (2022).
% The camelCase name TextGraphs is brace-protected in title and booktitle so
% that sentence-casing bibliography styles do not render it as "Textgraphs".
% The projects field is a non-standard field; standard styles ignore it.
% NOTE(review): pages and publisher are absent from this export - confirm
% against the publisher record at the url below and add them if available.
@INPROCEEDINGS{Valentino_TEXTGRAPHS-16_2022,
         author = {Valentino, Marco and Mendes, Deborah and Thayaparan, Mokanarangan and Freitas, Andre and Ustalov, Dmitry},
       projects = {Idiap},
          title = {{TextGraphs} 2022 Shared Task on Natural Language Premise Selection},
      booktitle = {Proceedings of {TextGraphs-16}: Graph-based Methods for Natural Language Processing},
           year = {2022},
            url = {https://aclanthology.org/2022.textgraphs-1.11},
       abstract = {The Shared Task on Natural Language Premise Selection (NLPS) asks participants to retrieve the set of premises that are most likely to be useful for proving a given mathematical statement from a supporting knowledge base. While previous editions of the TextGraphs shared tasks series targeted multi-hop inference for explanation regeneration in the context of science questions (Thayaparan et al., 2021; Jansen and Ustalov, 2020, 2019), NLPS aims to assess the ability of state-of-the-art approaches to operate on a mixture of natural and mathematical language and model complex multi-hop reasoning dependencies between statements. To this end, this edition of the shared task makes use of a large set of approximately 21k mathematical statements extracted from the PS-ProofWiki dataset (Ferreira and Freitas, 2020a). In this summary paper, we present the results of the 1st edition of the NLPS task, providing a description of the evaluation data, and the participating systems. Additionally, we perform a detailed analysis of the results, evaluating various aspects involved in mathematical language processing and multi-hop inference. The best-performing system achieved a MAP of 15.39, improving the performance of a TF-IDF baseline by approximately 3.0 MAP.}
}