Skip to content

Commit cfca710

Browse files
Update pubs.bib
1 parent a74891a commit cfca710

File tree

1 file changed

+20
-0
lines changed

1 file changed

+20
-0
lines changed

pubs.bib

Lines changed: 20 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,22 @@
1+
@inproceedings{quan-etal-2024-verification,
2+
title = "Verification and Refinement of Natural Language Explanations through {LLM}-Symbolic Theorem Proving",
3+
author = "Quan, Xin and
4+
Valentino, Marco and
5+
Dennis, Louise A. and
6+
Freitas, Andre",
7+
editor = "Al-Onaizan, Yaser and
8+
Bansal, Mohit and
9+
Chen, Yun-Nung",
10+
booktitle = "Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing",
11+
month = nov,
12+
year = "2024",
13+
address = "Miami, Florida, USA",
14+
publisher = "Association for Computational Linguistics",
15+
url = "https://aclanthology.org/2024.emnlp-main.172",
16+
pages = "2933--2958",
17+
abstract = "Natural language explanations represent a proxy for evaluating explanation-based and multi-step Natural Language Inference (NLI) models. However, assessing the validity of explanations for NLI is challenging as it typically involves the crowd-sourcing of apposite datasets, a process that is time-consuming and prone to logical errors. To address existing limitations, this paper investigates the verification and refinement of natural language explanations through the integration of Large Language Models (LLMs) and Theorem Provers (TPs). Specifically, we present a neuro-symbolic framework, named Explanation-Refiner, that integrates TPs with LLMs to generate and formalise explanatory sentences and suggest potential inference strategies for NLI. In turn, the TP is employed to provide formal guarantees on the logical validity of the explanations and to generate feedback for subsequent improvements. We demonstrate how Explanation-Refiner can be jointly used to evaluate explanatory reasoning, autoformalisation, and error correction mechanisms of state-of-the-art LLMs as well as to automatically enhance the quality of explanations of variable complexity in different domains.",
18+
}
19+
120
@INPROCEEDINGS{10704818,
221
author={Shaukat, Nabil and Dubey, Shival and Kaddouh, Bilal and Blight, Andy and Mudrich, Lenka and Ribeiro, Pedro and Araujo, Hugo and Richardson, Rob and Dennis, Louise and Cavalcanti, Ana and Mousavi, Mohammad},
322
booktitle={2024 20th IEEE/ASME International Conference on Mechatronic and Embedded Systems and Applications (MESA)},
@@ -6,6 +25,7 @@ @INPROCEEDINGS{10704818
625
volume={},
726
number={},
827
pages={1-7},
28+
note={[<span class="tas_vn">TAS Verifiability Node</span>]},
929
keywords={Mechatronics;Software architecture;Surveillance;Computer architecture;Software;Personnel;Formal specifications;Robots;Testing;Drones;robochart;ros;drone;firefighting;software;robots;trustworthy architecture;trustworthy},
1030
doi={10.1109/MESA61532.2024.10704818}}
1131

0 commit comments

Comments
 (0)