Conference paper in the ICWE 2024 proceedings (Lecture Notes in Computer Science).
Names are stored in "Last, First" form; acronyms are brace-protected so that
sentence-casing bibliography styles keep their capitalisation.
@inproceedings{30643033c2234ee4b52cadd718332541,
  author    = {Zimina, Elizaveta and J{\"a}rvelin, Kalervo and Peltonen, Jaakko and Ranta, Aarne and Nummenmaa, Jyrki},
  title     = {{TraQuLA}: Transparent Question Answering Over {RDF} Through Linguistic Analysis},
  booktitle = {Web Engineering -- 24th International Conference, {ICWE} 2024, Proceedings},
  editor    = {Stefanidis, Kostas and Syst{\"a}, Kari and Matera, Maristella and Heil, Sebastian and Kondylakis, Haridimos and Quintarelli, Elisa},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer},
  year      = {2024},
  pages     = {19--33},
  doi       = {10.1007/978-3-031-62362-2_2},
  isbn      = {978-3-031-62361-5},
  language  = {English},
  keywords  = {Linguistic analysis, Question-answering, RDF, Rule-based},
  abstract  = {Answering complex questions over knowledge graphs has gained popularity recently. Systems based on large language models seem to achieve top performance. However, these models may generate content that looks reasonable but is incorrect. They also lack transparency, making it impossible to exactly explain why a particular answer was generated. To tackle these problems we present the TraQuLA (Transparent QUestion-answering through Linguistic Analysis) system -- a rule-based system developed through linguistic analysis of datasets of complex questions over DBpedia and Wikidata. TraQuLA defines a question{\textquoteright}s type and extracts its semantic component candidates (named entities, properties and class names). For the extraction of properties, whose natural language verbalisations are most diverse, we built an extensive database which matches DBpedia/Wikidata properties to natural language expressions, allowing linguistic variation. TraQuLA generates semantic parses for the components and ranks them by each question{\textquoteright}s structure and morphological features. The ranked parses are then analysed top down according to their patterns, also noting linguistic aspects, until a solution is found and a SPARQL query is produced. TraQuLA outperforms the existing baseline systems on the LC-QuAD 1.0 and competes with ChatGPT-based systems on LC-QuAD 2.0. For the LC-QuAD 1.0 test set, we developed an evaluation approach that accepts multiple ways to answer the questions (some ignored by the dataset) and curated some errors. TraQuLA contains no ``black boxes'' of neural networks or machine learning and makes its answer construction traceable. Users can therefore better rely on them and assess their correctness.},
  note      = {Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Switzerland AG 2024.; International Conference on Web Engineering; Conference date: 17-06-2024 Through 20-06-2024},
}