
<ns0:uwmetadata xmlns:ns0="http://phaidra.univie.ac.at/XML/metadata/V1.0" xmlns:ns1="http://phaidra.univie.ac.at/XML/metadata/lom/V1.0" xmlns:ns10="http://phaidra.univie.ac.at/XML/metadata/provenience/V1.0" xmlns:ns11="http://phaidra.univie.ac.at/XML/metadata/provenience/V1.0/entity" xmlns:ns12="http://phaidra.univie.ac.at/XML/metadata/digitalbook/V1.0" xmlns:ns13="http://phaidra.univie.ac.at/XML/metadata/etheses/V1.0" xmlns:ns2="http://phaidra.univie.ac.at/XML/metadata/extended/V1.0" xmlns:ns3="http://phaidra.univie.ac.at/XML/metadata/lom/V1.0/entity" xmlns:ns4="http://phaidra.univie.ac.at/XML/metadata/lom/V1.0/requirement" xmlns:ns5="http://phaidra.univie.ac.at/XML/metadata/lom/V1.0/educational" xmlns:ns6="http://phaidra.univie.ac.at/XML/metadata/lom/V1.0/annotation" xmlns:ns7="http://phaidra.univie.ac.at/XML/metadata/lom/V1.0/classification" xmlns:ns8="http://phaidra.univie.ac.at/XML/metadata/lom/V1.0/organization" xmlns:ns9="http://phaidra.univie.ac.at/XML/metadata/histkult/V1.0">
  <ns1:general>
    <ns1:identifier>o:8175</ns1:identifier>
    <ns1:title language="en">Scientific QA system with verifiable answers</ns1:title>
    <ns1:language>en</ns1:language>
    <ns1:description language="en">In this paper, we introduce the Verif.ai project, a pioneering open-source scientific question-answering system,
designed to provide answers that are not only referenced
but also automatically vetted and verifiable. The components of the system are (1) an Information Retrieval system
combining semantic and lexical search techniques over scientific papers (PubMed), (2) a Retrieval-Augmented Generation (RAG) module using fine-tuned generative model
(Mistral 7B) and retrieved articles to generate claims with
references to the articles from which it was derived, and
(3) a Verification engine, based on a fine-tuned DeBERTa
and XLM-RoBERTa models on Natural Language Inference
task using SciFACT dataset. The verification engine cross-checks the generated claim and the article from which the
claim was derived, verifying whether there may have been
any hallucinations in generating the claim. By leveraging
the Information Retrieval and RAG modules, Verif.ai excels
in generating factual information from a vast array of scientific sources. At the same time, the Verification engine
rigorously double-checks this output, ensuring its accuracy
and reliability. This dual-stage process plays a crucial role in
acquiring and confirming factual information, significantly
enhancing the information landscape. Our methodology
could significantly enhance scientists’ productivity, concurrently fostering trust in applying generative language models
within scientific domains, where hallucinations and misinformation are unacceptable.</ns1:description>
    <ns2:identifiers>
      <ns2:resource>1552100</ns2:resource>
      <ns2:identifier>978-92-9083-669-8</ns2:identifier>
    </ns2:identifiers>
    <ns2:identifiers>
      <ns2:resource>1552101</ns2:resource>
      <ns2:identifier>2957-4935</ns2:identifier>
    </ns2:identifiers>
    <ns2:identifiers>
      <ns2:resource>1552099</ns2:resource>
      <ns2:identifier>https://doi.org/10.5281/zenodo.13863828</ns2:identifier>
    </ns2:identifiers>
  </ns1:general>
  <ns1:lifecycle>
    <ns1:upload_date>2025-08-28T08:56:52.784Z</ns1:upload_date>
    <ns1:status>44</ns1:status>
    <ns2:peer_reviewed>no</ns2:peer_reviewed>
    <ns1:contribute seq="0">
      <ns1:role>46</ns1:role>
      <ns1:entity seq="0">
        <ns3:firstname>Adela</ns3:firstname>
        <ns3:lastname>Ljajić</ns3:lastname>
        <ns3:institution>Istraživačko-razvojni institut za veštačku inteligenciju Srbije</ns3:institution>
        <ns3:orcid>0000-0001-7326-059X</ns3:orcid>
      </ns1:entity>
    </ns1:contribute>
    <ns1:contribute seq="1">
      <ns1:role>46</ns1:role>
      <ns1:entity seq="0">
        <ns3:firstname>Miloš</ns3:firstname>
        <ns3:lastname>Košprdić</ns3:lastname>
        <ns3:institution>Istraživačko-razvojni institut za veštačku inteligenciju Srbije</ns3:institution>
        <ns3:orcid>0000-0001-6902-3639</ns3:orcid>
      </ns1:entity>
    </ns1:contribute>
    <ns1:contribute seq="2">
      <ns1:role>46</ns1:role>
      <ns1:entity seq="0">
        <ns3:firstname>Bojana</ns3:firstname>
        <ns3:lastname>Bašaragin</ns3:lastname>
        <ns3:institution>Istraživačko-razvojni institut za veštačku inteligenciju Srbije</ns3:institution>
        <ns3:orcid>0000-0002-7679-1676</ns3:orcid>
      </ns1:entity>
    </ns1:contribute>
    <ns1:contribute seq="3">
      <ns1:role>46</ns1:role>
      <ns1:entity seq="0">
        <ns3:firstname>Darija</ns3:firstname>
        <ns3:lastname>Medvecki</ns3:lastname>
        <ns3:institution>Istraživačko-razvojni institut za veštačku inteligenciju Srbije</ns3:institution>
        <ns3:orcid>0000-0002-4180-0050</ns3:orcid>
      </ns1:entity>
    </ns1:contribute>
    <ns1:contribute seq="4">
      <ns1:role>46</ns1:role>
      <ns1:entity seq="0">
        <ns3:firstname>Lorenzo</ns3:firstname>
        <ns3:lastname>Cassano</ns3:lastname>
        <ns3:institution>Bayer A.G. Research and development</ns3:institution>
      </ns1:entity>
    </ns1:contribute>
    <ns1:contribute seq="5">
      <ns1:role>46</ns1:role>
      <ns1:entity seq="0">
        <ns3:firstname>Nikola</ns3:firstname>
        <ns3:lastname>Milošević</ns3:lastname>
        <ns3:institution>Istraživačko-razvojni institut za veštačku inteligenciju Srbije</ns3:institution>
        <ns3:orcid>0000-0003-2706-9676</ns3:orcid>
      </ns1:entity>
    </ns1:contribute>
  </ns1:lifecycle>
  <ns1:technical>
    <ns1:format>application/pdf</ns1:format>
    <ns1:size>8991896</ns1:size>
    <ns1:location>https://unilib.phaidrabg.rs/o:8175</ns1:location>
  </ns1:technical>
  <ns1:rights>
    <ns1:cost>no</ns1:cost>
    <ns1:copyright>yes</ns1:copyright>
    <ns1:license>20</ns1:license>
  </ns1:rights>
  <ns1:classification>
    <ns1:purpose>70</ns1:purpose>
  </ns1:classification>
  <ns1:organization>
    <ns8:hoschtyp>92000004</ns8:hoschtyp>
    <ns8:orgassignment>
      <ns8:faculty>71A08</ns8:faculty>
    </ns8:orgassignment>
  </ns1:organization>
  <ns12:digitalbook>
    <ns12:name_magazine language="en">Proceedings of the 6th International Open Search Symposium #ossym2024</ns12:name_magazine>
    <ns12:from_page>59</ns12:from_page>
    <ns12:to_page>64</ns12:to_page>
    <ns12:publisherlocation>Minhen, Nemačka</ns12:publisherlocation>
    <ns12:publisher>Leibniz Supercomputing Centre LRZ</ns12:publisher>
    <ns12:releaseyear>2024</ns12:releaseyear>
  </ns12:digitalbook>
</ns0:uwmetadata>
