<?xml version="1.0" encoding="UTF-8"?><?xml-stylesheet type="text/xsl" href="static/CINECAstyle.xsl"?><OAI-PMH xmlns="http://www.openarchives.org/OAI/2.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/ http://www.openarchives.org/OAI/2.0/OAI-PMH.xsd"><responseDate>2026-06-06T01:17:13Z</responseDate><request verb="GetRecord" identifier="oai:iris.cnr.it:20.500.14243/562981" metadataPrefix="oai_dc">https://iris.cnr.it/oai/request</request><GetRecord><record><header><identifier>oai:iris.cnr.it:20.500.14243/562981</identifier><datestamp>2026-01-16T01:15:20Z</datestamp><setSpec>com_20.500.14243_46</setSpec><setSpec>com_20.500.14243_21</setSpec><setSpec>col_20.500.14243_47</setSpec><setSpec>ou_ou294</setSpec><setSpec>ou_ou239</setSpec></header><metadata><oai_dc:dc xmlns:oai_dc="http://www.openarchives.org/OAI/2.0/oai_dc/" xmlns:doc="http://www.lyncode.com/xoai" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:dc="http://purl.org/dc/elements/1.1/" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/oai_dc/ http://www.openarchives.org/OAI/2.0/oai_dc.xsd">
<dc:title>Novel benchmark for NER in the wastewater and stormwater domain</dc:title>
<dc:creator>Cardillo F. A.</dc:creator>
<dc:creator>Debole F.</dc:creator>
<dc:creator>Frontini F.</dc:creator>
<dc:creator>Aelami M.</dc:creator>
<dc:creator>Chahinian N.</dc:creator>
<dc:creator>Conrad S.</dc:creator>
<dc:contributor>Cardillo, F. A.</dc:contributor>
<dc:contributor> Debole, F.</dc:contributor>
<dc:contributor> Frontini, F.</dc:contributor>
<dc:contributor> Aelami, M.</dc:contributor>
<dc:contributor> Chahinian, N.</dc:contributor>
<dc:contributor> Conrad, S.</dc:contributor>
<dc:subject>Annotation projection</dc:subject>
<dc:subject>Domain-specific corpus</dc:subject>
<dc:subject>LLMs for NER</dc:subject>
<dc:subject>Multilingual NLP</dc:subject>
<dc:subject>Named Entity Recognition</dc:subject>
<dc:description>Efficient wastewater and stormwater management is mandatory for sustainable cities. Extracting structured knowledge from reports and regulations is challenging due to domain-specific terminology and multilingual contexts. This work focuses on domain-specific Named Entity Recognition (NER) as a first step towards effective relation and information extraction to support decision making. A multilingual benchmark is crucial for evaluating these methods. This study develops a French-Italian domain-specific text corpus for wastewater management. It evaluates state-of-the-art NER methods, including LLM-based approaches, to provide a reliable baseline for future strategies and explores automated annotation projection in view of an extension of the corpus to new languages.</dc:description>
<dc:date>2025</dc:date>
<dc:type>info:eu-repo/semantics/conferenceObject</dc:type>
<dc:identifier>https://hdl.handle.net/20.500.14243/562981</dc:identifier>
<dc:identifier>10.1109/cist65886.2025.11224095</dc:identifier>
<dc:identifier>info:eu-repo/semantics/altIdentifier/scopus/2-s2.0-105024952471</dc:identifier>
<dc:relation>info:eu-repo/semantics/altIdentifier/isbn/979-8-3315-4384-6</dc:relation>
<dc:identifier>https://ieeexplore.ieee.org/document/11224095</dc:identifier>
<dc:language>eng</dc:language>
<dc:relation>ispartofbook:Cist 2025  proceedings</dc:relation>
<dc:relation>Cist 2025 - 8th IEEE International Congress on Information Science and Technology</dc:relation>
<dc:relation>firstpage:226</dc:relation>
<dc:relation>lastpage:231</dc:relation>
<dc:relation>numberofpages:6</dc:relation>
<dc:relation>serie:COLLOQUIUM IN INFORMATION SCIENCE AND TECHNOLOGY</dc:relation>
<dc:rights>info:eu-repo/semantics/restrictedAccess</dc:rights>
<dc:format>ELETTRONICO</dc:format>
<dc:publisher>Institute of Electrical and Electronics Engineers</dc:publisher>
<dc:publisher>country:USA</dc:publisher>
<dc:rights>license:NON PUBBLICO - Accesso privato/ristretto</dc:rights>
<dc:rights>license uri:iris.PRI01</dc:rights>
</oai_dc:dc></metadata></record></GetRecord></OAI-PMH>