<?xml version="1.0" encoding="UTF-8"?><?xml-stylesheet type="text/xsl" href="static/CINECAstyle.xsl"?><OAI-PMH xmlns="http://www.openarchives.org/OAI/2.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/ http://www.openarchives.org/OAI/2.0/OAI-PMH.xsd"><responseDate>2026-05-10T23:15:33Z</responseDate><request verb="GetRecord" identifier="oai:iris.cnr.it:20.500.14243/479241" metadataPrefix="oai_dc">https://iris.cnr.it/oai/request</request><GetRecord><record><header><identifier>oai:iris.cnr.it:20.500.14243/479241</identifier><datestamp>2025-01-24T23:20:40Z</datestamp><setSpec>com_20.500.14243_46</setSpec><setSpec>com_20.500.14243_21</setSpec><setSpec>col_20.500.14243_47</setSpec><setSpec>ou_ou239</setSpec></header><metadata><oai_dc:dc xmlns:oai_dc="http://www.openarchives.org/OAI/2.0/oai_dc/" xmlns:doc="http://www.lyncode.com/xoai" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:dc="http://purl.org/dc/elements/1.1/" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/oai_dc/ http://www.openarchives.org/OAI/2.0/oai_dc.xsd">
<dc:title>XL-WA: a Gold Evaluation Benchmark for Word Alignment in 14 Language Pairs</dc:title>
<dc:creator>Martelli F.</dc:creator>
<dc:creator>Bejgu A. S.</dc:creator>
<dc:creator>Campagnano C.</dc:creator>
<dc:creator>Cibej J.</dc:creator>
<dc:creator>Costa R.</dc:creator>
<dc:creator>Gantar A.</dc:creator>
<dc:creator>Kallas J.</dc:creator>
<dc:creator>Koeva S.</dc:creator>
<dc:creator>Koppel K.</dc:creator>
<dc:creator>Krek S.</dc:creator>
<dc:creator>Langemets M.</dc:creator>
<dc:creator>Lipp V.</dc:creator>
<dc:creator>Nimb S.</dc:creator>
<dc:creator>Olsen S.</dc:creator>
<dc:creator>Pedersen B. S.</dc:creator>
<dc:creator>Quochi V.</dc:creator>
<dc:creator>Salgado A.</dc:creator>
<dc:creator>Simon L.</dc:creator>
<dc:creator>Tiberius C.</dc:creator>
<dc:creator>Urena-Ruiz R. -J.</dc:creator>
<dc:creator>Navigli R.</dc:creator>
<dc:contributor>Federico Boschetti, Gianluca E. Lebani, Bernardo Magnini, Nicole Novielli</dc:contributor>
<dc:contributor>Martelli, F.</dc:contributor>
<dc:contributor> Bejgu, A. S.</dc:contributor>
<dc:contributor> Campagnano, C.</dc:contributor>
<dc:contributor> Cibej, J.</dc:contributor>
<dc:contributor> Costa, R.</dc:contributor>
<dc:contributor> Gantar, A.</dc:contributor>
<dc:contributor> Kallas, J.</dc:contributor>
<dc:contributor> Koeva, S.</dc:contributor>
<dc:contributor> Koppel, K.</dc:contributor>
<dc:contributor> Krek, S.</dc:contributor>
<dc:contributor> Langemets, M.</dc:contributor>
<dc:contributor> Lipp, V.</dc:contributor>
<dc:contributor> Nimb, S.</dc:contributor>
<dc:contributor> Olsen, S.</dc:contributor>
<dc:contributor> Pedersen, B. S.</dc:contributor>
<dc:contributor> Quochi, V.</dc:contributor>
<dc:contributor> Salgado, A.</dc:contributor>
<dc:contributor> Simon, L.</dc:contributor>
<dc:contributor> Tiberius, C.</dc:contributor>
<dc:contributor> Urena-Ruiz, R. -J.</dc:contributor>
<dc:contributor> Navigli, R.</dc:contributor>
<dc:subject>Deep Learning</dc:subject>
<dc:subject>Multilinguality</dc:subject>
<dc:subject>Natural Language Processing</dc:subject>
<dc:subject>Word Alignment</dc:subject>
<dc:description>Word alignment plays a crucial role in several Natural Language Processing tasks, such as lexicon injection and cross-lingual label projection. The evaluation of word alignment systems relies heavily on manually-curated datasets, which are not always available, especially in mid- and low-resource languages. In order to address this limitation, we propose XL-WA, a novel entirely manually-curated evaluation benchmark for word alignment covering 14 language pairs. We illustrate the creation process of our benchmark and compare statistical and neural approaches to word alignment in both language-specific and zero-shot settings, thus investigating the ability of state-of-the-art models to generalize on unseen language pairs. We release our new benchmark at: https://github.com/SapienzaNLP/XL-WA.</dc:description>
<dc:date>2023</dc:date>
<dc:type>info:eu-repo/semantics/conferenceObject</dc:type>
<dc:identifier>https://hdl.handle.net/20.500.14243/479241</dc:identifier>
<dc:identifier>info:eu-repo/semantics/altIdentifier/scopus/2-s2.0-85181170710</dc:identifier>
<dc:language>eng</dc:language>
<dc:relation>ispartofbook:Proceedings of the Ninth Italian Conference on Computational Linguistics</dc:relation>
<dc:relation>9th Italian Conference on Computational Linguistics, CLiC-it 2023</dc:relation>
<dc:relation>volume:3596</dc:relation>
<dc:relation>numberofpages:9</dc:relation>
<dc:relation>serie:CEUR WORKSHOP PROCEEDINGS</dc:relation>
<dc:rights>info:eu-repo/semantics/openAccess</dc:rights>
<dc:publisher>CEUR-WS</dc:publisher>
<dc:rights>license:Creative commons</dc:rights>
<dc:rights>license uri:http://creativecommons.org/licenses/by/4.0/</dc:rights>
</oai_dc:dc></metadata></record></GetRecord></OAI-PMH>