<?xml version="1.0" encoding="UTF-8"?>
<TEI xml:space="preserve" xmlns="http://www.tei-c.org/ns/1.0" 
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" 
xsi:schemaLocation="http://www.tei-c.org/ns/1.0 https://raw.githubusercontent.com/kermitt2/grobid/master/grobid-home/schemas/xsd/Grobid.xsd"
 xmlns:xlink="http://www.w3.org/1999/xlink">
	<teiHeader xml:lang="en">
		<fileDesc>
			<titleStmt>
				<title level="a" type="main">GFG -Gender-Fair Generation: A CALAMITA Challenge</title>
			</titleStmt>
			<publicationStmt>
				<publisher/>
				<availability status="unknown"><licence/></availability>
			</publicationStmt>
			<sourceDesc>
				<biblStruct>
					<analytic>
						<author>
							<persName><forename type="first">Simona</forename><surname>Frenda</surname></persName>
							<email>s.frenda@hw.ac.uk</email>
							<affiliation key="aff0">
								<orgName type="laboratory">Interaction Lab</orgName>
								<orgName type="institution">Heriot-Watt University</orgName>
								<address>
									<settlement>Edinburgh</settlement>
									<country key="GB">Scotland</country>
								</address>
							</affiliation>
							<affiliation key="aff1">
								<orgName type="institution">aequa-tech</orgName>
								<address>
									<settlement>Turin</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Andrea</forename><surname>Piergentili</surname></persName>
							<email>apiergentili@fbk.eu</email>
							<affiliation key="aff2">
								<orgName type="institution">Fondazione Bruno Kessler</orgName>
								<address>
									<settlement>Trento</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
							<affiliation key="aff3">
								<orgName type="institution">University of Trento</orgName>
								<address>
									<settlement>Trento</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Beatrice</forename><surname>Savoldi</surname></persName>
							<email>bsavoldi@fbk.eu</email>
							<affiliation key="aff2">
								<orgName type="institution">Fondazione Bruno Kessler</orgName>
								<address>
									<settlement>Trento</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Marco</forename><surname>Madeddu</surname></persName>
							<email>marco.madeddu@unito.it</email>
							<affiliation key="aff4">
								<orgName type="department">Computer Science Department</orgName>
								<orgName type="institution">University of Turin</orgName>
								<address>
									<settlement>Turin</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Martina</forename><surname>Rosola</surname></persName>
							<email>martina.rosola@gmail.com</email>
							<affiliation key="aff5">
								<orgName type="institution">Universitat de Barcelona</orgName>
								<address>
									<settlement>Barcelona</settlement>
									<country key="ES">Spain</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Silvia</forename><surname>Casola</surname></persName>
							<email>s.casola@lmu.de</email>
							<affiliation key="aff6">
								<orgName type="department">MaiNLP &amp; MCML</orgName>
								<orgName type="institution">LMU Munich</orgName>
								<address>
									<country key="DE">Germany</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Chiara</forename><surname>Ferrando</surname></persName>
							<email>chiara.ferrando@unito.it</email>
							<affiliation key="aff4">
								<orgName type="department">Computer Science Department</orgName>
								<orgName type="institution">University of Turin</orgName>
								<address>
									<settlement>Turin</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Viviana</forename><surname>Patti</surname></persName>
							<email>viviana.patti@unito.it</email>
							<affiliation key="aff4">
								<orgName type="department">Computer Science Department</orgName>
								<orgName type="institution">University of Turin</orgName>
								<address>
									<settlement>Turin</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Matteo</forename><surname>Negri</surname></persName>
							<email>negri@fbk.eu</email>
							<affiliation key="aff2">
								<orgName type="institution">Fondazione Bruno Kessler</orgName>
								<address>
									<settlement>Trento</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Luisa</forename><surname>Bentivogli</surname></persName>
							<affiliation key="aff2">
								<orgName type="institution">Fondazione Bruno Kessler</orgName>
								<address>
									<settlement>Trento</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<title level="a" type="main">GFG -Gender-Fair Generation: A CALAMITA Challenge</title>
					</analytic>
					<monogr>
						<idno type="ISSN">1613-0073</idno>
					</monogr>
					<idno type="MD5">D5158ECE06D9DEF1DCD4E927F558F4C9</idno>
				</biblStruct>
			</sourceDesc>
		</fileDesc>
		<encodingDesc>
			<appInfo>
				<application version="0.7.2" ident="GROBID" when="2025-04-23T17:37+0000">
					<desc>GROBID - A machine learning software for extracting information from scholarly documents</desc>
					<ref target="https://github.com/kermitt2/grobid"/>
				</application>
			</appInfo>
		</encodingDesc>
		<profileDesc>
			<textClass>
				<keywords>
					<term>Gender-fair language, Inclusive language, Unfairness detection, Machine translation, Generation, Neomorphemes 1. Challenge: Introduction and Motivation Orcid 0000-0002-6215-3374 (S. Frenda)</term>
					<term>0000-0003-2117-1338 (A. Piergentili)</term>
					<term>0000-0002-3061-8317 (B. Savoldi)</term>
					<term>0009-0004-5620-0631 (M. Madeddu)</term>
					<term>0000-0002-8891-352X (M. Rosola)</term>
					<term>0000-0002-0017-2975 (S. Casola)</term>
					<term>0000-0001-5991-370X (V. Patti)</term>
					<term>0000-0002-8811-4330 (M. Negri)</term>
					<term>0000-0001-7480-2231 (L. Bentivogli)</term>
				</keywords>
			</textClass>
			<abstract>
<div xmlns="http://www.tei-c.org/ns/1.0"><p>Gender-fair language aims at promoting gender equality by using terms and expressions that include all identities and avoid reinforcing gender stereotypes. Implementing gender-fair strategies is particularly challenging in heavily gender-marked languages, such as Italian. To address this, the Gender-Fair Generation challenge intends to help shift toward gender-fair language in written communication. The challenge, designed to assess and monitor the recognition and generation of gender-fair language in both mono-and cross-lingual scenarios, includes three tasks: (1) the detection of gendered expressions in Italian sentences, (2) the reformulation of gendered expressions into gender-fair alternatives, and (3) the generation of gender-fair language in automatic translation from English to Italian. The challenge relies on three different annotated datasets: the GFL-it corpus, which contains Italian texts extracted from administrative documents provided by the University of Brescia; GeNTE, a bilingual test set for gender-neutral rewriting and translation built upon a subset of the Europarl dataset; and Neo-GATE, a bilingual test set designed to assess the use of non-binary neomorphemes in Italian for both fair formulation and translation tasks. Finally, each task is evaluated with specific metrics: average of F1-score obtained by means of BERTScore computed on each entry of the datasets for task 1, an accuracy measured with a gender-neutral classifier, and a coverage-weighted accuracy for tasks 2 and 3.</p></div>
			</abstract>
		</profileDesc>
	</teiHeader>
	<text xml:lang="en">
		<body>
<div xmlns="http://www.tei-c.org/ns/1.0"><p>reinforcing gender stereotypes <ref type="bibr" target="#b0">[1]</ref>.</p><p>In order to pursue the goals of fairness and inclusiveness, measures that take into account the importance of the correlation between language and gender become central. Especially in heavily gender-marked languages such as Italian, the use and application of gender-fair strategies is an urgent and yet difficult challenge. Indeed, in these languages, several are the elements one has to take into account to ensure a gender-fair use of language. However, adopting a gender-fair language is crucial given the negative effects of the masculine generics, documented in a range of empirical studies <ref type="bibr" target="#b1">[2,</ref><ref type="bibr" target="#b2">3]</ref>; and recent years witnessed an increase in awareness and effort to address these issues by promoting gender-fair language <ref type="bibr" target="#b3">[4]</ref>.</p><p>In Italian, the masculine is not only used to refer to and address men but also generic or unknown individuals; mixed-gender groups, regardless of the proportion of genders of its members; women, typically when occupying prestigious roles; and genderqueer people, given that there is no codified grammatical gender for referring to them <ref type="bibr" target="#b4">[5]</ref>. This use, though, makes women and gen-derqueer people invisible, giving rise to a proper injustice <ref type="bibr" target="#b5">[6,</ref><ref type="bibr" target="#b6">7,</ref><ref type="bibr" target="#b7">8]</ref>. Extensive empirical literature also highlights how certain gendered expressions influence our cognition, with masculine terms evoking male images and reducing, e.g, the likelihood of women applying for or being considered suitable for a job position (for an overview see <ref type="bibr" target="#b8">[9,</ref><ref type="bibr" target="#b9">10]</ref>).</p><p>Crucially, such unfair linguistic practices are perpetuated in language technologies <ref type="bibr" target="#b10">[11]</ref>. This becomes particularly evident in languages, like Italian, for which NLP tools often adopt masculine and stereotypical representations, making undue binary gender assumptions <ref type="bibr" target="#b11">[12]</ref>.</p><p>We propose the Gender-Fair Generation challenge at CALAMITA 2024 <ref type="bibr" target="#b12">[13]</ref>, whose goal is to reduce the use of gender-unfair expressions in written Italian, focusing on both monolingual and cross-lingual scenarios (English-Italian). Our challenge is structured into three tasks-i) gendered language detection, ii) fair reformulation, and iii) fair translation-across three different datasets. Namely, the newly created GFL-it corpus, composed of Italian texts extracted from 35 documents provided by the academic administration office of the University of Brescia and annotated following specific guidelines <ref type="bibr" target="#b0">[1]</ref>; GeNTE, a bilingual test set for gender-neutral rewriting and translation built on a subset of the Europarl dataset <ref type="bibr" target="#b13">[14]</ref>; and Neo-GATE, a bilingual test set designed to evaluate the use of nonbinary neomorphemes in Italian <ref type="bibr" target="#b14">[15]</ref>. <ref type="foot" target="#foot_0">1</ref> We combine and repurpose these datasets across the three tasks envisioned in the Gender-Fair Generation challenge.</p><p>This report is structured as follows: in Section 2, we provide a description of our challenge; in Section 3, we present the three datasets in detail; in Section 4, we describe the metrics involved in our task; in Section 5, we describe the limitations of our work, and finally, in Section 6, we discuss the ethical issues.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.">Challenge: Description</head><p>The Gender-Fair Generation challenge is organized into three tasks, which we present in detail below.</p><p>1) Gendered language detection: the first task tests the models' ability to identify referentially gender-marked expressions within Italian sentences, namely those expressions whose (typically grammatical) gender is linked to their human referent. Referentially gendered (henceforth simply gendered) language includes:</p><p>• the overextended masculine or feminine, i.e., the use of a single gendered expression to refer to persons belonging to a mixed-gender group -e.g., i cittadini (the.M citizens:M) used for a group of citizens of different genders; • the generic masculine or feminine, i.e., the use of a single gendered expression to refer to a generic or unknown person -e.g., il candidato deve avere tutti i requisiti (the.M candidate:M has to possess all the requirements); • the incongruous gender, i.e., the use of a grammatical gender that does not match the referent's gender -e.g., il professore ordinario Maria Rossi (the.M full.M professor:M Maria Rossi).</p><p>2) Fair reformulation: the second task tests models' ability to rewrite gendered expressions into alternative gender-fair expressions. To achieve this goal, various gender-fair language strategies can be employed. In particular, we will employ obscuration strategies:</p><p>• conservative obscuration, i.e., the use of expressions and constructions that avoid providing information on the referent's gender -e.g., il corpo docente (the teaching body) or coloro che insegnano (those who teach) instead of i professori (the.M professors:M); • innovative obscuration, i.e., the use of novel, gender-neutral markers instead of the gendered ones -e.g., lǝ professorǝ (the.INN professor:INN) instead of il professore (the.M professor:M) or la professoressa (the.F professor:F). <ref type="foot" target="#foot_1">2</ref>As we further discuss in Section 3, the released version of GFL-it for this challenge and GeNTE include references and annotations designed for the former strategy, whereas Neo-GATE for the latter.</p><p>Note that the chosen strategies do not exhaust the full range of possibilities: we discarded, for the moment, visibility strategies such as the repetition of an expression in the feminine and the masculine -e.g., i professori e le professoresse (the.M professors:M and the.F professors:F) -and the repetition of in three gendered forms (feminine, masculine and innovative) -e.g., i professori, lǝ professorǝ e le professoresse (the.M professors:M, the.INN professors:INN and the.F professors:F).</p><p>3) Fair translation: like the second task, the third one is designed to test the models' ability to generate genderfair language texts, but in the cross-lingual context of automatic translation from English into Italian. For example, consider applying the two gender-fair language strategies described above to the translation of the sentence "I am glad to know such knowledgeable doctors": • innovative obscuration: Sono contentǝ di conoscere medicǝ così preparatǝ.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.">Data description</head><p>For our challenge, we propose three benchmarks dedicated to the evaluation of gender-fair language generation, (GFL-it <ref type="foot" target="#foot_2">3</ref> , GeNTE <ref type="bibr" target="#b13">[14]</ref>, <ref type="foot" target="#foot_3">4</ref> and Neo-GATE <ref type="bibr" target="#b14">[15]</ref>), <ref type="foot" target="#foot_4">5</ref> and a total of 7 prompts to be used across the tasks and datasets. We describe the datasets in subsections 3.1, 3.2, and 3.3 respectively, and the prompts in subsection 3.4.</p><p>Statistics about the benchmarks and their use within this challenge proposal are available in Table <ref type="table" target="#tab_1">1</ref>. GFL-it contains a total of 2,187 texts, among which 5 expert annotators identified an average of 3.24 unfair spans (in total 3,908) in 1,206 texts. For each identified span, the annotators proposed various gender-fair alternatives, with an average of 3.8 alternatives per span. For more detailed statistics about GeNTE and Neo-GATE we refer to the respective papers.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.1.">GFL-it</head><p>GFL-it was built on documents and texts from University website pages provided by the University of Brescia. It constitutes an expansion of the corpus presented in Rosola et al. <ref type="bibr" target="#b0">[1]</ref>. The corpus comprises a total of 35 documents in Italian, split into 2,187 texts. Each text was annotated by 5 paid expert annotators following the original annotation scheme <ref type="bibr" target="#b0">[1]</ref>. First, the annotators identified all the spans that contained any gender-unfairness, distinguishing among: overextended <ref type="bibr" target="#b2">(3,</ref><ref type="bibr">465)</ref>, generic (530) and incongruous gender (31) (see 2). Overall, 3,908 spans were identified. Then, they provided at least one alternative per span. The alternatives could belong to any of the gender-fair strategies: conservative or innovative obscuration, conservative or innovative visibility, or hybrid alternatives (i.e., any combination of these types).</p><p>Given that GFL-it is annotated for spans, each text contains a list of different spans and their reformulations in different forms of gender-fair language <ref type="foot" target="#foot_5">6</ref> . More specifi-cally, each entry is described by the following attributes:</p><p>• id_text: The unique ID for each text.</p><p>• text: The entire text of the entry.</p><p>• list_spans: The list containing all spans found in the text. • rewritten_texts_generico: A reformulation of the entire text where spans labeled as generic are replaced. • rewritten_texts_sovraesteso: A reformulation of the entire text where spans labeled as overextended are replaced. • rewritten_texts_generico_e_sovraesteso: A reformulation of the entire text where spans are randomly replaced by available options in rewrit-ten_texts_generico or rewritten_texts_sovraesteso.</p><p>Each span in list_spans follows the structure:</p><p>• span: The textual representation of the span.</p><p>• start: The starting index of the span in the text.</p><p>• end: The ending index of the span in the text.</p><p>• labels: A list of the types of gendered language used in the selected spans; possible values are overextended, generic and incongruous gender. • key_span: The concatenation of span, start and end attributes; it can be used as an ID for each span contained inside a text.</p><p>We propose to use the GFL-it corpus for tasks 1 and 2,<ref type="foot" target="#foot_6">7</ref> namely, those regarding gendered language detection and fair reformulation.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.2.">GeNTE</head><p>GeNTE is a parallel English → Italian test set <ref type="bibr" target="#b15">[16]</ref>. Originally designed to evaluate MT models' ability to perform gender-neutral translations, GeNTE was built upon a subset of the Europarl corpus <ref type="bibr" target="#b16">[17]</ref>, which is representative of natural, formal communicative situations from the institutional domain, the context where gender-neutral language is most accepted and encouraged <ref type="bibr" target="#b15">[16,</ref><ref type="bibr" target="#b13">14]</ref>. Overall, it consists of 1,500 &lt;English source, gendered Italian reference, gender-neutral Italian reference&gt; triplets aligned at the sentence level, which always contain at least one mention of human referents. The gendered Italian reference (REF-G) comes from the original Europarl corpus, whereas the gender-neutral reference (REF-N) was produced by professional translators who edited gendered forms into gender-neutral alternatives.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Text</head><p>Per gli iscritti agli anni successivi al primo tali valutazioni scendono rispettivamente a NUM , NUM (sotto la soglia critica) e NUM (vicino alla soglia critica).</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Span</head><p>gli iscritti Reformulated Text Per le persone iscritte agli anni successivi al primo tali valutazioni scendono rispettivamente a NUM , NUM (sotto la soglia critica) e NUM (vicino alla soglia critica).</p><p>[For those enrolled in years after the first, these ratings drop to NUM, NUM (below the critical threshold) and NUM (close to the critical threshold), respectively.]</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Table 2</head><p>Example from the GFL-it dataset. Words in bold correspond to the identified unfair spans in the text, and the reformulated expressions in the reformulated text. A translation of the text is provided in square brackets.  As shown in Table <ref type="table" target="#tab_2">3</ref>, GeNTE represents two types of phenomena, which are equally represented within the corpus. Namely, i) Set-N, featuring 750 genderambiguous source sentences that require to be rendered gender-neutrally; and ii) Set-G featuring genderunambiguous source sentences, to be properly rendered with gendered (masculine or feminine) forms. Crucially, these two sets are a key feature of GeNTE, as they allow benchmarking whether systems are able to perform gender-neutral translations, but only when desirable. As a matter of fact, when referents' gender is unknown or irrelevant, undue gender inferences should not be made and gender-neutral language (i.e., conservative obscuration strategy) should be used. However, gender-neutralization should not be always enforced, and when a referent's gender is known or relevant, models should not over-generalize to gender-neutral generations.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Set</head><p>Each entry in GeNTE is organized into the following fields:</p><p>• ID: The unique GeNTE ID. We propose the use of the whole GeNTE for the translation task 3, testing models' ability to produce gender-neutral translations only when appropriate. For</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>SOURCE</head><p>After the accident, they took me to the hospital and I stayed there for a whole month.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>REF-M</head><p>Dopo l'incidente, mi hanno portato all'ospedale e sono rimasto lì per un mese intero.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>REF-F</head><p>Dopo l'incidente, mi hanno portata all'ospedale e sono rimasta lì per un mese intero.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>REF-TAGGED</head><p>Dopo l'incidente, mi hanno portat@ all'ospedale e sono rimast@ lì per un mese intero. ANNOTATION portato portata portat@; rimasto rimasta rimast@;</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Table 4</head><p>Example of a Neo-GATE entry, already adapted to the schwa-simple neomorpheme paradigm. Underlined words include the neomorpheme schwa (@).</p><p>the fair reformulation task 2, we only repurpose part of the Italian portion of the corpus, i.e., REF-G references from Set-N.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.3.">Neo-GATE</head><p>Similarly to GeNTE, Neo-GATE is a parallel corpus designed for gender-fair English → Italian MT evaluation. Here, however, the focus is on the use of gender-fair neomorphemes (i.e., innovative obscuration strategy) rather than conservative gender-neutral language. Neo-GATE was built on GATE <ref type="bibr" target="#b17">[18]</ref>, a test set manually created specifically to evaluate gender reformulation and gender bias in MT. In GATE, the gender of human entities is unknown, i.e., there are no linguistic elements providing gender information about human referents in the (English) source sentences.</p><p>Neo-GATE includes an annotation that defines the words upon which the evaluation is based. It includes the three forms required for the evaluation, i.e., the masculine and feminine forms, and forms featuring placeholders in place of Italian overt gender markers. Before the evaluation, the placeholders must be replaced with the correct forms in the desired neomorpheme paradigm. For this task, Neo-GATE was adapted to a version of the 'schwa' paradigm <ref type="bibr" target="#b18">[19,</ref><ref type="bibr" target="#b19">20]</ref>, to which we refer as schwasimple here, i.e., the placeholders were replaced with the forms described in Appendix A.</p><p>Like GeNTE, Neo-GATE includes Italian references that differ exclusively in gender expression. Besides the English source sentence, all entries in Neo-GATE have three Italian references: REF-M, where the gender of words referring to human beings is masculine, REF-F, where human beings are referred to as feminine, and REF-TAGGED, where placeholders replace overt markers of gender -here adapted to the schwa-simple paradigm. However, differently from GeNTE, the English sentences in Neo-GATE never include gender cues. An example of a Neo-GATE entry is available in Table <ref type="table">4</ref>.</p><p>Each entry in Neo-GATE includes the following fields:</p><p>• #: The entry identifier within Neo-GATE.</p><p>• GATE-ID: A unique identifier of the original GATE entry, composed of a prefix indicating the subset of origin followed by a serial number. We propose to use all Neo-GATE entries for all three tasks of our challenge. While for tasks 1 (gendered language detection) and 2 (fair reformulation) we only use Italian references -namely both REF-M and REF-F for task 1, and REF-M only for task 2 -as input for the models, for task 3 (fair translation) we use the English SOURCE sentences.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.4.">Example of used prompts</head><p>This section describes the prompts we propose for our challenge, with examples available in Table <ref type="table">5</ref>.</p><p>In prompts A and B, we ask the model to identify the gendered expressions (introduced by the tag [Espressione]:) in the text given as input; if no gendered expression is detected in the text (initialized with the tag [Genere marcato]:) the model should output 0. The model can recognize more than one gendered expression.</p><p>In prompts C, D, and E, the shots include one line starting with the tag [Genere marcato]:, indicating that the following sentence is gendered. Then, in prompts C and D the following line starts with [Neutro]: followed by a gender-neutral reformulation, whereas in E it starts with [Neomorfema]: and includes the innovative obscuration alternative of the first sentence, with neomorphemes in place of the masculine forms. <ref type="foot" target="#foot_7">8</ref>Prompts F and G start with the tag [Inglese]: followed by the English source sentence to be translated. In prompt F, the second line either starts with the tag [Italiano, genere marcato]: (see F -Exemplar format 1 in Table <ref type="table">5</ref>) if it is followed by a gendered translation or with the tag [Italiano, neutro]: if the subsequent translation is gender-neutral (see F -Exemplar format 2). Models are required to produce the correct tag and translation depending on the presence or absence of gender cues in the source. Finally, prompt G includes two different translations after the source sentence: the first, preceded by the tag [Italiano, genere marcato]:, includes a translation featuring masculine forms in reference to human beings, whereas the second translation starts with the tag [Italiano, neomorfema]: and uses neomorphemes in reference to human beings. Models are required to produce both translations, though only the second will be extracted in post-processing and used for the evaluation.</p><p>In particular, prompts D, E, F, and G are based on the ones used in previous experiments on the same datasets <ref type="bibr" target="#b11">[12,</ref><ref type="bibr" target="#b14">15]</ref>, and were in turn inspired by the format proposed by Sánchez et al. <ref type="bibr" target="#b20">[21]</ref>.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Task 1: Gendered language detection</head></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>A Instruction</head><p>Identifica le espressioni che contengono dei marcatori di genere femminile o maschile. Se più di un'espressione è identificata, separale con " ;". Se nessuna espressione è identificata, restituisci 0.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Exemplar format</head><p>[Genere marcato]: A livello di Ateneo ha partecipato il 76% degli iscritti del 1°anno del CdL e l'81% di tutti gli altri studenti.</p><p>[Espressione]: degli iscritti ; tutti gli altri studenti</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>B Instruction</head><p>Identifica le espressioni che contengono dei marcatori di genere femminile o maschile. Se più di un'espressione è identificata, separale con " ;". Se nessuna espressione è identificata, restituisci 0.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Exemplar format</head><p>[Genere marcato]: Quest'anno mi sono ammalata già due volte.</p><p>[Espressione]: ammalata Task 2: Fair reformulation</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>C Instruction</head><p>Riformula la seguente frase utilizzando un linguaggio neutro rispetto al genere dei referenti umani, evitando l'uso di forme maschili e femminili.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Exemplar format</head><p>[Genere marcato]: -Il 79% dei laureati lavora (a un anno dalla laurea).</p><p>[Neutro]: -Il 79% delle persone laureate lavora (a un anno dalla laurea).</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>D Instruction</head><p>Riformula la seguente frase utilizzando un linguaggio neutro rispetto al genere dei referenti umani, evitando l'uso di forme maschili e femminili.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Exemplar format</head><p>[Genere marcato]: Secondariamente, fino a che punto aumenta la trasparenza e la responsabilità dei parlamentari europei?</p><p>[Neutro]: Secondariamente, fino a che punto aumenta la trasparenza e la responsabilità dei membri del Parlamento Europeo?</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>E Instruction</head><p>Riformula la seguente frase usando il neomorfema "@". Il neomorfema "@" deve essere usato come sostituto dei morfemi maschili e femminili nelle parole che si riferiscono agli esseri umani.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Exemplar format</head><p>[Genere marcato]: Il partner di un mio amico ci ha invitati a cena.</p><p>[Neomorfema]: L@ partner di un@ mi@ amic@ ci ha invitat@ a cena. </p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>G Instruction</head><p>Traduci la seguente frase inglese in italiano usando il neomorfema "@". Il neomorfema "@" deve essere usato come sostituto dei morfemi maschili e femminili nelle parole che si riferiscono agli esseri umani.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Exemplar format</head><p>[Inglese]: The partner of a friend of mine invited us to dinner.</p><p>[Italiano, genere marcato]: Il partner di un mio amico ci ha invitati a cena.</p><p>[Italiano, neomorfema]: L@ partner di un@ mi@ amic@ ci ha invitat@ a cena.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Table 5</head><p>Examples of the format of all prompts we propose for our challenge. Dataset-wise, prompts A and C are designed to be used with GFL-it data, prompts B, E, and G are designed for Neo-GATE, and prompts D and F are designed for GeNTE.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="4.">Metrics</head><p>For the evaluation of gendered language detection (i.e., with GFL-it and Neo-GATE in task 1) we used the F1-score obtained using BERTScore<ref type="foot" target="#foot_8">9</ref>  <ref type="bibr" target="#b21">[22]</ref> for each entry in the datasets. In particular, for each entry, we extract the most relevant correspondence between the gendered expressions identified by the annotators and the ones produced by the generative model, computing the maximum F1-score. Once the correspondences are set for each entry, we average the scores.</p><p>For the evaluation of gender-neutral reformulationi.e., with GFL-it and GeNTE in task 2-and translationi.e., with GeNTE and Neo-GATE in task 3-we propose an accuracy score based on the labels produced by the classifier introduced in Piergentili et al. <ref type="bibr" target="#b13">[14]</ref>. More specifically, we use version 2 of the classifier, introduced in Savoldi et al. <ref type="bibr" target="#b11">[12]</ref>. This classifier assigns a label to each model output, either gender-neutral or gendered. We then compare those labels against the true labels, i.e., always gender-neutral in the reformulation task and either gendered or gender-neutral for the translation task, depending on whether the entry belongs to Set-G or Set-N respectively. The final score is computed as the corpus-level percentage of correct labels.</p><p>For neomorpheme-based gender-fair reformulation (task 2) and translation (task 3) based on Neo-GATE, we propose the coverage-weighted accuracy described in Piergentili et al. <ref type="bibr" target="#b14">[15]</ref> as the main metric. This metric takes into account both how accurately a model generates neomorphemes and the proportion of annotations (i.e., either of the masculine, feminine, or innovative forms) found during the evaluation, thus allowing for fair system comparisons and rankings. As complementary metric to assess models' ability to correctly generate neomorphemes, we propose reporting the mis-generation score <ref type="bibr" target="#b14">[15]</ref> as well. This metric can flag undesired behaviors even despite good accuracy, as it counts cases where models generate neomorphemes inappropriately, for instance by applying the use of neomorphemes to words that do not refer to human entities (e.g., by generating 'tavol@' instead of 'tavolo', en: table).</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="5.">Limitations</head><p>Our work presents some limitations. Firstly, the datasets employed only derive from specific domains: GFL-it exclusively contains data from administrative documents and official web pages of the University, GeNTE from documents of the European Parliament, and Neo-GATE data manually created by experts. The corpora could be expanded to other domains and annotated by more annotators in future research. Secondly, our metrics are only a first attempt and others should be explored in the future. Moreover, we only tested one paradigm of neomorphemes, namely the schwa-simple, while many others exist (e.g., the asterisk, the '-u', the '@' -see <ref type="bibr" target="#b22">[23]</ref> for a complete list), and even more could be proposed. Furthermore, GeNTE and Neo-GATE do not contain mixed texts where rewriting is needed with respect to one entity but not others.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="6.">Ethical issues</head><p>The proposed tasks in this challenge have the purpose of reducing the use of gender-unfair expressions in heavily gender-marked languages (i.e., Italian) that affect the visibility of other genders (in particular, feminine and non-binary). Although the datasets have been built by experts of gender-fair language, the group of annotators of GFL-it was not gender-balanced as only 2 out of 5 annotators were men.</p><p>Moreover, we are aware of the fact that the use of neomorphemes like the schwa ǝ makes reading harder for people with dyslexia or visual impairments <ref type="bibr" target="#b3">[4,</ref><ref type="bibr" target="#b23">24,</ref><ref type="bibr" target="#b24">25]</ref>. This issue, however, is mitigated thanks to the possibility of selecting the most suitable neomorpheme according to each user's needs. In particular, both people with dyslexia or visual impairments can rely on screen readers, which differ in their ability to correctly interpret specific neomorphemes: the possibility to select different neomorphemes allows each user to select the one(s) their screenreader interpret best.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="7.">Data license and copyright issues</head><p>Creative Commons Attribution 4.0 International license (CC BY 4.0). https://creativecommons.org/licenses/by-sa/ 4.0/deed.it</p><p>A. The schwa-simple paradigm </p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Table 6</head><p>The full tagset used in Neo-GATE, mapped to the Italian gendered forms and the schwa-simple nomorpheme paradigm.</p></div><figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_0"><head></head><label></label><figDesc>-G SRC When you assumed office, Mr Schreyer, you assured us that you would strive to achieve this. REF-G Al momento della sua nomina, signor [Mr] Schreyer, ci aveva promesso che si sarebbe adoperato [(would have) strived] in tal senso. REF-N Al momento della sua nomina, Schreyer, ci aveva promesso un impegno [a commitment] in tal senso. Set-N SRC To some extent, those of us who are politicians find ourselves in the middle. REF-G In certa misura quelli [those (of us)] di noi che sono politici [politicians] si trovano in una posizione intermedia. REF-N In certa misura chi di noi [who, among us,] svolge attività politica [carries out political activities] si trova in una posizione intermedia.</figDesc></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_1"><head>•</head><label></label><figDesc>Europarl_ID: The original sentence ID from Europarl's common-test-set 2. • SET : Indicates whether the entry belongs to the Set-G or the Set-N subportion of the corpus. • SRC: The English source sentence. • REF-G: The gendered Italian reference translation. • REF-N : The gender-neutral Italian reference, produced by a professional translator. • GENDER: For entries belonging to the Set-G, it indicates if the entry is Feminine or Masculine.</figDesc></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_2"><head></head><label></label><figDesc>• SOURCE: The English source sentence. • REF-M: The Italian reference where all gendermarked terms are masculine. • REF-F : The Italian reference where all gendermarked terms are feminine. • REF-TAGGED: The Italian reference where all gender-marked terms are tagged with Neo-GATE's annotation. • ANNOTATION : The word level annotation.</figDesc></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_3"><head>Task 3 :</head><label>3</label><figDesc>Fair translationF InstructionTraduci la seguente frase inglese in italiano seguendo queste regole: 1. Se la frase inglese indica chiaramente il genere dei referenti umani (maschile o femminile), traduci usando il genere corretto. 2. Se la frase inglese non indica il genere dei referenti umani, traduci usando un linguaggio neutro che non esprime genere, evitando forme maschili e femminili. Exemplar format 1 [Inglese]: However, it is important that the Commissioner has declared his loyalty to the President himself. [Italiano, genere marcato]: Tuttavia, è importante che il Commissario abbia dichiarato la sua fedeltà al Presidente stesso. Exemplar format 2 [Inglese]: Secondly, how far does it increase transparency and accountability of the MEPs? [Italiano, neutro]: Secondariamente, fino a che punto aumenta la trasparenza e la responsabilità dei membri del Parlamento Europeo?</figDesc></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_0"><head>Task GFL-it GeNTE Neo-GATE Task total</head><label></label><figDesc></figDesc><table><row><cell>Detection</cell><cell>2,187</cell><cell>-</cell><cell>841</cell><cell>3,028</cell></row><row><cell cols="2">Reformulation 1,206</cell><cell>750</cell><cell>841</cell><cell>2,797</cell></row><row><cell>Translation</cell><cell>-</cell><cell>1,500</cell><cell>841</cell><cell>2,341</cell></row><row><cell></cell><cell></cell><cell></cell><cell></cell><cell>• conservative obscuration: Sono felice di conoscere</cell></row><row><cell></cell><cell></cell><cell></cell><cell></cell><cell>un personale medico così preparato. [medical staff]</cell></row></table></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_1"><head>Table 1</head><label>1</label><figDesc>Number of dataset entries used for each task.</figDesc><table /></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_2"><head>Table 3</head><label>3</label><figDesc>Examples of Set-G and Set-N entries in GeNTE. Underlined words are linguistic cues informing about human referents' gender; words in bold are gendered mentions of human referents; words in italic are the gender-neutral reformulations of the gendered mentions. Glosses of relevant expressions are provided in square brackets.</figDesc><table /></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_3"><head>Table 6</head><label>6</label><figDesc>reports the forms used in the schwa-simple paradigm, along with the corresponding tags in Neo-GATE and masculine and feminine equivalents.</figDesc><table><row><cell>TAG</cell><cell>Description</cell><cell>Masculine</cell><cell>Feminine</cell><cell>Schwa</cell></row><row><cell>&lt;ENDS&gt;</cell><cell cols="2">portion of the word differentiating gendered forms, singular o, e, tore</cell><cell cols="2">a, essa, trice @, tor@</cell></row><row><cell>&lt;ENDP&gt;</cell><cell>portion of the word differentiating gendered forms, plural</cell><cell>i, tori</cell><cell cols="2">e, esse, trici @, tor@</cell></row><row><cell>&lt;DARTS&gt;</cell><cell>definite article, singular</cell><cell>il, lo, l'</cell><cell>la, l'</cell><cell>l@</cell></row><row><cell>&lt;DARTP&gt;</cell><cell>definite article, plural</cell><cell>i, gli</cell><cell>le</cell><cell>l@</cell></row><row><cell>&lt;IART&gt;</cell><cell>indefinite article</cell><cell>uno, un</cell><cell>una, un'</cell><cell>un@</cell></row><row><cell>&lt;PARTP&gt;</cell><cell>partitive article, plural</cell><cell>dei, degli</cell><cell>delle</cell><cell>de@</cell></row><row><cell>&lt;PREPdiS&gt;</cell><cell>articulated preposition with root 'di', singular</cell><cell>del, dello, dell'</cell><cell>della, dell'</cell><cell>dell@</cell></row><row><cell>&lt;PREPdiP&gt;</cell><cell>articulated preposition with root 'di', plural</cell><cell>dei, degli</cell><cell>delle</cell><cell>dell@</cell></row><row><cell>&lt;PREPaS&gt;</cell><cell>articulated preposition with root 'a', singular</cell><cell>al, allo, all'</cell><cell>alla, all'</cell><cell>all@</cell></row><row><cell>&lt;PREPaP&gt;</cell><cell>articulated preposition with root 'a', plural</cell><cell>agli, ai</cell><cell>alle</cell><cell>all@</cell></row><row><cell>&lt;PREPdaS&gt;</cell><cell>articulated preposition with root 'da', singular</cell><cell>dal, dallo, dall'</cell><cell>dalla, dall'</cell><cell>dall@</cell></row><row><cell>&lt;PREPdaP&gt;</cell><cell>articulated preposition with root 'da', plural</cell><cell>dagli</cell><cell>dalle</cell><cell>dall@</cell></row><row><cell>&lt;PREPinP&gt;</cell><cell>articulated preposition with root 'in', plural</cell><cell>negli</cell><cell>nelle</cell><cell>nell@</cell></row><row><cell>&lt;PREPsuS&gt;</cell><cell>articulated preposition with root 'su', singular</cell><cell>sul, sullo, sull'</cell><cell>sulla, sull'</cell><cell>sull@</cell></row><row><cell>&lt;PREPsuP&gt;</cell><cell>articulated preposition with root 'su', plural</cell><cell>sugli</cell><cell>sulle</cell><cell>sull@</cell></row><row><cell cols="2">&lt;DADJquelS&gt; demonstrative adjective (far), singular</cell><cell cols="3">quel, quello, quell' quella, quell' quell@</cell></row><row><cell cols="2">&lt;DADJquelP&gt; demonstrative adjective (far), plural</cell><cell>quegli</cell><cell>quelle</cell><cell>quell@</cell></row><row><cell cols="2">&lt;DADJquestS&gt; demonstrative adjective (near), singular</cell><cell>questo, quest'</cell><cell cols="2">questa, quest' quest@</cell></row><row><cell cols="2">&lt;DADJquestP&gt; demonstrative adjective (near), plural</cell><cell>questi</cell><cell>queste</cell><cell>quest@</cell></row><row><cell>&lt;POSS1S&gt;</cell><cell>possessive adjective, 1st person singular, singular</cell><cell>mio</cell><cell>mia</cell><cell>mi@</cell></row><row><cell>&lt;POSS1P&gt;</cell><cell>possessive adjective, 1st person singular, plural</cell><cell>miei</cell><cell>mie</cell><cell>mi@</cell></row><row><cell>&lt;POSS2S&gt;</cell><cell>possessive adjective, 2nd person singular, singular</cell><cell>tuo</cell><cell>tua</cell><cell>tu@</cell></row><row><cell>&lt;POSS2P&gt;</cell><cell>possessive adjective, 2nd person singular, plural</cell><cell>tuoi</cell><cell>tue</cell><cell>tu@</cell></row><row><cell>&lt;POSS3S&gt;</cell><cell>possessive adjective, 3rd person singular, singular</cell><cell>suo</cell><cell>sua</cell><cell>su@</cell></row><row><cell>&lt;POSS3P&gt;</cell><cell>possessive adjective, 3rd person singular, plural</cell><cell>suoi</cell><cell>sue</cell><cell>su@</cell></row><row><cell>&lt;POSS4S&gt;</cell><cell>possessive adjective, 1st person plural, singular</cell><cell>nostro</cell><cell>nostra</cell><cell>nostr@</cell></row><row><cell>&lt;POSS4P&gt;</cell><cell>possessive adjective, 1st person plural, plural</cell><cell>nostri</cell><cell>nostre</cell><cell>nostr@</cell></row><row><cell cols="2">&lt;PRONDOBJS&gt; direct object pronoun, singular</cell><cell>lo</cell><cell>la</cell><cell>l@</cell></row><row><cell cols="2">&lt;PRONDOBJP&gt; direct object pronoun, plural</cell><cell>li</cell><cell>le</cell><cell>l@</cell></row></table></figure>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="1" xml:id="foot_0">In this report, we refer to innovative gender-fair strategies such as the schwa as "neomorphemes". Although aware that this terminology is controversial, we adopted it for simplicity and do not intend our terminology to imply any substantive stance.</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="2" xml:id="foot_1">We indicate the innovative forms with "INN" in the glosses.</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="3" xml:id="foot_2">https://github.com/simonasnow/GFL-it-Dataset</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="4" xml:id="foot_3">https://huggingface.co/datasets/FBK-MT/GeNTE</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="5" xml:id="foot_4">https://huggingface.co/datasets/FBK-MT/Neo-GATE</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="6" xml:id="foot_5">For the purpose of the task 2, only the conservative obscured reformulations have been released in this version of the dataset.</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="7" xml:id="foot_6">For task 2, we used a classifier that distinguishes between gendered and gender-neutral texts (see Section 4). Hence, we only used the GFL-it texts where the annotators identified gendered expressions (= gendered class) and the texts for which annotators provided at least one conservative obscured reformulation (= gender-neutral class) for a total amount of 1,206 texts.</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="8" xml:id="foot_7">We here used neutro (neutral/neuter), despite being aware of its ambiguity with neuter, a grammatical gender not present in the Italian linguistic system. However, nothing substantive hinges on this terminological choice.</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="9" xml:id="foot_8">https://huggingface.co/spaces/evaluate-metric/bertscore</note>
		</body>
		<back>

			<div type="acknowledgement">
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="8.">Acknowledgments</head><p>Beatrice Savoldi is supported by the PNRR project FAIR -Future AI Research (PE00000013), under the NRRP MUR program funded by the NextGenerationEU. Luisa Bentivogli is funded by the Horizon Europe research and innovation programme, under grant agreement No 101135798, project Meetween (My Personal AI Mediator for Virtual MEETtings BetWEEN People). The work of Viviana Patti and Marco Madeddu is supported by "HAR-MONIA" project -M4-C2, I1.3 Partenariati Estesi -Cascade Call -FAIR -CUP C63C22000770006 -PE PE0000013 under the NextGenerationEU programme.</p><p>The annotation of GFL-it has been partially funded by Università degli Studi di Brescia as part of the actions provided for by the Gender Equality Plan.</p></div>
			</div>

			<div type="references">

				<listBibl>

<biblStruct xml:id="b0">
	<analytic>
		<title level="a" type="main">Beyond obscuration and visibility: Thoughts on the different strategies of gender-fair language in italian</title>
		<author>
			<persName><forename type="first">M</forename><surname>Rosola</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Frenda</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">T</forename><surname>Cignarella</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Pellegrini</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Marra</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Floris</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 9th Italian Conference on Computational Linguistics</title>
				<meeting>the 9th Italian Conference on Computational Linguistics<address><addrLine>Venice, Italy</addrLine></address></meeting>
		<imprint>
			<publisher>CEUR-WS</publisher>
			<date type="published" when="2023-11-30">2023. November 30-December 2, 2023. 2023</date>
			<biblScope unit="volume">3596</biblScope>
			<biblScope unit="page" from="1" to="10" />
		</imprint>
	</monogr>
	<note>CLiC-it</note>
</biblStruct>

<biblStruct xml:id="b1">
	<analytic>
		<title level="a" type="main">Generic Masculine Words and Thinking</title>
		<author>
			<persName><forename type="first">J</forename><surname>Silveira</surname></persName>
		</author>
		<ptr target="https://www.sciencedirect.com/science/article/pii/S0148068580921132" />
	</analytic>
	<monogr>
		<title level="j">Women&apos;s Studies International Quarterly</title>
		<imprint>
			<biblScope unit="volume">3</biblScope>
			<biblScope unit="page" from="165" to="178" />
			<date type="published" when="1980">1980</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b2">
	<analytic>
		<title level="a" type="main">The masculine form in grammatically gendered languages and its multiple interpretations: A challenge for our cognitive system</title>
		<author>
			<persName><forename type="first">P</forename><surname>Gygax</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Sato</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Öttl</surname></persName>
		</author>
		<author>
			<persName><forename type="first">U</forename><surname>Gabriel</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Language Sciences</title>
		<imprint>
			<biblScope unit="volume">83</biblScope>
			<biblScope unit="page">101328</biblScope>
			<date type="published" when="2021">2021</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b3">
	<analytic>
		<title level="a" type="main">The debate on language and gender in italy, from the visibility of women to inclusive language (1980s-2020s)</title>
		<author>
			<persName><forename type="first">G</forename><surname>Sulis</surname></persName>
		</author>
		<author>
			<persName><forename type="first">V</forename><surname>Gheno</surname></persName>
		</author>
		<idno type="DOI">10.1080/02614340.2022.2125707</idno>
	</analytic>
	<monogr>
		<title level="j">The Italianist</title>
		<imprint>
			<biblScope unit="volume">42</biblScope>
			<biblScope unit="page" from="153" to="183" />
			<date type="published" when="2022">2022</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b4">
	<analytic>
		<title level="a" type="main">across Languages, Beyond pronouns</title>
		<author>
			<persName><forename type="first">G</forename><surname>Visibility</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">The Oxford Handbook of Applied Philosophy of Language</title>
				<imprint>
			<date type="published" when="2024">2024</date>
			<biblScope unit="page">320</biblScope>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b5">
	<analytic>
		<title level="a" type="main">Linguistic hermeneutical injustice</title>
		<author>
			<persName><forename type="first">M</forename><surname>Rosola</surname></persName>
		</author>
		<idno type="DOI">10.1080/02691728.2024.2401143</idno>
	</analytic>
	<monogr>
		<title level="j">Social Epistemology</title>
		<imprint>
			<date type="published" when="2024">2024</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b6">
	<analytic>
		<title level="a" type="main">Misgendering and its moral contestability</title>
		<author>
			<persName><forename type="first">S</forename><forename type="middle">J</forename><surname>Kapusta</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Hypatia</title>
		<imprint>
			<biblScope unit="volume">31</biblScope>
			<biblScope unit="page" from="502" to="519" />
			<date type="published" when="2016">2016</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b7">
	<monogr>
		<author>
			<persName><forename type="first">R</forename><surname>Dembroff</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Wodak</surname></persName>
		</author>
		<author>
			<persName><forename type="first">/</forename><surname>He</surname></persName>
		</author>
		<title level="m">she/they/ze</title>
				<imprint>
			<publisher>Ergo</publisher>
			<date type="published" when="2018">2018</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b8">
	<analytic>
		<title level="a" type="main">Can genderfair language reduce gender stereotyping and discrimination?</title>
		<author>
			<persName><forename type="first">S</forename><surname>Sczesny</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Formanowicz</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Moser</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Frontiers in psychology</title>
		<imprint>
			<biblScope unit="volume">7</biblScope>
			<biblScope unit="page">154379</biblScope>
			<date type="published" when="2016">2016</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b9">
	<monogr>
		<author>
			<persName><forename type="first">P</forename><surname>Gygax</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Zufferey</surname></persName>
		</author>
		<author>
			<persName><forename type="first">U</forename><surname>Gabriel</surname></persName>
		</author>
		<title level="m">Le cerveau pense-til au masculin, Cerveau, langage et représentations sexistes</title>
				<meeting><address><addrLine>Paris</addrLine></address></meeting>
		<imprint>
			<publisher>Le Robert</publisher>
			<date type="published" when="2021">2021</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b10">
	<analytic>
		<title level="a" type="main">Language (technology) is power: A critical survey of &quot;bias&quot; in NLP</title>
		<author>
			<persName><forename type="first">S</forename><forename type="middle">L</forename><surname>Blodgett</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Barocas</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Daumé</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Iii</forename></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Wallach</surname></persName>
		</author>
		<idno type="DOI">10.18653/v1/2020.acl-main.485</idno>
		<ptr target="https://aclanthology.org/2020.acl-main.485.doi:10.18653/v1/2020.acl-main.485" />
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, Association for Computational Linguistics</title>
				<editor>
			<persName><forename type="first">D</forename><surname>Jurafsky</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">J</forename><surname>Chai</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">N</forename><surname>Schluter</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">J</forename><surname>Tetreault</surname></persName>
		</editor>
		<meeting>the 58th Annual Meeting of the Association for Computational Linguistics, Association for Computational Linguistics</meeting>
		<imprint>
			<date type="published" when="2020">2020</date>
			<biblScope unit="page" from="5454" to="5476" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b11">
	<analytic>
		<title level="a" type="main">A prompt response to the demand for automatic gender-neutral translation</title>
		<author>
			<persName><forename type="first">B</forename><surname>Savoldi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Piergentili</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Fucci</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Negri</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Bentivogli</surname></persName>
		</author>
		<ptr target="https://aclanthology.org/2024.eacl-short.23" />
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 18th Conference of the European Chapter of the Association for Computational Linguistics</title>
				<editor>
			<persName><forename type="first">Y</forename><surname>Graham</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">M</forename><surname>Purver</surname></persName>
		</editor>
		<meeting>the 18th Conference of the European Chapter of the Association for Computational Linguistics<address><addrLine>St. Julian&apos;s, Malta</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2024">2024</date>
			<biblScope unit="volume">2</biblScope>
			<biblScope unit="page" from="256" to="267" />
		</imprint>
	</monogr>
	<note>: Short Papers), Association for Computational Linguistics</note>
</biblStruct>

<biblStruct xml:id="b12">
	<analytic>
		<title level="a" type="main">CALAMITA: Challenge the Abilities of LAnguage Models in ITAlian</title>
		<author>
			<persName><forename type="first">G</forename><surname>Attanasio</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Basile</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Borazio</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Croce</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Francis</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Gili</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Musacchio</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Nissim</surname></persName>
		</author>
		<author>
			<persName><forename type="first">V</forename><surname>Patti</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Rinaldi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Scalena</surname></persName>
		</author>
		<ptr target="CEUR-WS.org" />
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 10th Italian Conference on Computational Linguistics (CLiC-it 2024)</title>
		<title level="s">CEUR Workshop Proceedings</title>
		<meeting>the 10th Italian Conference on Computational Linguistics (CLiC-it 2024)<address><addrLine>Pisa, Italy</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2024-12-06">December 4 -December 6, 2024. 2024</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b13">
	<analytic>
		<title level="a" type="main">tivogli, Hi guys or hi folks? benchmarking genderneutral machine translation with the GeNTE corpus</title>
		<author>
			<persName><forename type="first">A</forename><surname>Piergentili</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Savoldi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Fucci</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Negri</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Ben</surname></persName>
		</author>
		<idno type="DOI">10.18653/v1/2023.emnlp-main.873</idno>
		<ptr target="https://aclanthology.org/2023.emnlp-main.873.doi:10.18653/v1/2023.emnlp-main.873" />
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing</title>
		<title level="s">Association for Computational Linguistics</title>
		<editor>
			<persName><forename type="first">H</forename><surname>Bouamor</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">J</forename><surname>Pino</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">K</forename><surname>Bali</surname></persName>
		</editor>
		<meeting>the 2023 Conference on Empirical Methods in Natural Language Processing<address><addrLine>Singapore</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2023">2023</date>
			<biblScope unit="page" from="14124" to="14140" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b14">
	<analytic>
		<title level="a" type="main">Enhancing gender-inclusive machine translation with neomorphemes and large language models</title>
		<author>
			<persName><forename type="first">A</forename><surname>Piergentili</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Savoldi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Negri</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Bentivogli</surname></persName>
		</author>
		<ptr target="https://aclanthology.org/2024.eamt-1.25" />
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 25th Annual Conference of the European Association for Machine Translation (Volume 1</title>
				<editor>
			<persName><forename type="first">C</forename><surname>Scarton</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">C</forename><surname>Prescott</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">C</forename><surname>Bayliss</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">C</forename><surname>Oakley</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">J</forename><surname>Wright</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">S</forename><surname>Wrigley</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">X</forename><surname>Song</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">E</forename><surname>Gow-Smith</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">R</forename><surname>Bawden</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">V</forename><forename type="middle">M</forename><surname>Sánchez-Cartagena</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">P</forename><surname>Cadwell</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">E</forename><surname>Lapshinova-Koltunski</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">V</forename><surname>Cabarrão</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">K</forename><surname>Chatzitheodorou</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">M</forename><surname>Nurminen</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">D</forename><surname>Kanojia</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">H</forename><surname>Moniz</surname></persName>
		</editor>
		<meeting>the 25th Annual Conference of the European Association for Machine Translation (Volume 1<address><addrLine>Sheffield, UK</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2024">2024</date>
			<biblScope unit="page" from="300" to="314" />
		</imprint>
	</monogr>
	<note>European Association for Machine Translation (EAMT)</note>
</biblStruct>

<biblStruct xml:id="b15">
	<analytic>
		<title level="a" type="main">Gender neutralization for an inclusive machine translation: from theoretical foundations to open challenges</title>
		<author>
			<persName><forename type="first">A</forename><surname>Piergentili</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Fucci</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Savoldi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Bentivogli</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Negri</surname></persName>
		</author>
		<ptr target="https://aclanthology.org/2023.gitt-1.7" />
	</analytic>
	<monogr>
		<title level="m">Proceedings of the First Workshop on Gender-Inclusive Translation Technologies, European Association for Machine Translation</title>
				<editor>
			<persName><forename type="first">E</forename><surname>Vanmassenhove</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">B</forename><surname>Savoldi</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">L</forename><surname>Bentivogli</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">J</forename><surname>Daems</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">J</forename><surname>Hackenbuchner</surname></persName>
		</editor>
		<meeting>the First Workshop on Gender-Inclusive Translation Technologies, European Association for Machine Translation<address><addrLine>Tampere, Finland</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2023">2023</date>
			<biblScope unit="page" from="71" to="83" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b16">
	<analytic>
		<title level="a" type="main">Europarl: A Parallel Corpus for Statistical Machine Translation</title>
		<author>
			<persName><forename type="first">P</forename><surname>Koehn</surname></persName>
		</author>
		<ptr target="http://mt-archive.info/MTS-2005-Koehn.pdf" />
	</analytic>
	<monogr>
		<title level="m">Proceedings of the tenth Machine Translation Summit</title>
				<meeting>the tenth Machine Translation Summit<address><addrLine>Phuket, TH</addrLine></address></meeting>
		<imprint>
			<publisher>AAMT</publisher>
			<date type="published" when="2005">2005</date>
			<biblScope unit="page" from="79" to="86" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b17">
	<analytic>
		<title level="a" type="main">GATE: A challenge set for gender-ambiguous translation examples</title>
		<author>
			<persName><forename type="first">S</forename><surname>Rarrick</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Naik</surname></persName>
		</author>
		<author>
			<persName><forename type="first">V</forename><surname>Mathur</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Poudel</surname></persName>
		</author>
		<author>
			<persName><forename type="first">V</forename><surname>Chowdhary</surname></persName>
		</author>
		<idno type="DOI">10.1145/3600211.3604675</idno>
		<idno>doi:10.1145/ 3600211.3604675</idno>
		<ptr target="https://doi.org/10.1145/3600211.3604675" />
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 2023 AAAI/ACM Conference on AI, Ethics, and Society, AIES &apos;23</title>
				<meeting>the 2023 AAAI/ACM Conference on AI, Ethics, and Society, AIES &apos;23<address><addrLine>New York, NY, USA</addrLine></address></meeting>
		<imprint>
			<publisher>Association for Computing Machinery</publisher>
			<date type="published" when="2023">2023</date>
			<biblScope unit="page" from="845" to="854" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b18">
	<analytic>
		<title level="a" type="main">Genere e igiene verbale: l&apos;uso di forme con @ in italiano, Annali Del Dipartimento Di Studi Letterari, Linguistici E Comparati</title>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">M</forename><surname>Thornton</surname></persName>
		</author>
		<idno type="DOI">10.6093/2281-6585/9623</idno>
		<ptr target="https://doi.org/10.6093/2281-6585/9623" />
	</analytic>
	<monogr>
		<title level="j">Sezione Linguistica</title>
		<imprint>
			<biblScope unit="volume">11</biblScope>
			<biblScope unit="page" from="11" to="54" />
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b19">
	<analytic>
		<title level="a" type="main">Italian proposal for non-binary and inclusive language: The schwa as a non-gender-specific ending</title>
		<author>
			<persName><forename type="first">R</forename><surname>Baiocco</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Rosati</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Pistella</surname></persName>
		</author>
		<idno type="DOI">10.1080/19359705.2023.2183537</idno>
		<idno>doi:10. 1080/19359705.2023.2183537</idno>
		<ptr target="https://doi.org/10.1080/19359705.2023.2183537" />
	</analytic>
	<monogr>
		<title level="j">Journal of Gay &amp; Lesbian Mental Health</title>
		<imprint>
			<biblScope unit="volume">27</biblScope>
			<biblScope unit="page" from="248" to="253" />
			<date type="published" when="2023">2023</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b20">
	<monogr>
		<title level="m" type="main">Gender-specific machine translation with large language models</title>
		<author>
			<persName><forename type="first">E</forename><surname>Sánchez</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Andrews</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Stenetorp</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Artetxe</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">R</forename><surname>Costa-Jussà</surname></persName>
		</author>
		<ptr target="https://arxiv.org/abs/2309.03175.arXiv:2309.03175" />
		<imprint>
			<date type="published" when="2024">2024</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b21">
	<analytic>
		<title level="a" type="main">BERTScore: Evaluating text generation with BERT</title>
		<author>
			<persName><forename type="first">T</forename><surname>Zhang</surname></persName>
		</author>
		<author>
			<persName><forename type="first">*</forename></persName>
		</author>
		<author>
			<persName><forename type="first">V</forename><surname>Kishore</surname></persName>
		</author>
		<author>
			<persName><forename type="first">*</forename></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Wu</surname></persName>
		</author>
		<author>
			<persName><forename type="first">*</forename></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><forename type="middle">Q</forename><surname>Weinberger</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Y</forename><surname>Artzi</surname></persName>
		</author>
		<ptr target="https://openreview.net/forum?id=SkeHuCVFDr" />
	</analytic>
	<monogr>
		<title level="m">International Conference on Learning Representations</title>
				<imprint>
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b22">
	<monogr>
		<title level="m" type="main">Lo schwa tra fantasia e norma</title>
		<author>
			<persName><forename type="first">V</forename><surname>Gheno</surname></persName>
		</author>
		<ptr target="https://lafalla.cassero.it/lo-schwa-tra-fantasia-e-norma/" />
		<imprint>
			<date type="published" when="2020">2020</date>
			<pubPlace>La falla</pubPlace>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b23">
	<monogr>
		<author>
			<persName><forename type="first">L</forename><surname>Iacopini</surname></persName>
		</author>
		<ptr target="https://webaccessibile.org/approfondimenti/lo-schwa-%C7%9D-che-rende-linclusione-inaccessibile/" />
		<title level="m">Lo schwa (ǝ) che rende l&apos;inclusione inaccessibile</title>
				<imprint>
			<date type="published" when="2021">2021</date>
		</imprint>
	</monogr>
	<note>Web accessibile</note>
</biblStruct>

<biblStruct xml:id="b24">
	<monogr>
		<title level="m" type="main">L&apos;emancipazione grammaticale non passa per una e rovesciata</title>
		<author>
			<persName><forename type="first">C</forename><forename type="middle">D</forename><surname>Santis</surname></persName>
		</author>
		<ptr target="https://www.treccani.it/magazine/lingua_italiana/articoli/scritto_e_parlato/Schwa.html" />
		<imprint>
			<date type="published" when="2022">2022</date>
		</imprint>
	</monogr>
</biblStruct>

				</listBibl>
			</div>
		</back>
	</text>
</TEI>
