<?xml version="1.0" encoding="UTF-8"?>
<TEI xml:space="preserve" xmlns="http://www.tei-c.org/ns/1.0" 
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" 
xsi:schemaLocation="http://www.tei-c.org/ns/1.0 https://raw.githubusercontent.com/kermitt2/grobid/master/grobid-home/schemas/xsd/Grobid.xsd"
 xmlns:xlink="http://www.w3.org/1999/xlink">
	<teiHeader xml:lang="en">
		<fileDesc>
			<titleStmt>
				<title level="a" type="main">Integrating Terminological and Ontological Principles into a Lexicographic Resource</title>
			</titleStmt>
			<publicationStmt>
				<publisher/>
				<availability status="unknown"><licence/></availability>
			</publicationStmt>
			<sourceDesc>
				<biblStruct>
					<analytic>
						<author>
							<persName><forename type="first">Rute</forename><surname>Costa</surname></persName>
							<email>rute.costa@fcsh.unl.pt</email>
							<affiliation key="aff0">
								<orgName type="department">CLUNL -Centro de Linguística</orgName>
								<orgName type="institution">Universidade Nova de Lisboa</orgName>
								<address>
									<settlement>Lisboa</settlement>
									<country key="PT">Portugal</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Ana</forename><surname>Salgado</surname></persName>
							<email>anacastrosalgado@gmail.com</email>
							<affiliation key="aff0">
								<orgName type="department">CLUNL -Centro de Linguística</orgName>
								<orgName type="institution">Universidade Nova de Lisboa</orgName>
								<address>
									<settlement>Lisboa</settlement>
									<country key="PT">Portugal</country>
								</address>
							</affiliation>
							<affiliation key="aff1">
								<orgName type="institution">Academia das Ciências de Lisboa</orgName>
								<address>
									<settlement>Lisboa</settlement>
									<country key="PT">Portugal</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Margarida</forename><surname>Ramos</surname></persName>
							<email>mvramos@fcsh.unl.pt</email>
							<affiliation key="aff0">
								<orgName type="department">CLUNL -Centro de Linguística</orgName>
								<orgName type="institution">Universidade Nova de Lisboa</orgName>
								<address>
									<settlement>Lisboa</settlement>
									<country key="PT">Portugal</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Fahad</forename><surname>Khan</surname></persName>
							<email>fahad.khan@ilc.cnr.it</email>
							<affiliation key="aff2">
								<orgName type="institution">CNR -Istituto di Linguistica Computazionale &quot;Antonio Zampolli&quot;</orgName>
								<address>
									<settlement>Pisa</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Sara</forename><surname>Carvalho</surname></persName>
							<email>sara.carvalho@ua.pt</email>
							<affiliation key="aff0">
								<orgName type="department">CLUNL -Centro de Linguística</orgName>
								<orgName type="institution">Universidade Nova de Lisboa</orgName>
								<address>
									<settlement>Lisboa</settlement>
									<country key="PT">Portugal</country>
								</address>
							</affiliation>
							<affiliation key="aff3">
								<orgName type="institution">CLLC -Centro de Línguas, Literaturas e Culturas</orgName>
								<address>
									<settlement>Aveiro</settlement>
									<country key="PT">Portugal</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Toma</forename><surname>Tasovac</surname></persName>
							<email>ttasovac@humanistika.org</email>
							<affiliation key="aff4">
								<orgName type="institution">BCDH -Belgrade Center for Digital Humanities</orgName>
								<address>
									<settlement>Belgrade</settlement>
									<country key="RS">Serbia</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Bruno</forename><surname>Almeida</surname></persName>
							<email>brunoalmeida@fcsh.unl.pt</email>
							<affiliation key="aff0">
								<orgName type="department">CLUNL -Centro de Linguística</orgName>
								<orgName type="institution">Universidade Nova de Lisboa</orgName>
								<address>
									<settlement>Lisboa</settlement>
									<country key="PT">Portugal</country>
								</address>
							</affiliation>
							<affiliation key="aff5">
								<orgName type="institution">ROSSIO - ROSSIO Infrastructure - Social Sciences, Arts and Humanities</orgName>
								<address>
									<settlement>Lisboa</settlement>
									<country key="PT">Portugal</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Mohamed</forename><surname>Khemakhem</surname></persName>
							<email>mohamed.khemakhem@inria.fr</email>
							<affiliation key="aff6">
								<orgName type="institution">ArcaScience</orgName>
								<address>
									<settlement>Paris</settlement>
									<country key="FR">France</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Laurent</forename><surname>Romary</surname></persName>
							<email>laurent.romary@inria.fr</email>
							<affiliation key="aff7">
								<orgName type="laboratory">ALMAnaCH - Automatic Language Modelling and ANAlysis &amp; Computational Humanities</orgName>
								<orgName type="institution">INRIA</orgName>
								<address>
									<settlement>Paris</settlement>
									<country key="FR">France</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Raquel</forename><surname>Silva</surname></persName>
							<email>raq.silva@fcsh.unl.pt</email>
							<affiliation key="aff0">
								<orgName type="department">CLUNL -Centro de Linguística</orgName>
								<orgName type="institution">Universidade Nova de Lisboa</orgName>
								<address>
									<settlement>Lisboa</settlement>
									<country key="PT">Portugal</country>
								</address>
							</affiliation>
						</author>
						<author>
							<affiliation key="aff8">
								<orgName type="department">International Conference on &quot;Multilingual digital terminology today. Design</orgName>
								<orgName type="institution">representation formats and management systems&quot;</orgName>
								<address>
									<addrLine>June 16 -17</addrLine>
									<settlement>Padova</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<title level="a" type="main">Integrating Terminological and Ontological Principles into a Lexicographic Resource</title>
					</analytic>
					<monogr>
						<imprint>
							<date/>
						</imprint>
					</monogr>
					<idno type="MD5">F9742829612FAFA10C0D84C5CC9ADC9A</idno>
				</biblStruct>
			</sourceDesc>
		</fileDesc>
		<encodingDesc>
			<appInfo>
				<application version="0.7.2" ident="GROBID" when="2023-03-24T18:02+0000">
					<desc>GROBID - A machine learning software for extracting information from scholarly documents</desc>
					<ref target="https://github.com/kermitt2/grobid"/>
				</application>
			</appInfo>
		</encodingDesc>
		<profileDesc>
			<textClass>
				<keywords>
					<term>dictionary</term>
					<term>lexicography</term>
					<term>digital humanities</term>
					<term>standards</term>
				</keywords>
			</textClass>
			<abstract>
<div xmlns="http://www.tei-c.org/ns/1.0"><p>In this paper we will present the research that is taking place at the NOVA CLUNL<ref type="foot" target="#foot_0">1</ref> where an international team is working on a financed project MORDigital<ref type="foot" target="#foot_1">2</ref>. MORDigital's goal is to encode the selected editions of Diccionario da Lingua Portugueza by António de Morais Silva (MOR), first published in 1789.</p></div>
			</abstract>
		</profileDesc>
	</teiHeader>
	<text xml:lang="en">
		<body>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="1.">Introduction</head><p>MORDigital's ultimate goals are, on the one hand, to promote accessibility to cultural heritage while fostering reusability and, on the other hand, to contribute towards a more significant presence of lexicographic digital content in Portuguese through open tools and standards. MOR represents a significant legacy, since it marks the beginning of Portuguese dictionaries, having served as a model for all subsequent lexicographic production. The team follows a new paradigm in lexicography, which results from the convergence between lexicography, terminology, computational linguistics, and ontologies as an integral part of digital humanities and linked (open) data. In the Portuguese context, this research fills a gap concerning searchable online retrodigitised dictionaries, built on current standards and methodologies which promote data sharing and harmonisation, namely TEI Lex-0<ref type="foot" target="#foot_2">4</ref> and Ontolex-Lemon<ref type="foot" target="#foot_3">5</ref> . The team will further ensure the connection to other existing systems and lexical resources, particularly in the Portuguese-speaking world.</p><p>For this paper, after posing the theoretical background (terminology and lexicography) that underpins our methodology, we will present 4 interrelated tasks:</p><p>1. Structuration of MOR's digitised versions using GROBID-Dictionaries<ref type="foot" target="#foot_4">6</ref> , a specific software for the parsing, extraction and structuring of information extracted from dictionary text. In our case, the tool will be used to parse the constituent parts of each dictionary entry, which involves the preparation of a native encoding format that is compliant with the XML/TEI metamodel. 2. 
Presentation of a systematic analysis of the Mathematical Sciences and Medical Sciences domains, their related domain labels <ref type="bibr" target="#b5">[6]</ref>, <ref type="bibr" target="#b0">[1]</ref> and other mechanisms, such as the use of formulae present in the definition which identifies the specialised field of knowledge. We will propose a hierarchical organisation that constitutes the foundation of domain ontologies. 3. Representation of the model in OWL resorting to Protégé<ref type="foot" target="#foot_5">7</ref> , a free, open-source ontology editor. This means each class or individual in the ontology will be assigned a URI (Uniform Resource Identifier), used to reference the label present in each of the lexicographic entries in accordance - whenever possible - with the TEI schemas. 4. Conversion of the TEI Lex-0 output of Task 4 into linked data using the RDF-based model Ontolex-Lemon; the conversion will be based on work already carried out in the scope of previous initiatives in rendering the two models more interoperable. The Ontolex-Lemon model has recently been extended by a lexicography module -lexicog<ref type="foot" target="#foot_6">8</ref> -, which facilitates interoperability in modelling dictionaries as linked data.</p><p>At the end of the paper, we will discuss the results, highlighting the challenges that we faced.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.">Acknowledgements</head><p>This paper is supported by the MORDigital -Digitalização do Diccionario da Lingua Portugueza de António de Morais Silva [PTDC/LLT-LIN/6841/2020] project financed by the Portuguese National Funding through the FCT -Fundação para a Ciência e Tecnologia.</p></div>			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="1" xml:id="foot_0">https://clunl.fcsh.unl.pt/grupos_clunl/lexicologia-lexicografia-terminologia/</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="2" xml:id="foot_1">https://www.fct.pt/apoios/projectos/consulta/vglobal_projecto?idProjecto=164850&amp;idElemConcurso=14818</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="4" xml:id="foot_2">https://dariah-eric.github.io/lexicalresources/pages/TEILex0/TEILex0.html</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="5" xml:id="foot_3">https://www.w3.org/community/ontolex/</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="6" xml:id="foot_4">https://github.com/MedKhem/grobid-dictionaries</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="7" xml:id="foot_5">https://protege.stanford.edu/</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="8" xml:id="foot_6">https://www.w3.org/2019/09/lexicog/</note>
		</body>
		<back>
			<div type="references">

				<listBibl>

<biblStruct xml:id="b0">
	<analytic>
		<title level="a" type="main">Ontologie des marques de domaines appliquée aux dictionnaires de langue générale</title>
		<author>
			<persName><forename type="first">R</forename><surname>Costa</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Carvalho</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Salgado</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Simões</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><surname>Tasovac</surname></persName>
		</author>
		<idno>ISSN numérique 2684-6691</idno>
	</analytic>
	<monogr>
		<title level="m">La lexicographie en tant que méthodologie de recherche en linguistique Revue de Philologie Française et Romane -Langue(s) &amp; Parole</title>
				<imprint>
			<date type="published" when="2020">2020</date>
			<biblScope unit="volume">5</biblScope>
			<biblScope unit="page" from="201" to="230" />
		</imprint>
	</monogr>
	<note>Mons: Edition du CIPA</note>
</biblStruct>

<biblStruct xml:id="b1">
	<analytic>
		<title level="a" type="main">SKOS as a key element for linking lexicography to digital humanities. Information Organization in Digital Humanities: A Global Perspective</title>
		<author>
			<persName><forename type="first">R</forename><surname>Costa</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Salgado</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Almeida</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Coll. Digital Research in the Arts and Humanities</title>
				<editor>
			<persName><forename type="first">Koraljka</forename><surname>Golub</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">Ying-Hsang</forename><surname>Liu</surname></persName>
		</editor>
		<imprint>
			<publisher>Routledge</publisher>
			<date type="published" when="2021">2021</date>
			<biblScope unit="page" from="178" to="204" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b2">
	<analytic>
		<title level="a" type="main">MORDigital: the advent of a new lexicographical Portuguese project. Electronic lexicography in the 21st century</title>
		<author>
			<persName><forename type="first">R</forename><surname>Costa</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Salgado</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Khan</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Carvalho</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Romary</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Almeida</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Khemakhem</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Ramos</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Silva</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><surname>Tasovac</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the eLex 2021 conference</title>
				<meeting>the eLex 2021 conference<address><addrLine>Brno, Czech Republic</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2021">2021</date>
			<biblScope unit="page" from="321" to="324" />
		</imprint>
	</monogr>
	<note>Lexical Computing CZ s.r.o.</note>
</biblStruct>

<biblStruct xml:id="b3">
	<analytic>
		<title level="a" type="main">Modelling Lexicographic Resources Using CIDOC CRM, FRBRoo and Ontolex Lemon</title>
		<author>
			<persName><forename type="first">F</forename><surname>Khan</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Salgado</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the International Joint Workshop on Semantic Web and Ontology Design for Cultural Heritage co-located with the Bolzano Summer of Knowledge 2021 (BOSK 2021)</title>
				<editor>
			<persName><forename type="first">A</forename><surname>Bikakis</surname></persName>
		</editor>
		<meeting>the International Joint Workshop on Semantic Web and Ontology Design for Cultural Heritage co-located with the Bolzano Summer of Knowledge 2021 (BOSK 2021)<address><addrLine>Bozen-Bolzano</addrLine></address></meeting>
		<imprint>
			<publisher>CEUR-WS</publisher>
			<date type="published" when="2021">2021</date>
			<biblScope unit="page" from="1" to="12" />
		</imprint>
	</monogr>
	<note>SWODCH 2021 -Semantic Web and Ontology Design for Cultural Heritage 2021</note>
</biblStruct>

<biblStruct xml:id="b4">
	<analytic>
		<title level="a" type="main">Modelling Etymology in LMF/TEI: The &apos;Grande Dicionário Houaiss da Língua Portuguesa&apos; Dictionary as a Use Case</title>
		<author>
			<persName><forename type="first">F</forename><surname>Khan</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Romary</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Salgado</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Bowers</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Khemakhem</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><surname>Tasovac</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">LREC 2020 Conference Proceedings</title>
				<editor>
			<persName><forename type="first">N</forename><surname>Calzolari</surname></persName>
		</editor>
		<meeting><address><addrLine>Paris</addrLine></address></meeting>
		<imprint>
			<publisher>ELRA</publisher>
			<date type="published" when="2020">2020</date>
			<biblScope unit="page" from="3172" to="3180" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b5">
	<analytic>
		<title level="a" type="main">Marcas temáticas en los diccionarios académicos ibéricos: estudio comparativo</title>
		<author>
			<persName><forename type="first">A</forename><surname>Salgado</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Costa</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">RILEX: Revista sobre investigaciones léxicas</title>
		<idno type="ISSN">2605-3136</idno>
		<imprint>
			<biblScope unit="volume">2</biblScope>
			<biblScope unit="issue">2</biblScope>
			<biblScope unit="page" from="37" to="63" />
			<date type="published" when="2019">2019</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b6">
	<analytic>
		<title level="a" type="main">Improving the consistency of usage labelling in dictionaries with TEI Lex-0</title>
		<author>
			<persName><forename type="first">A</forename><surname>Salgado</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Costa</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><surname>Tasovac</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Lexicography: Journal of ASIALEX</title>
		<idno type="ISSN">2197-4306</idno>
		<imprint>
			<date type="published" when="2019">2019</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b7">
	<analytic>
		<title level="a" type="main">TEI Lex-0 In Action: Improving the Encoding of the Dictionary of the Academia das Ciências de Lisboa</title>
		<author>
			<persName><forename type="first">A</forename><surname>Salgado</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Costa</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><surname>Tasovac</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Alberto</forename><surname>Simões</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Electronic lexicography in the 21st century. Proceedings of the eLex 2019 conference</title>
				<editor>
			<persName><forename type="first">I</forename><surname>Kosem</surname></persName>
		</editor>
		<meeting><address><addrLine>Sintra, Portugal; Brno</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2019-10">1-3 October 2019</date>
			<biblScope unit="page" from="417" to="433" />
		</imprint>
	</monogr>
	<note>Lexical Computing CZ</note>
</biblStruct>

				</listBibl>
			</div>
		</back>
	</text>
</TEI>
