<?xml version="1.0" encoding="UTF-8"?>
<TEI xml:space="preserve" xmlns="http://www.tei-c.org/ns/1.0" 
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" 
xsi:schemaLocation="http://www.tei-c.org/ns/1.0 https://raw.githubusercontent.com/kermitt2/grobid/master/grobid-home/schemas/xsd/Grobid.xsd"
 xmlns:xlink="http://www.w3.org/1999/xlink">
	<teiHeader xml:lang="en">
		<fileDesc>
			<titleStmt>
				<title level="a" type="main">Knowledge Graphs for Digital Transformation Monitoring in Social Media</title>
			</titleStmt>
			<publicationStmt>
				<publisher/>
				<availability status="unknown"><licence/></availability>
			</publicationStmt>
			<sourceDesc>
				<biblStruct>
					<analytic>
						<author>
							<persName><forename type="first">Vanni</forename><surname>Zavarella</surname></persName>
							<email>v.zavarella@unica.it</email>
							<affiliation key="aff0">
								<orgName type="department">Department of Mathematics and Computer Science</orgName>
								<orgName type="institution">University of Cagliari</orgName>
								<address>
									<settlement>Cagliari</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Diego</forename><forename type="middle">Reforgiato</forename><surname>Recupero</surname></persName>
							<affiliation key="aff0">
								<orgName type="department">Department of Mathematics and Computer Science</orgName>
								<orgName type="institution">University of Cagliari</orgName>
								<address>
									<settlement>Cagliari</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Sergio</forename><surname>Consoli</surname></persName>
							<email>sergio.consoli@ec.europa.eu</email>
							<affiliation key="aff1">
								<orgName type="department" key="dep1">European Commission</orgName>
								<orgName type="department" key="dep2">Joint Research Centre (DG JRC)</orgName>
								<address>
									<settlement>Ispra (</settlement>
									<region>VA)</region>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Gianni</forename><surname>Fenu</surname></persName>
							<email>gianni.fenu@unica.it</email>
							<affiliation key="aff0">
								<orgName type="department">Department of Mathematics and Computer Science</orgName>
								<orgName type="institution">University of Cagliari</orgName>
								<address>
									<settlement>Cagliari</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Simone</forename><surname>Angioni</surname></persName>
							<email>simone.angioni@unica.it</email>
							<affiliation key="aff0">
								<orgName type="department">Department of Mathematics and Computer Science</orgName>
								<orgName type="institution">University of Cagliari</orgName>
								<address>
									<settlement>Cagliari</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Davide</forename><surname>Buscaldi</surname></persName>
							<email>davide.buscaldi@lipn.univ-paris13.fr</email>
							<affiliation key="aff2">
								<orgName type="laboratory">Laboratoire d&apos;Informatique de Paris Nord</orgName>
								<orgName type="institution">Sorbonne Paris Nord University</orgName>
								<address>
									<addrLine>99 Av. Jean Baptiste Clement</addrLine>
									<postCode>93430</postCode>
									<settlement>Villetaneuse</settlement>
									<country key="FR">France</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Danilo</forename><surname>Dessí</surname></persName>
							<email>danilo.dessi@gesis.org</email>
							<affiliation key="aff3">
								<orgName type="department">Knowledge Technologies for Social Sciences Department</orgName>
								<orgName type="institution">GESIS Leibniz Institute for the Social Sciences</orgName>
								<address>
									<addrLine>Unter Sachsenhausen 6-8</addrLine>
									<settlement>Cologne</settlement>
									<country key="DE">Germany</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Francesco</forename><surname>Osborne</surname></persName>
							<email>francesco.osborne@gopen.ac.uk</email>
							<affiliation key="aff4">
								<orgName type="department">Knowledge Media Institute</orgName>
								<orgName type="institution">The Open University</orgName>
								<address>
									<settlement>Milton Keynes</settlement>
									<country key="GB">UK</country>
								</address>
							</affiliation>
							<affiliation key="aff5">
								<orgName type="department">Department of Business and Law</orgName>
								<orgName type="institution">University of Milano Bicocca</orgName>
								<address>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<title level="a" type="main">Knowledge Graphs for Digital Transformation Monitoring in Social Media</title>
					</analytic>
					<monogr>
						<idno type="ISSN">1613-0073</idno>
					</monogr>
					<idno type="MD5">53DF78952E72E43C498EFC61C4FECFED</idno>
				</biblStruct>
			</sourceDesc>
		</fileDesc>
		<encodingDesc>
			<appInfo>
				<application version="0.7.2" ident="GROBID" when="2025-04-23T18:39+0000">
					<desc>GROBID - A machine learning software for extracting information from scholarly documents</desc>
					<ref target="https://github.com/kermitt2/grobid"/>
				</application>
			</appInfo>
		</encodingDesc>
		<profileDesc>
			<textClass>
				<keywords>
					<term>Information Extraction</term>
					<term>Knowledge Graphs</term>
					<term>Social Media Analysis</term>
					<term>Named Entity Recognition</term>
					<term>Hierarchical Clustering</term>
					<term>Word Embeddings</term>
				</keywords>
			</textClass>
			<abstract>
<div xmlns="http://www.tei-c.org/ns/1.0"><p>Several techniques and workflows have emerged recently for automatically extracting knowledge graphs from documents like scientific articles and patents. However, adapting these approaches to integrate alternative text sources such as micro-blogging posts and news and to model open-domain entities and relationships commonly found in these sources is still challenging. This paper introduces an improved information extraction pipeline designed specifically for extracting a knowledge graph comprising opendomain entities from micro-blogging posts on social media platforms. Our pipeline utilizes dependency parsing and employs unsupervised classification of entity relations through hierarchical clustering over word embeddings. We present a case study involving the extraction of semantic triples from a tweet collection concerning digital transformation and show through two experimental evaluations on the same dataset that our system achieves precision rates exceeding 95% and surpasses similar pipelines by approximately 5% in terms of precision, while also generating a notably higher number of triples.</p></div>
			</abstract>
		</profileDesc>
	</teiHeader>
	<text xml:lang="en">
		<body>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="1.">Introduction</head><p>In recent years, knowledge graphs (KGs) have become increasingly recognized for their ability to organize structured data in a semantically significant way, allowing them to effectively support various AI systems <ref type="bibr" target="#b0">[1]</ref>. Large-scale KGs are usually generated through a semi-automated process, utilizing both structured and unstructured data. Some prominent examples include DBpedia <ref type="bibr" target="#b1">[2]</ref> <ref type="foot" target="#foot_0">1</ref> , Google Knowledge Graph<ref type="foot" target="#foot_1">2</ref> , BabelNet<ref type="foot" target="#foot_2">3</ref> , and YAGO <ref type="foot" target="#foot_3">4</ref> . A few proposals have been recently put forth for generating organized, interconnected, and machine-readable data frameworks of content found within text from microblogging platforms <ref type="bibr" target="#b2">[3,</ref><ref type="bibr" target="#b3">4,</ref><ref type="bibr" target="#b4">5]</ref>, using Semantic Web technologies such as ontologies and knowledge graphs <ref type="bibr" target="#b5">[6,</ref><ref type="bibr" target="#b6">7,</ref><ref type="bibr" target="#b7">8]</ref>. However, creating extensive and high-quality knowledge graphs from social media is still an open research problem. Existing solutions either depend on systems that aid social media experts in structuring their knowledge, therefore suffering from scalability problems, or rely on information extraction pipelines <ref type="bibr" target="#b8">[9,</ref><ref type="bibr" target="#b9">10,</ref><ref type="bibr" target="#b10">11]</ref>. Generating large-scale, coherent, and semantically sound representations of social media texts drawn from millions of posts has proven to be challenging, as existing methods for entity and relationship extraction typically focus on specific domains <ref type="bibr" target="#b3">[4]</ref>.</p><p>In this paper we present Triplétoile, an enhanced information extraction architecture designed to extract and merge instances of open-domain entities from social media text and to identify and generalize various relationships among these entities by using hierarchical clustering, word embeddings and dimensionality reduction techniques.</p><p>The designed architecture is scalable and introduces a novel approach for entity extraction that leverages the dependency tree of an input sentence and a list of patterns validated by experts. It incorporates a module for unifying and grounding entity instances using external resources such as DBpedia. We also provide a use case application of the proposed architecture to a set of around 100k tweets extracted from the X/Twitter platform<ref type="foot" target="#foot_4">5</ref> from 2022 and concerning the digital transformation domain and we released the resulting knowledge graph. Finally, we conducted an assessment of Triplétoile by comparing it to several alternative solutions using a benchmark dataset consisting of 500 triples and show that it outperforms them in terms of accuracy, while at the same time generating a relatively higher number of triples.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.">Related Work</head><p>Numerous scholarly articles delve into the methodologies for generating knowledge graphs across different domains and under various constraints <ref type="bibr" target="#b11">[12,</ref><ref type="bibr" target="#b6">7,</ref><ref type="bibr" target="#b12">13,</ref><ref type="bibr" target="#b13">14,</ref><ref type="bibr" target="#b14">15,</ref><ref type="bibr" target="#b15">16]</ref>. These knowledge graphs are often enhanced and refined using link prediction techniques <ref type="bibr" target="#b16">[17,</ref><ref type="bibr" target="#b17">18]</ref>. The extraction of knowledge graphs from web sources to answer questions related to social networks <ref type="bibr" target="#b2">[3]</ref>, such as Twitter or Facebook, has been widely discussed in literature <ref type="bibr" target="#b18">[19,</ref><ref type="bibr" target="#b19">20,</ref><ref type="bibr" target="#b3">4]</ref>. He et al. <ref type="bibr" target="#b4">[5]</ref> described how to build knowledge graphs for social networks by developing deep Natural Language Processing models. A number of information extraction pipelines have been proposed to create high-quality knowledge graphs within the social network analysis domain ( <ref type="bibr" target="#b8">[9,</ref><ref type="bibr" target="#b3">4,</ref><ref type="bibr" target="#b9">10,</ref><ref type="bibr" target="#b10">11]</ref>).</p><p>Haslhofer et al. <ref type="bibr" target="#b20">[21]</ref> have emphasized the importance of connected knowledge graphs and discovery, whereas Hyvönen and Rantala <ref type="bibr" target="#b21">[22]</ref> have highlighted the significance of new relationships extracted from the original dataset. In recent years there has been also an increasing research focus on ontologies and interoperable data <ref type="bibr" target="#b22">[23]</ref>. In particular, Dessì et al. <ref type="bibr" target="#b13">[14]</ref> have proposed an information extraction method that combines data from different tools using a domain ontology, enabling the creation of expansive knowledge graphs. This first approach has been a source of inspiration for further research in the field <ref type="bibr" target="#b23">[24,</ref><ref type="bibr" target="#b24">25,</ref><ref type="bibr" target="#b25">26,</ref><ref type="bibr" target="#b26">27,</ref><ref type="bibr" target="#b27">28]</ref>. Recently, approaches leveraging fine-tuning of pre-trained large language model such as GPT-3 have been proven to be effective in performing joint named entity recognition and relation extraction for complex hierarchical information <ref type="bibr" target="#b28">[29,</ref><ref type="bibr" target="#b29">30]</ref>. Some recent solutions also augment large language model by using knowledge injection methods in order to improve their performance in specific domains <ref type="bibr" target="#b30">[31]</ref>.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.">Methodology</head><p>Figure <ref type="figure" target="#fig_0">1</ref> shows the workflow of the pipeline that we propose in this paper. We describe in more detail in the following the main component processing blocks and modules.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.1.">Data Preprocessing</head><p>Prior to extracting triples, we follow a two-fold approach to tweet normalization. On the one hand, we remove tokens and token sequences encoding platform-specific metadata or denoting communicative conventions that (typically) do not carry any syntactic function in the tweet sentence, namely sentiment emoticons and smileys, reserved tokens (e.g., RT for 'retweet') and URLs. On the other hand, we keep by default other platform-specific tokens that can carry syntactic functions in some contexts, like the tokens (e.g. #digitaltransformation, #SME, @NASA). Then, we apply a number of heuristics for capturing and removing token patterns that typically disrupt the syntactic parsing of the sentence <ref type="foot" target="#foot_5">6</ref> . This results in fixing noisy parser edges induced for example by trailing hashtags sequences. The preprocessing step is carried out using the output of Spacy's English transformer pipeline en_core_web_trf-3.6.1 after customizing the default Tokenizer in order to parse tweet metadata (e.g., mentions and hashtags) <ref type="foot" target="#foot_6">7</ref> .</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.2.">Triple Extraction</head><p>In the triple extraction block, preprocessed tweets are sentence split and each sentence is fed to the Spacy pipeline. Building upon the works in <ref type="bibr" target="#b31">[32]</ref> and <ref type="bibr" target="#b32">[33]</ref>, we define a set of procedures to extract candidate nominal entities and predicative triples connecting them out of dependency parse trees.</p><p>Entity extraction module: It detects local nominal phrases with a restricted range of syntactic modifications (e.g., compound nouns and adjectives). It then connects and expands them with a. non-recursive attached prepositional phrases; b. quantity-type entities (MONEY, PERCENT, QUANTITY, CARDINAL); c. entity spans linked via pronominal anaphoras, resolved using the Spacy pipeline component coreferee <ref type="foot" target="#foot_7">8</ref> . Overall, the module ends up with a set 𝐸 = {𝑒 0 , ..., 𝑒 𝑛 } of non-unified, candidate entity phrases (e.g. #digitaltransformation and digital transformation are not mapped to the same general concept digital transformation at this stage.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Relation extraction module:</head><p>For each sentence 𝑠 𝑖 all the shortest paths of the dependency tree between each pair of entities (𝑒 𝑚 , 𝑒 𝑛 ) containing a verb and matching any of a shortlist of expert validated patterns <ref type="foot" target="#foot_8">9</ref> are selected. The target pattern set has been selected through an expert validation process over a sampling of the most frequent patterns matched in an external, opendomain text corpus. The entire updated process generates a set of verbal relations 𝑉 = 𝑣 0 , ..., 𝑣 𝑘 and a set of triples 𝑆 = 𝑠 0 , ..., 𝑠 𝑘 of the form &lt; 𝑒 𝑚 , 𝑣, 𝑒 𝑛 &gt; where 𝑣 ∈ 𝑉 and 𝑒 ∈ 𝐸.</p><p>The final goal of the pipeline is to allow to generalize from the set 𝑆 of surface form triples to the lower sized set 𝑇 = 𝑡 0 , ..., 𝑡 ℎ of triples of the form &lt; 𝜖 𝑚 , 𝑟, 𝜖 𝑛 &gt; where each 𝜖 𝑖 ∈ 𝐸 is a unified entity and 𝑟 is a label in a generalized relation vocabulary 𝑅.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.3.">Entity Refining</head><p>Entities are first cleaned up by removing leading/trailing punctuation marks as well as stopwords. Then, hashtags and @ mentions are normalized and lower-cased and "camel case" forms resolved (e.g. from #SmartCities to 'smart cities'), while we lemmatize and lowercase all other component tokens whose POS tag is neither Verb nor Proper Noun.</p><p>We leverage the linking of these normalized candidate entities to DBpedia entries via DBpedia Spotlight library 10 in order to merge them. To this purpose, we run the library over modified tweet sentences with the original subjects and objects entity spans replaced with their normalized forms, and then merge entities that get linked to the same DBpedia entries. For example, the two candidate entities 'Gartner' and '@Gartner_inc' are merged as they get linked to the DBpedia entry of the Gartner consulting firm http://dbpedia.org/resource/Gartner). This is then formalized with a relation owl:sameAs in the final knowledge graph. In case only the first condition is met, we assign a semantic 'relatedness' link between the candidate entity and the DBpedia entry, indicating that the former is not an instance of, but rather related to the latter. For example, the span '@gartner_survey' is considered only 'related' (encoded as skos:related) to the DBpedia entry for Gartner.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.4.">Relation Refining</head><p>In order to find the best predicate label 𝑟 for each relation verb 𝑣 in a triple &lt; 𝑒 𝑚 , 𝑣, 𝑒 𝑛 &gt; and to map 𝑣 to 𝑟 in the resulting triple, we first derive a word embedding representation of the verb predicates from a pre-trained model, then we compute an optimized clustering of the relation vectors, and finally use a representative instance of each cluster to map verb predicates.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Relation Embeddings:</head><p>For each single or multi-token relation predicate, we use the static, 300-dimensional word embeddings learned with GloVe <ref type="bibr" target="#b33">[34]</ref> and made available for text Span objects in the Spacy en_core_web_lg-3.6.0 pipeline 1112 .</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Dimensionality Reduction and Clustering:</head><p>We used the HDBSCAN clustering algorithm enhanced by previously applying UMAP dimension reduction technique on the word embeddings vectors <ref type="foot" target="#foot_12">13</ref> . HDBSCAN is a hierarchical version of the popular density-based DBSCAN algorithm, which is characterized by considering outliers and leaves unclustered the data points lying in low-density regions <ref type="bibr" target="#b34">[35]</ref>. Consequently, high dimensional data require more observed samples to produce the suitable level of density for HDBSCAN to work properly. However, applying UMAP to perform non-linear, manifold aware dimension reduction <ref type="bibr" target="#b35">[36]</ref> has been proven to transform the datasets down to a dimension small enough for HDBSCAN to cluster the vast majority of instances. In order to optimize the combination of UMAP and HDBSCAN, we perform a grid search over the hyper-parameters of both algorithms and evaluate the clustering using the score: 𝑆 = 𝑠𝑖𝑙ℎ𝑜𝑢𝑒𝑡𝑡𝑒 𝑋 • 𝑐𝑙𝑢𝑠𝑡𝑒𝑟𝑒𝑑 𝑋 , where 𝑠𝑖𝑙ℎ𝑜𝑢𝑒𝑡𝑡𝑒 𝑋 is the mean silhouette coefficient over all the instances of the dataset 𝑋 that were actually clustered by HDBSCAN <ref type="bibr" target="#b36">[37]</ref> and 𝑐𝑙𝑢𝑠𝑡𝑒𝑟𝑒𝑑 𝑋 is the fraction of instances of 𝑋 that were actually clustered. In practice, we optimize for the classical measure of cluster cohesion and separation while penalizing the configurations with low coverage of the dataset. We finally chose a subset of best-scoring hyper-parameter configurations and plotted their 𝑆 score over the number of output clusters they generate, so that we are able to pick a sub-optimal configuration that balances between generalization (fewer clusters) and accuracy (cluster number closer to the dataset size).</p><p>Relation Mapping: Finally, for each relation verb 𝑣 in the dataset, we replace it with the predicate label 𝑟 consisting of the lemma of the most frequent relation in the cluster of 𝑣.</p><p>Otherwise, we map it to itself if 𝑣 was an outlier.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="4.">Evaluation</head><p>We first evaluate the precision by manually assessing the truthfulness of a test set of statements. Second, we evaluate our pipeline's precision against a number of alternative tools.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Human Expert Assessment:</head><p>We randomly selected about 500 statements extracted by our pipeline and ask three domain expert evaluators to assess each statement as True or False <ref type="foot" target="#foot_13">14</ref> . Average pair-wise Cohen 𝜅 inter-rater agreement was 0.61, while Fleiss 𝜅 𝐹 agreement score over all 3 raters (ranging in [−1, +1], <ref type="bibr" target="#b37">[38]</ref>) reached 0.558 (substantial agreement). The accuracy of the majority vote assessments over the 500 triples was 0.96, indicating that the pipeline is able to extract triples with good precision.</p><p>Comparative Evaluation: Successively, we randomly sampled 500 tweets from the 100ksized original dataset and used our pipeline to extract candidate entities. We then merge this set of entities with the ones generated by the DyGIEpp Extractor <ref type="bibr" target="#b38">[39]</ref>. Finally we deploy four alternative methods to identify relationships between these entities and extract statements from the 500 tweets. Specifically, we compared with: a. OpenIE Extractor, the IE tool of the Stanford Core NLP suite <ref type="bibr" target="#b39">[40]</ref>; b. PoST Extractor, a module that searches for all verbs in a 15 token window between two candidate entities in a sentence to extract verb relations; c. Dependency-based Extractor, a module that exploits 12 hand-crafted paths <ref type="foot" target="#foot_14">15</ref> over Stanford Core NLP dependency parses to find verbs that connect DyGIEpp entities; d. Entity and Relationship Refiner, described in <ref type="bibr" target="#b32">[33]</ref>. Precision (P) of the triples extracted from a set of alternative methods from a set of 500 tweets, using a combination of Triplétoile and DyGIEpp candidate entities.</p><p>Table <ref type="table" target="#tab_0">1</ref> reports the number of extracted triples for each of these methods. In order to use these numbers as an indirect assessment of the relative recall levels of the different pipelines, we also report the expert-assessed precision on a limited random sample of 150 triples generated by each method. It can be seen how the precision of our pipeline on this smaller sample largely outperforms all the alternative methods, while also yielding the second largest number of triples, interestingly outperforming the Dependency-based Extractor method, which deploys very similar syntactic information from the sentence <ref type="foot" target="#foot_15">16</ref> . </p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="5.">Digital Transformation Monitoring Knowledge Graph</head><p>The presented prototype pipeline was deployed as part of a Digital Transformation monitoring system, targeting specifically its capacity to link and extend existing knowledge graphs generated from conventional sources (scientific papers, patents) with continuous updates from news and social media. Therefore, we have generated a knowledge graph from around 100k topicspecific tweets, sampled from 4M English language tweets from 2022 containing the hashtag #DigitalTransformation, excluding retweets <ref type="foot" target="#foot_16">17</ref> .</p><p>The generated DTSMM (Digital Transformation Social Media Monitor) knowledge graph comprises approximately 22,270 (non-reified) triples, connecting a total of 22597 nodes via 43428 edges. A number of sample triples are shown in Table <ref type="table" target="#tab_1">2</ref>.</p><p>We reified then each claim into dtsmm-ont:Statement class instances, where dtsmmont:Statement defines a specific claim extracted from a given number of tweets. Figure <ref type="figure">2</ref> shows an example of claim reification having the instance multi_page_document_classification as rdf:subject. DTSMM features a total of 18693 unique detected entities, whose 33.9% and 6.44% included hashtags and @ entity mentions, respectively, 3.34% were complex noun phrases with prepositional attachments, while around 16.6% contained quantitative modifiers of any type (currency, percent, etc.). Out of all the generated triples, a 5.98% had either the subject or object entity made by a resolved pronominal anaphora.</p><p>Around 8% of all unique entities were linked to DBpedia entries via 2,857 owl:sameAs and 3,309 skos:related predicates in order to encode entity equality and relatedness, respectively. Centre (JRC) <ref type="foot" target="#foot_18">19</ref> , whose goal is to create a tracker that monitors societal and economic activities through European countries using unconventional data <ref type="bibr" target="#b40">[41]</ref>.</p><p>Therefore, DTSMM has been made publicly accessible both through a SPARQL endpoint and a serialization file. Through the Virtuoso SPARQL endpoint https://api-vast.jrc.service.ec.europa. eu/sparql/ DTSMM can be queried using the graph name 'DTSMM_KG'<ref type="foot" target="#foot_19">20</ref> as shown in Figure <ref type="figure">3</ref>, where we retrieve all the statements in DTSMM having the target entity dtsmm:microsoft as object.</p><p>Finally, a Turtle format serialization of DTSMM has been publicly released <ref type="foot" target="#foot_20">21</ref> within the Joint Research Centre Data Catalogue <ref type="foot" target="#foot_21">22</ref> , as well as within the European Data portal <ref type="foot" target="#foot_22">23</ref> . The direct link is: https://jeodpp.jrc.ec.europa.eu/ftp/jrc-opendata/CC-COIN/se-tracker/DTSMM_KG.ttl.  </p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="6.">Conclusions</head><p>We presented an approach to specifically extract a knowledge graph comprising open-domain entities from micro-blogging posts on social media platforms. In a topic-specific test collection of Digital Transformation tweets the pipeline proved to outperform some of the state-of-the-art methods, generating mostly valid triples. Moreover, around 12% of entity mentions are linked to DBpedia entries, suggesting that the method is potentially useful for tracking relevant entities in the target social media text collection. A current limitation is that the entity and relation extraction processes are not backed by an underlying ontology specification. Therefore, on one hand, the extracted entities are not natively typed and no domain-specific classification schema for relations is available for setting up a supervised learning of relation mapping. We plan to work on an enhanced version of the pipeline that builds upon the current entity and relation spans and further classifies them into domain-specific categories, leveraging fine-tuning of contextual word embedding representations from Large Language Models <ref type="bibr" target="#b41">[42]</ref>. Simultaneously, we aim to capitalize on the resultant knowledge graph to develop knowledge plugins <ref type="bibr" target="#b42">[43]</ref>, thus augmenting the proficiency of these language models across various natural language processing tasks.</p></div><figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_0"><head>Figure 1 :</head><label>1</label><figDesc>Figure 1: Flowchart of the pipeline for generating a knowledge graph from micro-blogging text data.</figDesc><graphic coords="3,89.29,84.19,416.70,140.72" type="bitmap" /></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_1"><head>Figure 2 :Figure 3 :</head><label>23</label><figDesc>Figure 2: A shortened sample reification for a statement concerning the ontology instances multi_page_document_classification and machine_learning, with the data property dtsmm-ont:hasSupport reporting the number of tweets grounding the claim.</figDesc></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_0"><head>Table 1</head><label>1</label><figDesc></figDesc><table><row><cell>Extraction Method</cell><cell cols="2">Generated Triples Precision</cell></row><row><cell>OpenIE Extractor</cell><cell>588</cell><cell>0.52</cell></row><row><cell>PoST Extractor</cell><cell>1,015</cell><cell>0.17</cell></row><row><cell>Dependency-based Extractor</cell><cell>339</cell><cell>0.77</cell></row><row><cell>Entity and Relationship Refiner</cell><cell>348</cell><cell>0.31</cell></row><row><cell>Triplétoile</cell><cell>663</cell><cell>0.82</cell></row></table></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_1"><head>Table 2</head><label>2</label><figDesc>A sample of statements extracted by the Triplétoile pipeline.</figDesc><table><row><cell>Subject Entity</cell><cell>Relation</cell><cell>Object Entity</cell></row><row><cell>pandemic</cell><cell cols="2">accelerate digital_transformation</cell></row><row><cell>artificial_intelligence</cell><cell>impact</cell><cell>insurance_sector</cell></row><row><cell>microsoft</cell><cell>buy</cell><cell>riskiq</cell></row><row><cell>data-driven_insight</cell><cell>drive</cell><cell>decision-making</cell></row><row><cell>hootsuite</cell><cell>buy</cell><cell>ai_chatbot_firm</cell></row><row><cell>automl</cell><cell>generate</cell><cell>data-driven_insight</cell></row><row><cell>image_classification</cell><cell>use</cell><cell>transfer_learning</cell></row><row><cell cols="2">image_recognition_framework use</cell><cell>artificial_intelligence</cell></row><row><cell>hsbc_qatar</cell><cell cols="2">introduce mobile_payment</cell></row><row><cell>ford_motor_company</cell><cell>explore</cell><cell>blockchain_technology</cell></row></table></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_2"><head>Table 3</head><label>3</label><figDesc>lists the 10 most frequent DBpedia entities linked by DTSMM. The most frequent DBpediainherited types in the graph are: DBpedia:Company (441 unique entities), DBpedia:Person (118), DBpedia:Website (92), DBpedia:Software (59), DBpedia:Bank (31), DBpedia:Politician (29) and DBpedia:City (29). The primary use case of DTSMM fits within the research initiatives at the European Commission's Competence Center on Composite Indicators and Scoreboards 18 within the Joint Research</figDesc><table><row><cell>Top Linked Entities</cell></row><row><cell>Artificial_intelligence</cell></row><row><cell>Pandemic</cell></row><row><cell>Digital_transformation</cell></row><row><cell>Coronavirus_disease_2019</cell></row><row><cell>Microsoft</cell></row><row><cell>Cloud_computing</cell></row><row><cell>Google</cell></row><row><cell>Salesforce.com</cell></row><row><cell>Gartner</cell></row><row><cell>Chatbot</cell></row></table></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_3"><head>Table 3</head><label>3</label><figDesc>10 most frequent DBpedia-linked entities in the DTSMM knowledge graph.</figDesc><table /></figure>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="1" xml:id="foot_0">https://www.dbpedia.org/</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="2" xml:id="foot_1">https://developers.google.com/knowledge-graph</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="3" xml:id="foot_2">https://babelnet.org/</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="4" xml:id="foot_3">https://yago-knowledge.org/</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="5" xml:id="foot_4">https://twitter.com/</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="6" xml:id="foot_5">For example, for any sequence of size 𝑛 &gt; 1 hashtags/mentions/URL, we drop the sub-sequence with indexes [1 : 𝑛] or drop the entire sequence if preceded by a sentence closing marker like ('!', ':', '?', '. ').</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="7" xml:id="foot_6">https://github.com/explosion/spacy-models/releases/tag/en_core_web_trf-3.6.1</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="8" xml:id="foot_7">https://github.com/richardpaulhudson/coreferee</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="9" xml:id="foot_8">https://github.com/zavavan/dtm_kg/blob/master/resources/paths.txt</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="10" xml:id="foot_9">https://spacy.io/universe/project/spacy-dbpedia-spotlight</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="11" xml:id="foot_10">https://github.com/explosion/spacy-models/releases/tag/en_core_web_lg-3.6.0</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="12" xml:id="foot_11">We tested using various contextual embeddings however it turned out that these representations were not suitable for generalizing enough over relations, probably due to the context-specific information they are encoding.</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="13" xml:id="foot_12">https://umap-learn.readthedocs.io/en/latest/parameters.html</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="14" xml:id="foot_13">For example, a triple like &lt; 78%_𝑜𝑓 _#ℎ𝑒𝑎𝑙𝑡ℎ𝑐𝑎𝑟𝑒, 𝑈 𝑆𝐸, 𝐷𝑖𝑔𝑖𝑡𝑎𝑙_𝑇 𝑟𝑎𝑛𝑠𝑓 𝑜𝑟𝑚𝑎𝑡𝑖𝑜𝑛 &gt; would be marked as False if extracted from the text '78% of #healthcare organisations deploy #DigitalTransformation' as the head of the subject noun phrase of the relation is actually 'organisations'.</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="15" xml:id="foot_14">https://github.com/danilo-dessi/SKG-pipeline/blob/main/resources/path.txt</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="16" xml:id="foot_15">This may be due to the application of the processing step upstream of the triple extraction process.</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="17" xml:id="foot_16">We used the Twitter public API v2 full-archive search endpoint. Near-duplicate tweets were also removed.</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="18" xml:id="foot_17">European Commission's Competence Center on Composite Indicators and Scoreboards (COIN): https:// composite-indicators.jrc.ec.europa.eu/</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="19" xml:id="foot_18">The Joint Research Centre (JRC) of the European Commission (EC): https://ec.europa.eu/info/departments/ joint-research-centre_en</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="20" xml:id="foot_19">Currently the access is password protected, with credentials available upon request to authors.</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="21" xml:id="foot_20">Under Creative Commons Attribution 4.0 International (CC BY 4.0)</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="22" xml:id="foot_21">https://data.jrc.ec.europa.eu/dataset/f7be47f7-49a2-44e8-9dc8-043735af4139</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="23" xml:id="foot_22">https://data.europa.eu/88u/dataset/f7be47f7-49a2-44e8-9dc8-043735af4139</note>
		</body>
		<back>

			<div type="acknowledgement">
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Acknowledgements</head><p>We acknowledge financial support under the National Recovery and Resilience Plan (NRRP), Mission 4 Component 2 Investment 1.5 -Call for tender No.3277 published on December 30, 2021 by the Italian Ministry of University and Research (MUR) funded by the European Union -NextGenerationEU. Project Code ECS0000038 -Project Title eINS Ecosystem of Innovation for Next Generation Sardinia -CUP F53C22000430001-Grant Assignment Decree No. 1056 adopted on June 23, 2022 by the Italian Ministry of University and Research (MUR).</p></div>
			</div>

			<div type="references">

				<listBibl>

<biblStruct xml:id="b0">
	<analytic>
		<title level="a" type="main">Knowledge graphs: opportunities and challenges</title>
		<author>
			<persName><forename type="first">C</forename><surname>Peng</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Xia</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Naseriparsa</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Osborne</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Artificial Intelligence Review</title>
		<imprint>
			<biblScope unit="page" from="1" to="32" />
			<date type="published" when="2023">2023</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b1">
	<analytic>
		<title level="a" type="main">DBpedia-A large-scale, multilingual knowledge base extracted from Wikipedia</title>
		<author>
			<persName><forename type="first">J</forename><surname>Lehmann</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Isele</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Jakob</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Jentzsch</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Kontokostas</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><forename type="middle">N</forename><surname>Mendes</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Hellmann</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Morsey</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Van Kleef</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Auer</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Bizer</surname></persName>
		</author>
		<idno type="DOI">10.3233/SW-140134</idno>
	</analytic>
	<monogr>
		<title level="j">Semantic Web</title>
		<imprint>
			<biblScope unit="volume">6</biblScope>
			<biblScope unit="page" from="167" to="195" />
			<date type="published" when="2015">2015</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b2">
	<analytic>
		<title level="a" type="main">RDF approach on social network analysis</title>
		<author>
			<persName><forename type="first">P</forename><forename type="middle">S</forename><surname>Raji</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Surendran</surname></persName>
		</author>
		<idno type="DOI">10.1109/RAINS.2016.7764416</idno>
	</analytic>
	<monogr>
		<title level="m">2016 International Conference on Research Advances in Integrated Navigation Systems (RAINS)</title>
				<imprint>
			<date type="published" when="2016">2016</date>
			<biblScope unit="page" from="1" to="4" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b3">
	<analytic>
		<title level="a" type="main">From social networks to knowledge graphs: A plea for interdisciplinary approaches</title>
		<author>
			<persName><forename type="first">J</forename><surname>Dörpinghaus</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Klante</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Christian</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Meigen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Düing</surname></persName>
		</author>
		<idno type="DOI">10.1016/j.ssaho.2022.100337</idno>
	</analytic>
	<monogr>
		<title level="j">Social Sciences &amp; Humanities Open</title>
		<imprint>
			<biblScope unit="volume">6</biblScope>
			<biblScope unit="page">100337</biblScope>
			<date type="published" when="2022">2022</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b4">
	<analytic>
		<title level="a" type="main">Constructing knowledge graph for social networks in a deep and holistic way</title>
		<author>
			<persName><forename type="first">Q</forename><surname>He</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Yang</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Shi</surname></persName>
		</author>
		<idno type="DOI">10.1145/3366424.3383112</idno>
	</analytic>
	<monogr>
		<title level="m">Companion Proceedings of the Web Conference 2020</title>
				<meeting><address><addrLine>New York, NY, USA</addrLine></address></meeting>
		<imprint>
			<publisher>Association for Computing Machinery</publisher>
			<date type="published" when="2020">2020</date>
			<biblScope unit="page" from="307" to="308" />
		</imprint>
	</monogr>
	<note>WWW &apos;20</note>
</biblStruct>

<biblStruct xml:id="b5">
	<analytic>
		<title level="a" type="main">Ontology-based data access: A survey</title>
		<author>
			<persName><forename type="first">G</forename><surname>Xiao</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Calvanese</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Kontchakov</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Lembo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Poggi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Rosati</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Zakharyaschev</surname></persName>
		</author>
		<idno type="DOI">10.24963/ijcai.2018/777</idno>
	</analytic>
	<monogr>
		<title level="m">IJCAI International Joint Conference on Artificial Intelligence</title>
				<imprint>
			<date type="published" when="2018-07">2018-July, 2018</date>
			<biblScope unit="page" from="5511" to="5519" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b6">
	<analytic>
		<title level="a" type="main">The Semantic Web: Two decades on</title>
		<author>
			<persName><forename type="first">A</forename><surname>Hogan</surname></persName>
		</author>
		<idno type="DOI">10.3233/SW-190387</idno>
	</analytic>
	<monogr>
		<title level="j">Semantic Web</title>
		<imprint>
			<biblScope unit="volume">11</biblScope>
			<biblScope unit="page" from="169" to="185" />
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b7">
	<analytic>
		<title level="a" type="main">Towards a definition of knowledge graphs</title>
		<author>
			<persName><forename type="first">L</forename><surname>Ehrlinger</surname></persName>
		</author>
		<author>
			<persName><forename type="first">W</forename><surname>Wöß</surname></persName>
		</author>
		<ptr target="https://ceur-ws.org/Vol-1695/paper4.pdf" />
	</analytic>
	<monogr>
		<title level="m">Joint Proceedings of the Posters and Demos Track of the 12th International Conference on Semantic Systems -SEMANTiCS2016 and the 1st International Workshop on Semantic Change &amp; Evolving Semantics (SuCCESS&apos;16) co-located with the 12th International Conference on Semantic Systems (SEMANTiCS 2016)</title>
		<title level="s">CEUR Workshop Proceedings</title>
		<editor>
			<persName><forename type="first">M</forename><surname>Martin</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">M</forename><surname>Cuquet</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">E</forename><surname>Folmer</surname></persName>
		</editor>
		<meeting><address><addrLine>Leipzig, Germany</addrLine></address></meeting>
		<imprint>
			<date type="published" when="1695">September 12-15, 2016. 1695. 2016</date>
			<biblScope unit="page" from="1" to="4" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b8">
	<analytic>
		<title level="a" type="main">Sara -A Semi-Automatic Framework for Social Network Analysis</title>
		<author>
			<persName><forename type="first">C</forename><surname>Barbosa</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Félix</surname></persName>
		</author>
		<author>
			<persName><forename type="first">V</forename><surname>Vieira</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Xavier</surname></persName>
		</author>
		<idno type="DOI">10.5753/webmedia_estendido.2019.8137</idno>
	</analytic>
	<monogr>
		<title level="m">Anais Estendidos do XXV Simpósio Brasileiro de Sistemas Multimídia e Web</title>
				<meeting><address><addrLine>Porto Alegre, RS, Brasil</addrLine></address></meeting>
		<imprint>
			<publisher>SBC</publisher>
			<date type="published" when="2019">2019</date>
			<biblScope unit="page" from="59" to="62" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b9">
	<analytic>
		<title level="a" type="main">Semantic Web Machine Reading with FRED</title>
		<author>
			<persName><forename type="first">H</forename><surname>Alani</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Gangemi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">V</forename><surname>Presutti</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Reforgiato Recupero</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">G</forename><surname>Nuzzolese</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Draicchio</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Mongiovì</surname></persName>
		</author>
		<idno type="DOI">10.3233/SW-160240</idno>
	</analytic>
	<monogr>
		<title level="j">Semantic Web</title>
		<imprint>
			<biblScope unit="volume">8</biblScope>
			<biblScope unit="page" from="873" to="893" />
			<date type="published" when="2017">2017</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b10">
	<analytic>
		<title level="a" type="main">OpenIE-based approach for Knowledge Graph construction from text</title>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">L</forename><surname>Martinez-Rodriguez</surname></persName>
		</author>
		<author>
			<persName><forename type="first">I</forename><surname>Lopez-Arevalo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">B</forename><surname>Rios-Alvarado</surname></persName>
		</author>
		<idno type="DOI">10.1016/j.eswa.2018.07.017</idno>
	</analytic>
	<monogr>
		<title level="j">Expert Systems with Applications</title>
		<imprint>
			<biblScope unit="volume">113</biblScope>
			<biblScope unit="page" from="339" to="355" />
			<date type="published" when="2018">2018</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b11">
	<analytic>
		<title level="a" type="main">Semantic web in data mining and knowledge discovery: A comprehensive survey</title>
		<author>
			<persName><forename type="first">P</forename><surname>Ristoski</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Paulheim</surname></persName>
		</author>
		<idno type="DOI">10.1016/j.websem.2016.01.001</idno>
	</analytic>
	<monogr>
		<title level="j">Journal of Web Semantics</title>
		<imprint>
			<biblScope unit="volume">36</biblScope>
			<biblScope unit="page" from="1" to="22" />
			<date type="published" when="2016">2016</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b12">
	<analytic>
		<title level="a" type="main">Ontology engineering: Current state, challenges, and future directions</title>
		<author>
			<persName><forename type="first">T</forename><surname>Tudorache</surname></persName>
		</author>
		<idno type="DOI">10.3233/SW-190382</idno>
	</analytic>
	<monogr>
		<title level="j">Semantic Web</title>
		<imprint>
			<biblScope unit="volume">11</biblScope>
			<biblScope unit="page" from="125" to="138" />
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b13">
	<analytic>
		<title level="a" type="main">Generating knowledge graphs by employing natural language processing and machine learning techniques within the scholarly domain</title>
		<author>
			<persName><forename type="first">D</forename><surname>Dessì</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Osborne</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Reforgiato Recupero</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Buscaldi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Motta</surname></persName>
		</author>
		<idno type="DOI">10.1016/j.future.2020.10.026</idno>
	</analytic>
	<monogr>
		<title level="j">Future Generation Computer Systems</title>
		<imprint>
			<biblScope unit="volume">116</biblScope>
			<biblScope unit="page" from="253" to="264" />
			<date type="published" when="2021">2021</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b14">
	<analytic>
		<title level="a" type="main">AI-KG: An Automatically Generated Knowledge Graph of Artificial Intelligence</title>
		<author>
			<persName><forename type="first">D</forename><surname>Dessì</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Osborne</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Reforgiato Recupero</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Buscaldi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Motta</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Sack</surname></persName>
		</author>
		<idno type="DOI">10.1007/978-3-030-62466-8_9</idno>
	</analytic>
	<monogr>
		<title level="j">Lecture Notes in Computer Science</title>
		<imprint>
			<biblScope unit="volume">12507</biblScope>
			<biblScope unit="page" from="127" to="143" />
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b15">
	<analytic>
		<title level="a" type="main">Aida: A knowledge graph about research dynamics in academia and industry</title>
		<author>
			<persName><forename type="first">S</forename><surname>Angioni</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Salatino</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Osborne</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><forename type="middle">R</forename><surname>Recupero</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Motta</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Quantitative Science Studies</title>
		<imprint>
			<biblScope unit="volume">2</biblScope>
			<biblScope unit="page" from="1356" to="1398" />
			<date type="published" when="2021">2021</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b16">
	<analytic>
		<title level="a" type="main">Link prediction techniques, applications, and performance: A survey</title>
		<author>
			<persName><forename type="first">A</forename><surname>Kumar</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><forename type="middle">S</forename><surname>Singh</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><surname>Singh</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Biswas</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Physica A: Statistical Mechanics and its Applications</title>
		<imprint>
			<biblScope unit="volume">553</biblScope>
			<biblScope unit="page">124289</biblScope>
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b17">
	<analytic>
		<title level="a" type="main">Trans4e: Link prediction on scholarly knowledge graphs</title>
		<author>
			<persName><forename type="first">M</forename><surname>Nayyeri</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><forename type="middle">M</forename><surname>Cil</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Vahdati</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Osborne</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Rahman</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Angioni</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Salatino</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><forename type="middle">R</forename><surname>Recupero</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Vassilyeva</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Motta</surname></persName>
		</author>
		<idno type="DOI">10.1016/j.neucom.2021.02.100</idno>
	</analytic>
	<monogr>
		<title level="j">Neurocomputing</title>
		<imprint>
			<biblScope unit="volume">461</biblScope>
			<biblScope unit="page" from="530" to="542" />
			<date type="published" when="2021">2021</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b18">
	<analytic>
		<title level="a" type="main">Synthesizing knowledge graphs from web sources with the minte+ framework</title>
		<author>
			<persName><forename type="first">D</forename><surname>Collarana</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Galkin</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Lange</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Scerri</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Auer</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M.-E</forename><surname>Vidal</surname></persName>
		</author>
		<idno type="DOI">10.1007/978-3-030-00668-6_22</idno>
	</analytic>
	<monogr>
		<title level="j">Lecture Notes in Computer Science</title>
		<imprint>
			<biblScope unit="volume">11137</biblScope>
			<biblScope unit="page" from="359" to="375" />
			<date type="published" when="2018">2018</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b19">
	<analytic>
		<title level="a" type="main">Constructing and mining web-scale knowledge graphs</title>
		<author>
			<persName><forename type="first">E</forename><surname>Gabrilovich</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Usunier</surname></persName>
		</author>
		<idno type="DOI">10.1145/2911451.2914807</idno>
	</analytic>
	<monogr>
		<title level="m">SIGIR 2016 -Proceedings of the 39th International ACM SIGIR Conference on Research and Development in Information Retrieval</title>
				<imprint>
			<date type="published" when="2016">2016</date>
			<biblScope unit="page" from="1195" to="1197" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b20">
	<monogr>
		<title level="m" type="main">Knowledge graphs in the libraries and digital humanities domain</title>
		<author>
			<persName><forename type="first">B</forename><surname>Haslhofer</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Isaac</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Simon</surname></persName>
		</author>
		<idno type="DOI">10.1007/978-3-319-63962-8_291-1</idno>
		<imprint>
			<date type="published" when="2018">2018</date>
			<publisher>Springer International Publishing</publisher>
			<biblScope unit="page" from="1" to="8" />
			<pubPlace>Cham</pubPlace>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b21">
	<analytic>
		<title level="a" type="main">Knowledge-based relation discovery in cultural heritage knowledge graphs</title>
		<author>
			<persName><forename type="first">E</forename><surname>Hyvönen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Rantala</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">CEUR Workshop Proceedings</title>
				<imprint>
			<date type="published" when="2019">2019</date>
			<biblScope unit="volume">2364</biblScope>
			<biblScope unit="page" from="230" to="239" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b22">
	<analytic>
		<title level="a" type="main">Towards the representation of claims in ontologies for the digital humanities</title>
		<author>
			<persName><forename type="first">S</forename><surname>Cristofaro</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><forename type="middle">M</forename><surname>Sanfilippo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Sichera</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Spampinato</surname></persName>
		</author>
		<ptr target="https://ceur-ws.org/Vol-2949/paper6.pdf" />
	</analytic>
	<monogr>
		<title level="m">CEUR Workshop Proceedings</title>
				<imprint>
			<date type="published" when="2021">2021</date>
			<biblScope unit="volume">2949</biblScope>
			<biblScope unit="page" from="1" to="12" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b23">
	<analytic>
		<title level="a" type="main">A patent recommendation method based on kg representation learning</title>
		<author>
			<persName><forename type="first">Y</forename><surname>Xiao</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Li</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Thürer</surname></persName>
		</author>
		<idno type="DOI">10.1016/j.engappai.2023.106722</idno>
	</analytic>
	<monogr>
		<title level="j">Engineering Applications of Artificial Intelligence</title>
		<imprint>
			<biblScope unit="volume">126</biblScope>
			<date type="published" when="2023">2023</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b24">
	<analytic>
		<title level="a" type="main">Synthesis of multilevel knowledge graphs: Methods and technologies for dynamic networks</title>
		<author>
			<persName><forename type="first">T</forename><surname>Man</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Vodyaho</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Ignatov</surname></persName>
		</author>
		<author>
			<persName><forename type="first">I</forename><surname>Kulikov</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Zhukova</surname></persName>
		</author>
		<idno type="DOI">10.1016/j.engappai.2023.106244</idno>
	</analytic>
	<monogr>
		<title level="j">Engineering Applications of Artificial Intelligence</title>
		<imprint>
			<biblScope unit="volume">123</biblScope>
			<date type="published" when="2023">2023</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b25">
	<analytic>
		<title level="a" type="main">Web of conferences: A conference knowledge graph</title>
		<author>
			<persName><forename type="first">S</forename><surname>Yu</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Peng</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Xu</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Zhang</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Xia</surname></persName>
		</author>
		<idno type="DOI">10.1145/3539597.3573024</idno>
	</analytic>
	<monogr>
		<title level="m">WSDM 2023 -Proceedings of the 16th ACM International Conference on Web Search and Data Mining</title>
				<imprint>
			<date type="published" when="2023">2023</date>
			<biblScope unit="page" from="1172" to="1175" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b26">
	<analytic>
		<title level="a" type="main">Defining a knowledge graph development process through a systematic review</title>
		<author>
			<persName><forename type="first">G</forename><surname>Tamašauskaite</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Groth</surname></persName>
		</author>
		<idno type="DOI">10.1145/3522586</idno>
	</analytic>
	<monogr>
		<title level="j">ACM Transactions on Software Engineering and Methodology</title>
		<imprint>
			<biblScope unit="volume">32</biblScope>
			<date type="published" when="2023">2023</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b27">
	<analytic>
		<title level="a" type="main">Data-driven methodology for knowledge graph generation within the tourism domain</title>
		<author>
			<persName><forename type="first">A</forename><surname>Chessa</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Fenu</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Motta</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Osborne</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Reforgiato Recupero</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Salatino</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Secchi</surname></persName>
		</author>
		<idno type="DOI">10.1109/ACCESS.2023.3292153</idno>
	</analytic>
	<monogr>
		<title level="j">IEEE Access</title>
		<imprint>
			<biblScope unit="volume">11</biblScope>
			<biblScope unit="page" from="67567" to="67599" />
			<date type="published" when="2023">2023</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b28">
	<monogr>
		<author>
			<persName><forename type="first">A</forename><surname>Dunn</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Dagdelen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Walker</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Lee</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">S</forename><surname>Rosen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Ceder</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><surname>Persson</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Jain</surname></persName>
		</author>
		<idno type="arXiv">arXiv:2212.05238</idno>
		<title level="m">Structured information extraction from complex scientific text with fine-tuned large language models</title>
				<imprint>
			<date type="published" when="2022">2022</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b29">
	<analytic>
		<title level="a" type="main">Exploring incontext learning capabilities of foundation models for generating knowledge graphs from text</title>
		<author>
			<persName><forename type="first">H</forename><surname>Khorashadizadeh</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Mihindukulasooriya</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Tiwari</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Groppe</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Groppe</surname></persName>
		</author>
		<ptr target="http://dblp.org/aredistributedunderaCreativeCom-monsCC01.0UniversalPublicDomainDedication" />
	</analytic>
	<monogr>
		<title level="m">TEXT2KG/BiKE@ESWC</title>
				<imprint>
			<date type="published" when="2023">2023</date>
			<biblScope unit="page" from="132" to="153" />
		</imprint>
	</monogr>
	<note>DBLP License: DBLP&apos;s bibliographic metadata records provided through. Although the bibliographic metadata records are provided consistent with CC0 1.0 Dedication, the content described by the metadata records is not. Content may be subject to copyright, rights of privacy, rights of publicity and other restrictions</note>
</biblStruct>

<biblStruct xml:id="b30">
	<analytic>
		<title level="a" type="main">A comparative analysis of knowledge injection strategies for large language models in the scholarly domain</title>
		<author>
			<persName><forename type="first">A</forename><surname>Cadeddu</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Chessa</surname></persName>
		</author>
		<author>
			<persName><forename type="first">V</forename><forename type="middle">De</forename><surname>Leo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Fenu</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Motta</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Osborne</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><forename type="middle">R</forename><surname>Recupero</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Salatino</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Secchi</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Engineering Applications of Artificial Intelligence</title>
		<imprint>
			<biblScope unit="volume">133</biblScope>
			<biblScope unit="page">108166</biblScope>
			<date type="published" when="2024">2024</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b31">
	<analytic>
		<title level="a" type="main">A large-scale knowledge graph of research entities and claims in computer science</title>
		<author>
			<persName><forename type="first">D</forename><surname>Dessì</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Osborne</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><forename type="middle">R</forename><surname>Recupero</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Buscaldi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Motta</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Cs-Kg</forename></persName>
		</author>
		<idno type="DOI">10.1007/978-3-031-19433-7_39</idno>
	</analytic>
	<monogr>
		<title level="m">The Semantic Web -ISWC 2022 -21st International Semantic Web Conference, Virtual Event</title>
		<title level="s">Lecture Notes in Computer Science</title>
		<editor>
			<persName><forename type="first">U</forename><surname>Sattler</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">A</forename><surname>Hogan</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">C</forename><forename type="middle">M</forename><surname>Keet</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">V</forename><surname>Presutti</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">J</forename><forename type="middle">P A</forename><surname>Almeida</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">H</forename><surname>Takeda</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">P</forename><surname>Monnin</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">G</forename><surname>Pirrò</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">C</forename><surname>Amato</surname></persName>
		</editor>
		<imprint>
			<publisher>Springer</publisher>
			<date type="published" when="2022">October 23-27, 2022. 2022</date>
			<biblScope unit="volume">13489</biblScope>
			<biblScope unit="page" from="678" to="696" />
		</imprint>
	</monogr>
	<note>Proceedings</note>
</biblStruct>

<biblStruct xml:id="b32">
	<analytic>
		<title level="a" type="main">SCICERO: A deep learning and NLP approach for generating scientific knowledge graphs in the computer science domain</title>
		<author>
			<persName><forename type="first">D</forename><surname>Dessì</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Osborne</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><forename type="middle">R</forename><surname>Recupero</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Buscaldi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Motta</surname></persName>
		</author>
		<idno type="DOI">10.1016/j.knosys.2022.109945</idno>
	</analytic>
	<monogr>
		<title level="j">Knowledge-Based Systems</title>
		<imprint>
			<biblScope unit="volume">258</biblScope>
			<biblScope unit="page">109945</biblScope>
			<date type="published" when="2022">2022</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b33">
	<analytic>
		<title level="a" type="main">Glove: Global vectors for word representation</title>
		<author>
			<persName><forename type="first">J</forename><surname>Pennington</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Socher</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><forename type="middle">D</forename><surname>Manning</surname></persName>
		</author>
		<ptr target="http://www.aclweb.org/anthology/D14-1162" />
	</analytic>
	<monogr>
		<title level="m">Empirical Methods in Natural Language Processing (EMNLP)</title>
				<imprint>
			<date type="published" when="2014">2014</date>
			<biblScope unit="page" from="1532" to="1543" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b34">
	<analytic>
		<title level="a" type="main">A hybrid approach to hierarchical density-based cluster selection</title>
		<author>
			<persName><forename type="first">C</forename><surname>Malzer</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Baum</surname></persName>
		</author>
		<idno type="DOI">10.1109/MFI49285.2020.9235263</idno>
	</analytic>
	<monogr>
		<title level="m">IEEE International Conference on Multisensor Fusion and Integration for Intelligent Systems</title>
				<imprint>
			<date type="published" when="2020-09">2020-September, 2020</date>
			<biblScope unit="page" from="223" to="228" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b35">
	<monogr>
		<author>
			<persName><forename type="first">L</forename><surname>Mcinnes</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Healy</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Melville</surname></persName>
		</author>
		<idno type="arXiv">arXiv:1802.03426</idno>
		<title level="m">Umap: Uniform manifold approximation and projection for dimension reduction</title>
				<imprint>
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b36">
	<analytic>
		<title level="a" type="main">Clustering with the Average Silhouette Width</title>
		<author>
			<persName><forename type="first">F</forename><surname>Batool</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Hennig</surname></persName>
		</author>
		<idno type="DOI">10.1016/j.csda.2021.107190</idno>
	</analytic>
	<monogr>
		<title level="j">Computational Statistics and Data Analysis</title>
		<imprint>
			<biblScope unit="volume">158</biblScope>
			<date type="published" when="2021">2021</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b37">
	<analytic>
		<title level="a" type="main">Fleiss&apos; kappa statistic without paradoxes</title>
		<author>
			<persName><forename type="first">R</forename><surname>Falotico</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Quatto</surname></persName>
		</author>
		<idno type="DOI">10.1007/s11135-014-0003-1</idno>
	</analytic>
	<monogr>
		<title level="j">Quality and Quantity</title>
		<imprint>
			<biblScope unit="volume">49</biblScope>
			<biblScope unit="page" from="463" to="470" />
			<date type="published" when="2015">2015</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b38">
	<analytic>
		<title level="a" type="main">Entity, relation, and event extraction with contextualized span representations</title>
		<author>
			<persName><forename type="first">D</forename><surname>Wadden</surname></persName>
		</author>
		<author>
			<persName><forename type="first">U</forename><surname>Wennberg</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Y</forename><surname>Luan</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Hajishirzi</surname></persName>
		</author>
		<idno type="DOI">10.18653/v1/D19-1585</idno>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing (EMNLP-IJCNLP), Association for Computational Linguistics</title>
				<meeting>the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing (EMNLP-IJCNLP), Association for Computational Linguistics<address><addrLine>Hong Kong, China</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2019">2019</date>
			<biblScope unit="page" from="5784" to="5789" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b39">
	<analytic>
		<title level="a" type="main">Leveraging linguistic structure for open domain information extraction</title>
		<author>
			<persName><forename type="first">G</forename><surname>Angeli</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">J</forename><surname>Johnson Premkumar</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><forename type="middle">D</forename><surname>Manning</surname></persName>
		</author>
		<idno type="DOI">10.3115/v1/P15-1034</idno>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 53rd Annual Meeting of the Association for Computational Linguistics and the 7th International Joint Conference on Natural Language Processing</title>
		<title level="s">Long Papers</title>
		<meeting>the 53rd Annual Meeting of the Association for Computational Linguistics and the 7th International Joint Conference on Natural Language Processing<address><addrLine>Beijing, China</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2015">2015</date>
			<biblScope unit="volume">1</biblScope>
			<biblScope unit="page" from="344" to="354" />
		</imprint>
	</monogr>
	<note>Association for Computational Linguistics</note>
</biblStruct>

<biblStruct xml:id="b40">
	<analytic>
		<title level="a" type="main">Tracking socio-economic activities in european countries with unconventional data</title>
		<author>
			<persName><forename type="first">M</forename><surname>Colagrossi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Consoli</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Panella</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Barbaglia</surname></persName>
		</author>
		<idno type="DOI">10.1145/3524458.3547242</idno>
	</analytic>
	<monogr>
		<title level="m">ACM International Conference Proceeding Series</title>
				<imprint>
			<date type="published" when="2022">2022</date>
			<biblScope unit="page" from="323" to="330" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b41">
	<monogr>
		<author>
			<persName><forename type="first">S</forename><surname>Pan</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Luo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Y</forename><surname>Wang</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Chen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Wang</surname></persName>
		</author>
		<author>
			<persName><forename type="first">X</forename><surname>Wu</surname></persName>
		</author>
		<idno type="arXiv">arXiv:2306.08302</idno>
		<title level="m">Unifying large language models and knowledge graphs: A roadmap</title>
				<imprint>
			<date type="published" when="2023">2023</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b42">
	<analytic>
		<title level="a" type="main">Integrating conversational agents and knowledge graphs within the scholarly domain</title>
		<author>
			<persName><forename type="first">A</forename><surname>Meloni</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Angioni</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Salatino</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Osborne</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><forename type="middle">R</forename><surname>Recupero</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Motta</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">IEEE Access</title>
		<imprint>
			<biblScope unit="volume">11</biblScope>
			<biblScope unit="page" from="22468" to="22489" />
			<date type="published" when="2023">2023</date>
		</imprint>
	</monogr>
</biblStruct>

				</listBibl>
			</div>
		</back>
	</text>
</TEI>
