<?xml version="1.0" encoding="UTF-8"?>
<TEI xml:space="preserve" xmlns="http://www.tei-c.org/ns/1.0" 
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" 
xsi:schemaLocation="http://www.tei-c.org/ns/1.0 https://raw.githubusercontent.com/kermitt2/grobid/master/grobid-home/schemas/xsd/Grobid.xsd"
 xmlns:xlink="http://www.w3.org/1999/xlink">
	<teiHeader xml:lang="en">
		<fileDesc>
			<titleStmt>
				<title level="a" type="main">HYBRILIT - THE MAIN COMPONENT OF THE MICC FOR HETEROGENEOUS COMPUTATIONS AT JINR</title>
			</titleStmt>
			<publicationStmt>
				<publisher/>
				<availability status="unknown"><licence/></availability>
			</publicationStmt>
			<sourceDesc>
				<biblStruct>
					<analytic>
						<author>
							<persName><forename type="first">Gh</forename><surname>Adam</surname></persName>
							<affiliation key="aff0">
								<orgName type="laboratory">Laboratory of Information Technologies</orgName>
								<orgName type="institution">Joint Institute for Nuclear Research</orgName>
							</affiliation>
							<affiliation key="aff1">
								<orgName type="institution">Joliot-Curie</orgName>
								<address>
									<postCode>141980</postCode>
									<settlement>Dubna, Moscow region</settlement>
									<country key="RU">Russia</country>
								</address>
							</affiliation>
							<affiliation key="aff2">
								<orgName type="institution">Horia Hulubei National Institute for Physics and Nuclear Engineering (IFIN-HH)</orgName>
								<address>
									<addrLine>30, Reactorului St</addrLine>
									<postCode>077125</postCode>
									<settlement>Mǎgurele -Bucharest</settlement>
									<country key="RO">Romania</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Vladimir</forename><forename type="middle">V</forename><surname>Korenkov</surname></persName>
							<affiliation key="aff0">
								<orgName type="laboratory">Laboratory of Information Technologies</orgName>
								<orgName type="institution">Joint Institute for Nuclear Research</orgName>
							</affiliation>
							<affiliation key="aff1">
								<orgName type="institution">Joliot-Curie</orgName>
								<address>
									<postCode>141980</postCode>
									<settlement>Dubna, Moscow region</settlement>
									<country key="RU">Russia</country>
								</address>
							</affiliation>
							<affiliation key="aff3">
								<orgName type="department">Peoples&apos; Friendship</orgName>
								<orgName type="institution">University of Russia (RUDN University)</orgName>
								<address>
									<addrLine>Moscow Miklukho-Maklaya str.6</addrLine>
									<postCode>117198</postCode>
									<country key="RU">Russia</country>
								</address>
							</affiliation>
						</author>
						<author role="corresp">
							<persName><forename type="first">Dmitry</forename><forename type="middle">V</forename><surname>Podgainy</surname></persName>
							<email>podgainy@jinr.ru</email>
							<affiliation key="aff0">
								<orgName type="laboratory">Laboratory of Information Technologies</orgName>
								<orgName type="institution">Joint Institute for Nuclear Research</orgName>
							</affiliation>
							<affiliation key="aff1">
								<orgName type="institution">Joliot-Curie</orgName>
								<address>
									<postCode>141980</postCode>
									<settlement>Dubna, Moscow region</settlement>
									<country key="RU">Russia</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Oksana</forename><forename type="middle">I</forename><surname>Streltsova</surname></persName>
							<affiliation key="aff0">
								<orgName type="laboratory">Laboratory of Information Technologies</orgName>
								<orgName type="institution">Joint Institute for Nuclear Research</orgName>
							</affiliation>
							<affiliation key="aff1">
								<orgName type="institution">Joliot-Curie</orgName>
								<address>
									<postCode>141980</postCode>
									<settlement>Dubna, Moscow region</settlement>
									<country key="RU">Russia</country>
								</address>
							</affiliation>
							<affiliation key="aff3">
								<orgName type="department">Peoples&apos; Friendship</orgName>
								<orgName type="institution">University of Russia (RUDN University)</orgName>
								<address>
									<addrLine>Moscow Miklukho-Maklaya str.6</addrLine>
									<postCode>117198</postCode>
									<country key="RU">Russia</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Tatiana</forename><forename type="middle">A</forename><surname>Strizh</surname></persName>
							<affiliation key="aff0">
								<orgName type="laboratory">Laboratory of Information Technologies</orgName>
								<orgName type="institution">Joint Institute for Nuclear Research</orgName>
							</affiliation>
							<affiliation key="aff1">
								<orgName type="institution">Joliot-Curie</orgName>
								<address>
									<postCode>141980</postCode>
									<settlement>Dubna, Moscow region</settlement>
									<country key="RU">Russia</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Peter</forename><forename type="middle">V</forename><surname>Zrelov</surname></persName>
							<affiliation key="aff0">
								<orgName type="laboratory">Laboratory of Information Technologies</orgName>
								<orgName type="institution">Joint Institute for Nuclear Research</orgName>
							</affiliation>
							<affiliation key="aff1">
								<orgName type="institution">Joliot-Curie</orgName>
								<address>
									<postCode>141980</postCode>
									<settlement>Dubna, Moscow region</settlement>
									<country key="RU">Russia</country>
								</address>
							</affiliation>
						</author>
						<title level="a" type="main">HYBRILIT - THE MAIN COMPONENT OF THE MICC FOR HETEROGENEOUS COMPUTATIONS AT JINR</title>
					</analytic>
					<monogr>
						<imprint>
							<date/>
						</imprint>
					</monogr>
					<idno type="MD5">9B3172B153C3A3596DB3CA5138E3BCE4</idno>
				</biblStruct>
			</sourceDesc>
		</fileDesc>
		<encodingDesc>
			<appInfo>
				<application version="0.7.2" ident="GROBID" when="2023-03-24T03:06+0000">
					<desc>GROBID - A machine learning software for extracting information from scholarly documents</desc>
					<ref target="https://github.com/kermitt2/grobid"/>
				</application>
			</appInfo>
		</encodingDesc>
		<profileDesc>
			<textClass>
				<keywords>
					<term>high performance computing</term>
					<term>heterogeneous cluster</term>
					<term>hybrid architectures</term>
					<term>HPC software and information environment</term>
					<term>parallel programming technologies</term>
					<term>computational science</term>
				</keywords>
			</textClass>
			<abstract>
<div xmlns="http://www.tei-c.org/ns/1.0"><p>The article includes the principles and approaches for the development of IT-ecosystem on the basis of the heterogeneous computing cluster HybriLIT, that satisfies the requirements of users in solution of scientific and engineering tasks that are covered by the research program of JINR. The development of IT-ecosystem requires development of new services, new computational architectures and also adaptation of the software. It is also important to train IT-specialists to learn modern methods and tools for solution of specific tasks.</p></div>
			</abstract>
		</profileDesc>
	</teiHeader>
	<text xml:lang="en">
		<body>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="1.">IT-ecosystem for HPC</head><p>The decision to extend the JINR MICC [1] by adding a heterogeneous computing cluster devoted to high performance computing (HPC) in JINR and the JINR Member States follows the modern trends in worldwide computing technologies. Implementation of a heterogeneous cluster HybriLIT <ref type="bibr" target="#b3">[2]</ref> that includes nodes with CPU and GPU architectures into MICC JINR infrastructure allows following the two main directions of computation acceleration development. It provides users of the cluster with possibilities to use available HPC means. The analysis of the needs for high performance computing in JINR resulted in the definition of three basic tasks to be solved by the heterogeneous HPC cluster: design and implementation of parallel software for computing-intensive research; porting to the cluster open software packages and numerical libraries which are already tuned for hybrid architectures; development of new mathematical methods and parallel algorithms adapted to heterogeneous architectures. For the purposes of efficient use of the computational architectures developed in the leading companies in the field of HPC - Intel and NVIDIA - and to satisfy the requirements of users in the solution of the tasks mentioned above, there appeared a need to create an IT-ecosystem.</p><p>This IT-ecosystem is supposed to provide access to the information space that includes services for organization of an efficient work for JINR employees, software and hardware environment for solution of various tasks, management and processing of data of various volume and structure, training and organization of scientific and research processes.</p><p>To support development of the IT-ecosystem, it is necessary to develop information and communication support based on modern network solutions that provide higher capacity and network operational reliability.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Figure 1. IT-ecosystem for HPC</head><p>The developed IT-ecosystem (see Fig. <ref type="figure">1</ref>) unites hardware and information-software environments that include modern computation architectures, applied software, information services, services for work with applied software packages with various GUI, means for debugging and profiling parallel applications and means for computation visualization. One of the most important aspects here is training of IT-specialists to learn modern methods and tools for solution of problems connected with the use of HPC in the field of theoretical, experimental and applied tasks <ref type="bibr" target="#b4">[3]</ref>.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.">HybriLIT current status</head><p>At present, HybriLIT consists of ten computational nodes including four nodes with graphics processors NVIDIA Tesla K80 and four nodes with graphics processors NVIDIA Tesla K40, one node with Intel Xeon Phi 7120P coprocessor and a node with NVIDIA Tesla K20x and Intel Xeon Phi 5110P coprocessor. Each computational node includes two Intel Xeon E5-2695v2 processors (12-core). In total, the cluster consists of 252 CPU-cores, 77184 GPU-cores, 182 PHI-cores; 2.4 TB RAM; 57.6 TB HDD. The peak performance with single precision is 142 TFlops and with double precision is 50 TFlops. The cluster is meant for carrying out massive parallel computations using modern computing architectures such as GPUs (Nvidia Tesla K40, K80) and Intel Xeon Phi coprocessors/processors.</p><p>For the purposes of efficiency increase of application development and carrying out computation by means of the resources of the HybriLIT cluster, the heterogeneous computation team develops and supports an information-software environment that can be divided into two levels. The first level is considered to be the system one and it includes basic software:</p><p>• OS Scientific Linux 7.4</p><p>The second level includes a set of services by means of which users can arrange their work more efficiently and have access to required and useful information while working on the cluster. Among services provided for users there are those, which contain necessary information about the cluster, and about upcoming events that will be held by the HybriLIT team. Such services include:</p><p>• HybriLIT web-page: it contains detailed information about the resources provided for users of the cluster. Particular emphasis is put on hardware that contains cluster's specifications, and software installed on the cluster. It should be noted that registration procedure is very important. 
Therefore, a detailed description of registration is provided at the web-page. Moreover, users can have a look at the instruction for running tasks. This instruction includes basic information about the cluster.</p><p>• Indico system: it is used by the HybriLIT team in order to organize conferences, seminars and meetings dedicated to parallel programming technologies. The system allows creating different events that will take place in the Institute. The created event provides basic information about the event itself, time and place. There is also a possibility to upload all the materials of lectures so that every user can download them. Among services that include detailed information about the cluster and the possibilities it provides, there are also the services aimed at close interaction between users and the HybriLIT team. Such services include:</p><p>• HybriLIT User Support: it is a project developed in the Project Management Service system [6] that allows answering the questions of users, uploading useful materials, publishing news, etc. This project is developed for a more efficient interaction between users and the HybriLIT team.</p><p>This system provides possibilities for information distribution about the upcoming events and the current state of the cluster. Users can also create tasks on upgrade and debugging. Thus, interaction between users of the cluster and the developers is carried out quickly and efficiently.</p><p>• GitLab: it is a service aimed at mutual parallel development of applications. This is a version control system and it allows following the changes in the code of projects. The system functionality is wide and includes such possibilities as separation of access among users, task management system, wiki, code review, etc. The HybriLIT team has developed several projects within this system. 
One of the main projects, «Parallel features» [7], was created within the GitLab framework with a threefold purpose:</p><p>- to carry out co-development of software packages and programs by independent user groups; - to provide more effective consultancy to the cluster users and to people foreseeing future development and implementation of parallel programs for calculations on multicore systems (based on MPI, OpenMP, OpenCL) and coprocessors (CUDA for graphics processing units (GPU) NVIDIA, OpenMP for Intel Xeon Phi coprocessors); - to develop parallel applications and methodical examples on their base. The report discusses an instance of parallel computations using the scheduling system SLURM on sequential tasks that require massive calculations for different values of input parameters. The need for such an algorithm arose from the investigation of the Josephson junctions in high temperature superconductors subject to external radiation <ref type="bibr">[4]</ref>. The project already solved the problem to get optimization keys for different compilers installed on the HybriLIT cluster.</p><p>The project «Parallel features» can serve as a pattern toward the systematic development of parallel applications implemented on different computing platforms containing GPU NVIDIA and Intel Xeon Phi coprocessors. It may also be used for the development of more efficient applications by the cluster users from various JINR laboratories, by students and by participants of training courses conducted on the heterogeneous cluster HybriLIT. With regard to the fact that users of the cluster are scientists and specialists from different countries, bilingual support of all resources (Russian and English) is important. Fig. <ref type="figure" target="#fig_0">2</ref> shows the software and information environment of the cluster. </p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.">New services</head><p>A new service - HLIT-VDI - has been developed for shared use of applied software packages on the HybriLIT cluster using GUI (graphical user interface). By means of this service, it is now possible to work with applied software packages such as Wolfram Mathematica, Maple, Matlab, COMSOL, GEANT4, etc. via remote access to the virtual machines (VM) in the framework of the HybriLIT cluster (Fig. <ref type="figure">3</ref>). The developed service allows carrying out computations in the frames of VMs and massive computations using the resources of the cluster. HLIT-VDI is developed for solution of the following problems closely connected with the use of HPC for applied software packages.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Figure 3. Workflow of HLIT-VDI service</head><p>First of all, scientific and engineering tasks are connected with the use of floating license software packages used by the organization; thus, the developed service will be optimized for distribution of computation time among users.</p><p>Secondly, in order to solve resource-intensive tasks, there appears a need to use computation clusters including those with GPUs (in case the software packages support GPUs) for reduction of computation time. For example, geometry and/or computation grids are carried out by means of GUI (graphical user interface), and computations are carried out using HPC-platforms. The developed service will have a user-friendly interface which will make it easier to accelerate computations.</p><p>Thirdly, as soon as software packages for engineering computations require a huge amount of work with graphical data in order to provide efficient data analysis, a graphical station with NVIDIA M60 has been added.</p><p>In collaboration with Universität Kassel, in order to receive data on available resources on the cluster, characteristics of nodes, and also the status of launched tasks (for more efficient organization for carrying out computations), a mobile application --MobiLIT --has been developed.</p><p>It provides the following possibilities:</p><p>• monitoring of user's jobs;</p><p>• quick view of user's files (*.out, *.dat, *.in or *.sh);</p><p>• possibility to kill jobs directly via the app; • monitor the expected computation time;</p><p>• monitor available resources on different nodes and partitions of the cluster which are meant for using different computing architectures;</p><p>• possess full information on jobs launched on the cluster, the resources they require, etc. MobiLIT is developed using NativeScript framework. 
It is available in Google Play Store <ref type="bibr">[4]</ref> for users of smartphones and tablets under Android; for iOS users the application is available in App Store in test mode. To sign in, users need authorization data for the HybriLIT cluster.</p><p>The developed mobile application - MobiLIT - for users of HybriLIT enriches its information-software environment with a convenient and modern IT-service, which makes it simpler to carry out parallel computations and provides additional optimization while using computation resources of the cluster.</p></div><figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_0"><head>Figure 2.</head><label>2</label><figDesc>Figure 2. Software and information environment of HybriLIT</figDesc><graphic coords="4,125.17,465.17,345.00,258.75" type="bitmap" /></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0"><head></head><label></label><figDesc></figDesc><graphic coords="2,112.42,392.47,369.98,264.95" type="bitmap" /></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0"><head></head><label></label><figDesc></figDesc><graphic coords="5,73.70,209.99,447.95,134.25" type="bitmap" /></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_0"><head></head><label></label><figDesc></figDesc><table><row><cell>The following software for development, debugging and profiling of parallel applications and</cell></row><row><cell>carrying out resource-demanding computations are installed:</cell></row><row><cell>• OpenMPI 1.8.8, 2.1.2;</cell></row><row><cell>• CUDA 8.0, 9.0;</cell></row><row><cell>• GNU 4.4.7, 4.8.4, 4.9.3</cell></row><row><cell>• Intel Parallel Studio XE 2018;</cell></row><row><cell>• GEANT4, ROOT, FairSoft, MpdROOT et al.</cell></row></table><note>and Extreme Cluster Administration Tool Xcat; • NFS4 and EOS file systems; • SLURM - workload manager and task scheduler that manages tasks between the nodes of the heterogeneous cluster; • Modules enables dynamic modification (interrogation, allocation, and deallocation) of user's environment; • CernVM-FS software repository.</note></figure>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" xml:id="foot_0">Proceedings of the XXVI International Symposium on Nuclear Electronics &amp; Computing (NEC'2017), Becici, Budva, Montenegro, September 25-29, 2017</note>
		</body>
		<back>

			<div type="acknowledgement">
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="5.">Conclusion and future plans</head><p>The conception for HPC described above is aimed at solution of scientific and applied tasks that are crucial for JINR by means of implementation and development of a wide range of new IT-solutions integrated into an information-software environment of the IT-ecosystem including various technological solutions, concepts and approaches.</p><p>Development of such an IT-ecosystem allows reducing time for development of JINR's experimental projects that require carrying out theoretical and applied computations necessary on the stages of engineering of experimental facilities, works on development of computing models for experiments, solution of tasks connected with data analysis and processing, and also development of an information environment for management of all projects' components.</p><p>This IT-ecosystem is the basic platform for training of IT-specialists to be able to develop algorithmic and program solutions in the field of system and applied programming, mathematical, information and simulation models.</p><p>It is planned to develop the IT-ecosystem as a distributed HPC-platform that unites supercomputers (heterogeneous), grid- and cloud-technologies <ref type="bibr" target="#b6">[5]</ref> in order to provide optimal approaches for the solution of various scientific and applied tasks that require both massive-parallel computations, and Big Data methods and technologies which will allow using modern computation architectures much more efficiently.</p></div>
			</div>

			<div type="references">

				<listBibl>

<biblStruct xml:id="b0">
	<monogr>
		<title level="m">Proceedings of the XXVI International Symposium on Nuclear Electronics &amp; Computing</title>
				<meeting>the XXVI International Symposium on Nuclear Electronics &amp; Computing<address><addrLine>NEC</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2017">2017</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b1">
	<monogr>
		<title/>
		<author>
			<persName><surname>Becici</surname></persName>
		</author>
		<imprint>
			<date type="published" when="2017">September 25 -29, 2017</date>
			<pubPlace>Budva, Montenegro</pubPlace>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b2">
	<monogr>
		<title level="m" type="main">Acknowledgement The work was supported by the Russian Foundation for Basic Research (RFBR), grant №15-29-01217</title>
		<imprint>
			<date>0008</date>
		</imprint>
	</monogr>
	<note>the Ministry of Education and Science of the Russian Federation (the Agreement number 02.a03.21</note>
</biblStruct>

<biblStruct xml:id="b3">
	<monogr>
		<ptr target="http://hybrilit.jinr.ru" />
		<title level="m">Heterogeneous computing cluster HybriLIT</title>
				<imprint/>
	</monogr>
</biblStruct>

<biblStruct xml:id="b4">
	<analytic>
		<title level="a" type="main">Educational program on HPC technologies on the basic of the HybriLIT heterogeneous cluster</title>
		<author>
			<persName><forename type="first">V</forename><forename type="middle">V</forename><surname>Korenkov</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><forename type="middle">V</forename><surname>Podgainy</surname></persName>
		</author>
		<author>
			<persName><forename type="first">O</forename><forename type="middle">I</forename><surname>Streltsova</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">LIT JINR) // Modern Information Technology and IT-education V13</title>
				<imprint>
			<date type="published" when="2017">2017</date>
			<biblScope unit="page" from="141" to="146" />
		</imprint>
	</monogr>
	<note>in Russian</note>
</biblStruct>

<biblStruct xml:id="b5">
	<monogr>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">I</forename><surname>Streltsov</surname></persName>
		</author>
		<ptr target="https://play.google.com/store/apps/details?id=org.nativescript.mobilit" />
		<title level="m">MobiLIT@HPC in Google Play Market</title>
				<imprint/>
	</monogr>
</biblStruct>

<biblStruct xml:id="b6">
	<analytic>
		<title level="a" type="main">The development of distributed computing technologies and BigData in LIT</title>
		<author>
			<persName><forename type="first">V</forename><forename type="middle">V</forename><surname>Korenkov</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><forename type="middle">A</forename><surname>Strizh</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Gh</forename><surname>Adam</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><forename type="middle">V</forename><surname>Podgainy</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">-JINR // Proceedings of the 8-th ROLCG 2015</title>
				<imprint/>
	</monogr>
</biblStruct>

<biblStruct xml:id="b7">
	<monogr>
		<title level="m">Conference &quot;Grid, Cloud and High Performance Computing in Science</title>
				<meeting><address><addrLine>Cluj-Napoca, Romania, Editura U.T.</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2016">2016</date>
		</imprint>
	</monogr>
</biblStruct>

				</listBibl>
			</div>
		</back>
	</text>
</TEI>
