<?xml version="1.0" encoding="utf-8"?>
<raweb xmlns:xlink="http://www.w3.org/1999/xlink" xml:lang="en" year="2018">
  <identification id="datamove" isproject="true">
    <shortname>DATAMOVE</shortname>
    <projectName>Data Aware Large Scale Computing</projectName>
    <theme-de-recherche>Distributed and High Performance Computing</theme-de-recherche>
    <domaine-de-recherche>Networks, Systems and Services, Distributed Computing</domaine-de-recherche>
    <urlTeam>https://team.inria.fr/datamove/</urlTeam>
    <structure_exterieure type="Labs">
      <libelle>Laboratoire d'Informatique de Grenoble (LIG)</libelle>
    </structure_exterieure>
    <structure_exterieure type="Organism">
      <libelle>CNRS</libelle>
    </structure_exterieure>
    <structure_exterieure type="Organism">
      <libelle>Institut polytechnique de Grenoble</libelle>
    </structure_exterieure>
    <structure_exterieure type="Organism">
      <libelle>Université de Grenoble Alpes</libelle>
    </structure_exterieure>
    <header_dates_team>Creation of the Team: 2016 January 01, updated into Project-Team: 2017 November 01</header_dates_team>
    <LeTypeProjet>Project-Team</LeTypeProjet>
    <keywordsSdN>
      <term>A1.1.4. - High performance computing</term>
      <term>A1.1.5. - Exascale</term>
      <term>A2.1.10. - Domain-specific languages</term>
      <term>A2.6.2. - Middleware</term>
      <term>A7.1.2. - Parallel algorithms</term>
      <term>A8.2. - Optimization</term>
    </keywordsSdN>
    <keywordsSecteurs>
      <term>B1.1.7. - Bioinformatics</term>
      <term>B3.3.2. - Water: sea &amp; ocean, lake &amp; river</term>
      <term>B5.5. - Materials</term>
    </keywordsSecteurs>
    <UR name="Grenoble"/>
    <moreinfo>
      <p>The DataMove team is located in the IMAG building on the Campus of Univ. Grenoble Alpes.</p>
    </moreinfo>
  </identification>
  <team id="uid1">
    <person key="datamove-2018-idp115392">
      <firstname>Fanny</firstname>
      <lastname>Dufosse</lastname>
      <categoryPro>Chercheur</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, Researcher</moreinfo>
    </person>
    <person key="datamove-2018-idp117856">
      <firstname>Bruno</firstname>
      <lastname>Raffin</lastname>
      <categoryPro>Chercheur</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Team leader, Inria, Senior Researcher</moreinfo>
      <hdr>oui</hdr>
    </person>
    <person key="datamove-2018-idp120768">
      <firstname>Yves</firstname>
      <lastname>Denneulin</lastname>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Institut polytechnique de Grenoble, Professor</moreinfo>
      <hdr>oui</hdr>
    </person>
    <person key="datamove-2018-idp123648">
      <firstname>Pierre Francois</firstname>
      <lastname>Dutot</lastname>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Univ Grenoble Alpes, Associate Professor</moreinfo>
    </person>
    <person key="datamove-2018-idp126144">
      <firstname>Gregory</firstname>
      <lastname>Mounie</lastname>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Institut polytechnique de Grenoble, Associate Professor</moreinfo>
    </person>
    <person key="datamove-2018-idp128640">
      <firstname>Olivier</firstname>
      <lastname>Richard</lastname>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Univ Grenoble Alpes, Associate Professor</moreinfo>
    </person>
    <person key="datamove-2018-idp131136">
      <firstname>Denis</firstname>
      <lastname>Trystram</lastname>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Institut polytechnique de Grenoble, Professor</moreinfo>
      <hdr>oui</hdr>
    </person>
    <person key="datamove-2018-idp134016">
      <firstname>Frederic</firstname>
      <lastname>Wagner</lastname>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Institut polytechnique de Grenoble, Associate Professor</moreinfo>
    </person>
    <person key="datamove-2018-idp136512">
      <firstname>Giorgio</firstname>
      <lastname>Lucarelli</lastname>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Institut polytechnique de Grenoble, Associate Professor, until Aug 2018</moreinfo>
    </person>
    <person key="datamove-2018-idp139024">
      <firstname>Francieli</firstname>
      <lastname>Zanon Boito</lastname>
      <categoryPro>Chercheur</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, Researcher, from Nov 2018</moreinfo>
    </person>
    <person key="datamove-2018-idp141504">
      <firstname>Danilo</firstname>
      <lastname>Carastan Dos Santos</lastname>
      <categoryPro>PhD</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Universidade Federal do ABC Brazil, from May 2017</moreinfo>
    </person>
    <person key="datamove-2018-idp143968">
      <firstname>Estelle</firstname>
      <lastname>Dirand</lastname>
      <categoryPro>PhD</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>CEA, until Oct 2018</moreinfo>
    </person>
    <person key="datamove-2018-idp146400">
      <firstname>Adrien</firstname>
      <lastname>Faure</lastname>
      <categoryPro>PhD</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>ATOS/BULL, from May 2017</moreinfo>
    </person>
    <person key="datamove-2018-idp148848">
      <firstname>Mohammed</firstname>
      <lastname>Khatiri</lastname>
      <categoryPro>PhD</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Faculte des sciencesU.M.P, Morocco</moreinfo>
    </person>
    <person key="datamove-2018-idp151296">
      <firstname>Michael</firstname>
      <lastname>Mercier</lastname>
      <categoryPro>PhD</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>ATOS/Bull - Inria, until Jan 2019</moreinfo>
    </person>
    <person key="datamove-2018-idp153744">
      <firstname>Clement</firstname>
      <lastname>Mommessin</lastname>
      <categoryPro>PhD</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Institut polytechnique de Grenoble</moreinfo>
    </person>
    <person key="datamove-2018-idp156192">
      <firstname>Valentin</firstname>
      <lastname>Reis</lastname>
      <categoryPro>PhD</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Institut polytechnique de Grenoble, until Aug 2018</moreinfo>
    </person>
    <person key="datamove-2018-idp158656">
      <firstname>Salah</firstname>
      <lastname>Zrigui</lastname>
      <categoryPro>PhD</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Univ Grenoble Alpes</moreinfo>
    </person>
    <person key="datamove-2018-idp161088">
      <firstname>Tristan</firstname>
      <lastname>Ezequel</lastname>
      <categoryPro>Technique</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, until Aug 2018</moreinfo>
    </person>
    <person key="datamove-2018-idp163552">
      <firstname>Nicolas</firstname>
      <lastname>Michon</lastname>
      <categoryPro>Technique</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, until Sep 2018</moreinfo>
    </person>
    <person key="datamove-2018-idp166016">
      <firstname>Clement</firstname>
      <lastname>Labastrou</lastname>
      <categoryPro>Technique</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, from Mar 2018 until Aug 2018</moreinfo>
    </person>
    <person key="datamove-2018-idp168496">
      <firstname>Pierre</firstname>
      <lastname>Neyron</lastname>
      <categoryPro>Technique</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>CNRS</moreinfo>
    </person>
    <person key="datamove-2018-idp170960">
      <firstname>Theophile</firstname>
      <lastname>Terraz</lastname>
      <categoryPro>Technique</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria</moreinfo>
    </person>
    <person key="datamove-2018-idp173424">
      <firstname>Zulhusni</firstname>
      <lastname>Abdul Rahman</lastname>
      <categoryPro>Stagiaire</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, from Feb 2018 until Jun 2018</moreinfo>
    </person>
    <person key="datamove-2018-idp175904">
      <firstname>Sekina</firstname>
      <lastname>Belguendouz</lastname>
      <categoryPro>Stagiaire</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, from May 2018 until Jul 2018</moreinfo>
    </person>
    <person key="datamove-2018-idp178384">
      <firstname>Henrique</firstname>
      <lastname>Colao Zanuz</lastname>
      <categoryPro>Stagiaire</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, from Feb 2018 until Jun 2018</moreinfo>
    </person>
    <person key="datamove-2018-idp180864">
      <firstname>Konstantinos</firstname>
      <lastname>Dogeas</lastname>
      <categoryPro>Stagiaire</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Institut polytechnique de Grenoble, from Feb 2018 until Aug 2018</moreinfo>
    </person>
    <person key="datamove-2018-idp183376">
      <firstname>Antoine</firstname>
      <lastname>Duquennoy</lastname>
      <categoryPro>Stagiaire</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, until Jun 2018</moreinfo>
    </person>
    <person key="datamove-2018-idp185840">
      <firstname>Pathikrit</firstname>
      <lastname>Ghosh</lastname>
      <categoryPro>Stagiaire</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, until Jul 2018</moreinfo>
    </person>
    <person key="datamove-2018-idp188304">
      <firstname>Carlos Eduardo</firstname>
      <lastname>Gomez Hernandez</lastname>
      <categoryPro>Stagiaire</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, from Apr 2018 until Aug 2018</moreinfo>
    </person>
    <person key="datamove-2018-idp190784">
      <firstname>Florian</firstname>
      <lastname>Groguelin</lastname>
      <categoryPro>Stagiaire</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, until Jun 2018</moreinfo>
    </person>
    <person key="datamove-2018-idp193248">
      <firstname>Quentin</firstname>
      <lastname>Guilloteau</lastname>
      <categoryPro>Stagiaire</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, Jun 2018</moreinfo>
    </person>
    <person key="datamove-2018-idp195712">
      <firstname>Ciceron</firstname>
      <lastname>Kapena Bantu Muetu</lastname>
      <categoryPro>Stagiaire</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Institut polytechnique de Grenoble, until Jun 2018</moreinfo>
    </person>
    <person key="datamove-2018-idp198208">
      <firstname>Tuan Hiep</firstname>
      <lastname>Pham</lastname>
      <categoryPro>Stagiaire</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, from Feb 2018 until Aug 2018</moreinfo>
    </person>
    <person key="datamove-2018-idp200688">
      <firstname>Saurabh Manish</firstname>
      <lastname>Raje</lastname>
      <categoryPro>Stagiaire</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, from Sep 2018</moreinfo>
    </person>
    <person key="datamove-2018-idp203152">
      <firstname>Ning</firstname>
      <lastname>Tang</lastname>
      <categoryPro>Stagiaire</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, until Jul 2018</moreinfo>
    </person>
    <person key="datamove-2018-idp205616">
      <firstname>Dinh Khoa</firstname>
      <lastname>Tran</lastname>
      <categoryPro>Stagiaire</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, until Jun 2018</moreinfo>
    </person>
    <person key="datamove-2018-idp208080">
      <firstname>Tuo</firstname>
      <lastname>Zhao</lastname>
      <categoryPro>Stagiaire</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, until Jun 2018</moreinfo>
    </person>
    <person key="polaris-2018-idp152176">
      <firstname>Annie</firstname>
      <lastname>Simon</lastname>
      <categoryPro>Assistant</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria</moreinfo>
    </person>
  </team>
  <presentation id="uid2">
    <bodyTitle>Overall Objectives</bodyTitle>
    <subsection id="uid3" level="1">
      <bodyTitle>Overall Objectives</bodyTitle>
      <p>Moving data on large supercomputers is becoming a major performance bottleneck, and the situation is expected to worsen even more at exascale and beyond. Data transfer capabilities are growing at a slower rate than processing power ones. The profusion of flops available will be difficult to use efficiently due to constrained communication capabilities. Moving data is also an important source of power consumption. The DataMove team focuses on <b>data aware large scale computing</b>, investigating approaches to reduce data movements on large scale HPC machines. We will investigate data aware scheduling algorithms for job management systems. The growing cost of data movements requires adapted scheduling policies able to take into account the influence of intra-application communications, IOs as well as contention caused by data traffic generated by other concurrent applications.
At the same time experimenting new scheduling policies on real platforms is unfeasible.
Simulation tools are required to probe novel scheduling policies.
Our goal is to investigate how to extract information from actual compute
centers traces in order to replay job allocations and executions
with new scheduling policies.
Schedulers need information about the jobs behavior on the target machine
to actually make efficient allocation decisions.
We will research approaches relying on learning techniques applied
to execution traces to extract data and forecast job behaviors.
In addition to traditional computation intensive numerical simulations,
HPC platforms also need to execute more and more often data intensive
processing tasks like data analysis.
In particular, the ever growing amount of data generated by numerical
simulation calls for a tighter integration between the simulation
and the data analysis.
The goal is to reduce the data traffic and to speed-up result analysis by processing results in-situ, i.e. as closely as possible to the locus and time of data generation. Our goal is here to investigate how to program and schedule such analysis workflows in the HPC context, requiring the development of adapted resource sharing strategies, data structures and parallel analytics schemes. To tackle these issues, we will intertwine theoretical research and practical developments to elaborate solutions generic and effective enough to be of practical interest. Algorithms with performance guarantees will be designed and experimented on large scale platforms with realistic usage scenarios developed with partner scientists or based on logs of the biggest available computing platforms. Conversely, our strong experimental expertise will enable to feed theoretical models with sound hypotheses, to twist proven algorithms with practical heuristics that could be further retro-feeded into adequate theoretical models.</p>
    </subsection>
  </presentation>
  <fondements id="uid4">
    <bodyTitle>Research Program</bodyTitle>
    <subsection id="uid5" level="1">
      <bodyTitle>Motivation</bodyTitle>
      <p>Today's largest supercomputers <footnote id="uid6" id-text="1">Top500 Ranking, <ref xlink:href="http://www.top500.org" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>www.<allowbreak/>top500.<allowbreak/>org</ref></footnote> are composed of few millions of cores, with performances almost reaching 100 PetaFlops <footnote id="uid7" id-text="2"><formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msup><mn>10</mn><mn>15</mn></msup></math></formula> floating point operations per second</footnote> for the largest machine. Moving data in such large supercomputers is becoming a major performance bottleneck, and the situation is expected to worsen even more at exascale and beyond. The data transfer capabilities are growing at a slower rate than processing power ones. The profusion of available flops will very likely be underused due to constrained communication capabilities. It is commonly admitted that data movements account for 50% to 70% of the global power consumption <footnote id="uid8" id-text="3">SciDAC Review, 2010</footnote>. Thus, data movements are potentially one of the most important source of savings for enabling supercomputers to stay in the commonly adopted energy barrier of 20 MegaWatts. In the mid to long term, non volatile memory (NVRAM) is expected to deeply change the machine I/Os. Data distribution will shift from disk arrays with an access time often considered as uniform, towards permanent storage capabilities at each node of the machine, making data locality an even more prevalent paradigm.</p>
      <p>The proposed DataMove team will work on <b>optimizing data movements for large scale computing</b> mainly at two related levels:</p>
      <simplelist>
        <li id="uid9">
          <p noindent="true">Resource allocation</p>
        </li>
        <li id="uid10">
          <p noindent="true">Integration of numerical simulation and data analysis</p>
        </li>
      </simplelist>
      <p>The resource and job management system (also called batch scheduler or RJMS) is in charge of allocating resources upon user requests for executing their parallel applications.
The growing cost of data movements requires adapted scheduling policies able to take into account the influence of intra-application communications, I/Os as well as contention caused by data traffic generated by other concurrent applications.
Modelling the application behavior to anticipate its actual resource usage on such architecture is known to be challenging, but it becomes
critical for improving performances (execution time, energy, or any other relevant objective). The job management system also needs to handle new types of workloads: high performance platforms now need to execute more and more often data intensive processing tasks like data analysis in addition to traditional computation intensive numerical simulations. In particular, the ever growing amount of data generated by numerical simulation calls for a tighter integration between the simulation and the data analysis. The challenge here is to reduce data traffic and to speed-up result analysis by performing result processing (compression, indexation, analysis, visualization, etc.) as closely as possible to the locus and time of data generation. This emerging trend called <i>in-situ analytics</i> requires to revisit the traditional workflow (loop of batch processing followed by postmortem analysis). The application becomes a whole including the simulation, in-situ processing and I/Os. This motivates the development of new well-adapted resource sharing strategies, data structures and parallel analytics schemes to efficiently interleave the different components of the application and globally improve the performance.
</p>
    </subsection>
    <subsection id="uid11" level="1">
      <bodyTitle>Strategy</bodyTitle>
      <p>DataMove targets HPC (High Performance Computing) at Exascale. But such machines and the associated applications are expected to be available only in 5 to 10 years.
Meanwhile, we expect to see a growing number of petaflop machines to answer the needs for advanced numerical simulations. A sustainable exploitation of these petaflop machines is a real and hard challenge that we will address. We may also see in the coming years a convergence between HPC and Big Data, HPC platforms becoming more elastic and supporting Big Data jobs, or HPC applications being more commonly executed on cloud like architectures. This is the second top objective of the 2015 US Strategic Computing Initiative  <footnote id="uid12" id-text="4"><ref xlink:href="https://www.whitehouse.gov/the-press-office/2015/07/29/executive-order-creating-national-strategic-computing-initiative" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>www.<allowbreak/>whitehouse.<allowbreak/>gov/<allowbreak/>the-press-office/<allowbreak/>2015/<allowbreak/>07/<allowbreak/>29/<allowbreak/>executive-order-creating-national-strategic-computing-initiative</ref></footnote>: <i>Increasing coherence between the technology base used for modelling and simulation and that used for data analytic computing</i>. We will contribute to that convergence at our level, considering more dynamic and versatile target platforms and types of workloads.</p>
      <p>Our approaches should entail minimal modifications on the code of numerical simulations. Often large scale numerical simulations are complex domain specific codes with a long life span. We assume these codes as being sufficiently optimized. We will influence the behavior of numerical simulations through resource allocation at the job management system level or when interleaving them with analytics code.</p>
      <p>To tackle these issues, we propose to intertwine theoretical research and practical developments in an agile mode. Algorithms with performance guarantees will be designed and experimented on large scale platforms with realistic usage scenarios developed with partner scientists or based on logs of the biggest available computing platforms (national supercomputers like Curie, or the BlueWaters machine accessible through our collaboration with Argonne National Lab). Conversely, a strong experimental expertise will enable to feed theoretical models with sound hypotheses, to twist proven algorithms with practical heuristics that could be further retro-feeded into adequate theoretical models.</p>
      <p>A central scientific question is to make the relevant choices for optimizing performance (in a broad sense) in a reasonable time. HPC architectures and applications are increasingly complex systems (heterogeneity, dynamicity, uncertainties), which leads to consider the <b>optimization of resource allocation based on multiple objectives</b>, often contradictory (like energy and run-time for instance). Focusing on the optimization of one particular objective usually leads to worsen the others. The historical positioning of some members of the team who are specialists in multi-objective optimization is to generate a (limited) set of trade-off configurations, called <i>Pareto points</i>, and choose when required the most suitable trade-off between all the objectives. This methodology differs from the classical approaches, which simplify the problem into a single objective one (focus on a particular objective, combining the various objectives or agglomerate them). The real challenge is thus to combine algorithmic techniques to account for this diversity while guaranteeing a target efficiency for all the various objectives.</p>
      <p>The DataMove team aims to elaborate generic and effective solutions of practical interest. We will make our new algorithms accessible through the team flagship software tools, <b>the OAR batch scheduler and the in-situ processing framework FlowVR</b>. We will maintain and enforce strong links with teams closely connected with large architecture design and operation (CEA DAM, BULL, Argonne National Lab), as well as scientists of other disciplines, in particular computational biologists, with whom we will elaborate and validate new usage scenarios (IBPC, CEA DAM, EDF).
</p>
    </subsection>
    <subsection id="uid13" level="1">
      <bodyTitle>Research Directions</bodyTitle>
      <p>DataMove research activity is organised around three directions. When a parallel job executes on a machine, it triggers data movements through the
input data it needs to read, the results it produces (simulation results as well as traces) that need to be stored in the file system, as well as internal communications and temporary storage (for fault tolerance related data for instance). Modeling in details the simulation and the target machines to analyze scheduling policies
is not feasible at large scales. We propose to investigate alternative approaches, including learning approaches, to capture and model the influence of data movements on the
performance metrics of each job execution to develop <b>Data Aware Batch Scheduling</b> models and algorithms (Sec. <ref xlink:href="#uid15" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>).
Experimenting new scheduling policies on real platforms at scale is unfeasible.
Theoretical performance guarantees are not sufficient to ensure a new
algorithm will actually perform as expected on a real platform.
An intermediate evaluation level is required to probe novel scheduling policies.
The second research axe focuses on the
<b>Empirical Studies of Large Scale Platforms</b> (Sec. <ref xlink:href="#uid21" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>).
The goal is to investigate how we could extract from actual
computing centers traces information to replay the job allocations and executions
on a simulated or emulated platform with new scheduling policies.
Schedulers need information about jobs behavior on target machines
to actually be able to make efficient allocation decisions.
Asking users to caracterize jobs often does not lead to reliable information.
The third research direction
<b>Integration of High Performance Computing and Data Analytics</b> (Sec. <ref xlink:href="#uid27" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>)
addresses the data movement issue from a different perspective.
New data analysis techniques on the HPC platform introduce new type of workloads,
potentially more data than compute intensive,
but could also enable to reduce data movements by directly enabling
to pipe-line simulation execution with a live analysis of the produced results.
Our goal is here to investigate how to program and schedule such analysis workflows in the HPC context.
</p>
    </subsection>
  </fondements>
  <domaine id="uid14">
    <bodyTitle>Application Domains</bodyTitle>
    <subsection id="uid15" level="1">
      <bodyTitle>Data Aware Batch Scheduling</bodyTitle>
      <p>Large scale high performance computing platforms are becoming
increasingly complex. Determining efficient allocation and
scheduling strategies that can adapt to technological evolutions is a
strategic and difficult challenge. We are interested in
scheduling jobs in hierarchical and heterogeneous large scale
platforms. On such platforms, application developers typically submit their jobs in
centralized waiting queues. The job management system aims at
determining a suitable allocation for the jobs, which all compete
against each other for the available computing resources.
Performances are measured using different classical metrics like maximum
completion time or slowdown. Current systems make use of very simple (but fast)
algorithms that however rely on simplistic platform and execution models, and thus,
have limited performances.</p>
      <p>For all target scheduling problems we aim to provide both theoretical analysis and
complementary analysis through simulations. Achieving meaningful results will require strong improvements on existing models
(on power for example) and the design of new approximation algorithms with various objectives such as stretch, reliability,
throughput or energy consumption, while keeping in focus the need for a low-degree polynomial complexity.</p>
      <subsection id="uid16" level="2">
        <bodyTitle>Algorithms</bodyTitle>
        <p>The most common batch scheduling policy is to consider the jobs according to the First Come First Served order
(FCFS) with backfilling (BF). BF is the most widely used policy due to its easy and robust implementation and known benefits such as high system utilization. It is well-known that this strategy does not optimize any sophisticated function, but it is simple to implement and it guarantees that there is no starvation (i.e. every job will be scheduled at some moment).</p>
        <p>More advanced algorithms are seldom used on production platforms due to both the gap
between theoretical models and practical systems and speed constraints. When looking at
theoretical scheduling problems, the generally accepted goal is to
provide polynomial algorithms (in the number of submitted jobs and the number of involved computing units).
However, with millions of processing cores where every process and data transfer have to be individually
scheduled, polynomial algorithms are prohibitive as soon as the
polynomial degree is too large. The model of <i>parallel tasks</i> simplifies this
problem by bundling many threads and communications into single boxes,
either rigid, rectangular or malleable.
Especially malleable tasks capture the dynamicity of the execution. Yet these models are
ill-adapted to heterogeneous platforms, as the running time depends on
more than simply the number of allotted resources, and some of the
common underlying assumptions on the speed-up functions (such as
monotony or concavity) are most often only partially verified.</p>
        <p>In practice, the job execution times depend on their allocation (due to
communication interferences and heterogeneity in both computation and
communication), while theoretical models of parallel jobs usually
consider jobs as black boxes with a fixed (maximum) execution time. Though
interesting and powerful, the classical models (namely, synchronous PRAM model, delay,
LogP) and their variants (such as hierarchical delay), are
not well-suited to large scale parallelism on platforms where the cost of
moving data is significant, non uniform and may change over time. Recent studies are still
refining such models in order to take into account communication contentions
more accurately while remaining tractable enough to provide a useful tool
for algorithm design.</p>
        <p>Today, all algorithms in use in production systems are oblivious
to communications. One of our main goals is to <b>design a new generation
of scheduling algorithms fitting more closely job schedules according
to platform topologies</b>.</p>
      </subsection>
      <subsection id="uid17" level="2">
        <bodyTitle>Locality Aware Allocations</bodyTitle>
        <p>Recently, we developed modifications of the standard back-filling algorithm taking into account platform
topologies.
The proposed algorithms take into account locality and contiguity
in order to hide communication patterns within parallel tasks.
The main result here is to establish good lower bounds and small approximation ratios for policies respecting the locality constraints.
The algorithms work in an online fashion, improving the global behavior of the system while still keeping a low running time.
These improvements rely mainly on our past experience in designing approximation algorithms.
Instead of relying on complex networking models and communication patterns for
estimating execution times, the communications are disconnected from the execution time.
Then, the scheduling problem leads to a trade-off: optimizing locality
of communications on one side and a performance objective (like the makespan or stretch) on the other side.</p>
        <p>In the perspective of taking care of locality, other ongoing works include the study of schedulers for platforms whose interconnection network
is a static structured topology (like the 3D-torus of the BlueWaters platform we work on in collaboration with the Argonne National Laboratory).
One main characteristic of this 3D-torus platform is to provide I/O nodes at
specific locations in the topology. Applications generate and access specific data
and are thus bounded to specific I/O nodes.
Resource allocations are constrained in a strong and unusual way. This problem is close for actual hierarchical platforms.
The scheduler needs to compute a schedule such that I/O nodes requirements are
filled for each application while at the same time
avoiding communication interferences.
Moreover, extra constraints can arise for applications requiring accelerators
that are gathered on the nodes at the edge of the network topology.</p>
        <p>While current results are encouraging, they are however limited in performance by
the low amount of information available to the scheduler. We look forward to
extend ongoing work by progressively increasing application and network knowledge (by technical mechanisms like profiling or monitoring or by more sophisticated methods like learning).
It is also important to anticipate on application resource usage in terms of compute units, memory as well as network and I/Os to
efficiently schedule a mix of applications with different profiles.
For instance, a simple solution is to partition the jobs as "communication intensive" or
"low communications". Such a tag could be achieved by the users them selves or obtained by learning techniques.
We could then schedule low communications jobs using leftover spaces while taking care of high communication jobs.
More sophisticated options are possible, for instance those that use more detailed communication patterns and networking models.
Such options would leverage the work proposed in Section <ref xlink:href="#uid21" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> for gathering application traces.</p>
      </subsection>
      <subsection id="uid18" level="2">
        <bodyTitle>Data-Centric Processing</bodyTitle>
        <p>Exascale computing is shifting away from the traditional compute-centric models to a more data-centric one.
This is driven by the evolving nature of large scale distributed computing, no longer dominated by pure computations
but also by the need to handle and analyze large volumes of data. These data can be large databases of results, data streamed from
a running application or another scientific instrument (collider for instance). These new workloads call for specific resource allocation strategies.</p>
        <p>Data movements and storage are expected to be a major energy and performance bottleneck on next generation platforms.
Storage architectures are also evolving, the standard centralized parallel file system being complemented with local persistent storage (Burst Buffers, NVRAM).
Thus, one data producer can stage data on some nodes' local storage, requiring to schedule close by the associated analytics tasks to limit data movements.
This kind of configuration, often referred as <i>in-situ analytics</i>, is expected to become common as it enables to switch from the traditional I/O intensive workflow (batch-processing followed by <i>post mortem</i> analysis and visualization) to a more storage conscious approach where data are processed as closely as possible to where and when they are produced (in-situ processing is addressed in details in section <ref xlink:href="#uid27" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>).
By reducing data movements and scheduling the extra processing on resources not fully exploited yet, in-situ processing is expected to have also a significant positive energetic impact. Analytics codes can be executed in the same nodes than the application, often on dedicated cores commonly called helper cores, or on dedicated nodes called stagging nodes. The results are either forwarded to the users for visualization or saved to disk through I/O nodes. In-situ analytics can also take benefit of node local disks or burst buffers to reduce data movements.
Future job scheduling strategies should take into account in-situ processes in addition to the job allocation to optimize both energy consumption and execution time.
On the one hand, this problem can be reduced to an allocation problem of extra asynchronous tasks to idle computing units. But on the other hand, embedding analytics in applications brings extra difficulties by making the application more heterogeneous and imposing more constraints (data affinity) on the required resources.
Thus, the main point here is to develop efficient algorithms for dealing with heterogeneity without increasing the global computational cost.</p>
      </subsection>
      <subsection id="uid19" level="2">
        <bodyTitle>Learning</bodyTitle>
        <p>Another important issue is to adapt the job management system to deal with the bad effects of uncertainties, which may be catastrophic in large scale heterogeneous HPC platforms
(jobs delayed arbitrarly far or jobs killed).
A natural question is then: <i>is it possible to have a good estimation of the job and platform parameters in order to be able to obtain a better scheduling ?</i>
Many important parameters (like the number or type of required resources or the estimated running time of the jobs) are asked to the users when they submit their jobs. However, some of these values are not accurate and in many cases, they are not even provided by the end-users.
In DataMove, we propose to study new methods for a better prediction of the characteristics of the jobs and their execution in order to improve the optimization process. In particular, the methods well-studied in the field of big data (in supervised Machine Learning, like classical regression methods, Support Vector Methods, random forests, learning to rank techniques or deep learning) could and must be used to improve job scheduling in large scale HPC platforms. This topic received a great attention recently in the field of parallel and distributed processing.
A preliminary study has been done recently by our team with the target of predicting the job running times (called wall times).
We succeeded to improve significantly in average the reference EASY Back Filling algorithm by estimating the wall time of the jobs, however,
this method leads to big delay for the stretch of few jobs.
Even if we succeed in determining more precisely hidden parameters, like the wall time of the jobs, this is not enough to determine an optimized solution.
The shift is not only to learn on dedicated parameters but also on the scheduling policy. The data collected from the accounting and profiling of jobs can be used to better understand the needs of the jobs and through learning to propose adaptations for future submissions. The goal is to propose extensions to further improve the job scheduling and improve the performance and energy efficiency of the application. For instance preference learning may enable to compute on-line new priorities to back-fill the ready jobs.</p>
      </subsection>
      <subsection id="uid20" level="2">
        <bodyTitle>Multi-objective Optimization</bodyTitle>
        <p>Several optimization questions that arise in allocation and scheduling problems lead to the study of several objectives at the same time.
The goal is then not a single optimal solution, but a more complicated mathematical object that captures the notion of trade-off.
In broader terms, the goal of multi-objective optimization is not to externally arbitrate on disputes between entities with different
goals, but rather to explore the possible solutions to highlight the whole range of interesting compromises.
A classical tool for studying such multi-objective optimization problems is to use <i>Pareto curves</i>.
However, the full description of the Pareto curve can be very hard because of both the number of solutions and the hardness of computing each point.
Addressing this problem will opens new methodologies for the analysis of algorithms.</p>
        <p>To further illustrate this point here are three possible case studies with emphasis on conflicting interests measured with
different objectives. While these cases are good representatives of our HPC context, there are other pertinent trade-offs we may
investigate depending on the technology evolution in the coming years. This enumeration is certainly not limitative.</p>
        <p><b>Energy versus Performance</b>.
The classical scheduling algorithms designed for the purpose of performance can no longer be used because performance and energy are contradictory objectives to some extent.
The scheduling problem with energy becomes a multi-objective problem in nature since the energy consumption should be considered as equally important as performance at exascale.
A global constraint on energy could be a first idea for determining trade-offs but
the knowledge of the Pareto set (or an approximation of it) is also very useful.</p>
        <p><b>Administrators versus application developers</b>.
Both are naturally interested in different objectives:
In current algorithms, the performance is mainly computed from the point of view of administrators, but the users should be in the loop since they can give useful information and help to the construction of better schedules.
Hence, we face again a multi-objective problem where, as in the above case, the approximation of the Pareto set provides the trade-off between the administrator view and user demands.
Moreover, the objectives are usually of the same nature.
For example, <i>max stretch</i> and <i>average stretch</i> are two objectives based on the slowdown factor that can interest administrators and users, respectively.
In this case the study of the norm of stretch can be also used to describe the trade-off
(recall that the <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>L</mi><mn>1</mn></msub></math></formula>-norm corresponds to the average objective while the <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>L</mi><mi>∞</mi></msub></math></formula>-norm to the max objective).
Ideally, we would like to design an algorithm that gives good approximate solutions at the same time for all norms.
The <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>L</mi><mn>2</mn></msub></math></formula> or <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>L</mi><mn>3</mn></msub></math></formula>-norm are useful since they describe the performance of the whole schedule from the administrator point of view as well as they provide a fairness indication to the users.
The hard point here is to derive theoretical analysis for such complicated tools.</p>
        <p><b>Resource Augmentation</b>.
The classical resource augmentation models, i.e. speed and machine augmentation, are not sufficient to get good results when the execution of jobs cannot be frequently interrupted.
However, based on a resource augmentation model recently introduced, where the algorithm may reject a small number of jobs,
some members of our team have given the first interesting results in the non-preemptive direction.
In general, resource augmentation can explain the intuitive good behavior of some greedy algorithms while, more interestingly, it can give ideas for new algorithms. For example, in the rejection context we could dedicate a small number of nodes for the usually problematic rejected jobs.
Some initial experiments show that this can lead to a schedule for the remaining jobs that is very close to the optimal one.</p>
      </subsection>
    </subsection>
    <subsection id="uid21" level="1">
      <bodyTitle>Empirical Studies of Large Scale Platforms</bodyTitle>
      <p>Experiments or realistic simulations are required to take into account
the impact of allocations and assess the real behavior of scheduling algorithms.
While theoretical models still have their interest to lay the
groundwork for algorithmic designs, the models are necessarily
reflecting a purified view of the reality. As transferring our
algorithm in a more practical setting is an important part of our
creed, we need to ensure that the theoretical results found using
simplified models can really be transposed to real situations.
On the way to exascale computing, large scale systems become harder
to study, to develop or to calibrate because of the costs in both time
and energy of such processes. It is often impossible to convince
managers to use a production cluster for several hours simply to test
modifications in the RJMS. Moreover, as the existing RJMS production
systems need to be highly reliable, each evolution requires several
real scale test iterations. The consequence is that scheduling
algorithms used in production systems are mostly outdated and not
customized correctly. To circumvent this pitfall, we need to develop tools and methodologies for alternative empirical studies, from analysis of workload traces, to job models, simulation and emulation with reproducibility concerns.</p>
      <subsection id="uid22" level="2">
        <bodyTitle>Workload Traces with Resource Consumption</bodyTitle>
        <p>Workload traces are the base element to capture the behavior of complete systems composed of submitted jobs, running applications, and operating tools. These traces must be obtained on production platforms to provide relevant and representative data. To get a better understanding of the use of such systems, we need to look at both, how the jobs interact with the job management system, and how they use the allocated resources. We propose a general workload trace format that adds jobs resource consumption to the commonly used SWF <footnote id="uid23" id-text="5">Standard Workload Format: http://www.cs.huji.ac.il/labs/parallel/workload/swf.html</footnote> workload trace format. This requires to instrument the platforms, in particular to trace resource consumptions like CPU, data movements at memory, network and I/O levels, with an acceptable performance impact. In a previous work we studied and proposed a dedicated job monitoring tool whose impact on the system has been measured as lightweight (0.35<formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mo>%</mo></math></formula> speed-down) with a 1 minute sampling rate. Other tools also explore job monitoring, like TACC Stats. A unique feature from our tool is its ability to monitor distinctly jobs sharing common nodes.</p>
        <p>Collected workload traces with jobs resource consumption will be publicly released and serve to provide data for works presented in Section <ref xlink:href="#uid15" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. The trace analysis is expected to give valuable insights to define models encompassing complex behaviours like network topology sensitivity, network congestion and resource interferences.</p>
        <p>We expect to join efforts with partners for collecting quality traces (ATOS/Bull, Ciment meso center, Joint Laboratory on Extreme Scale Computing) and will collaborate with the Inria team POLARIS for their analysis.</p>
      </subsection>
      <subsection id="uid24" level="2">
        <bodyTitle>Simulation</bodyTitle>
        <p>Simulations of large scale systems are faster by multiple orders of
magnitude than real experiments. Unfortunately, replacing experiments
with simulations is not as easy as it may sound, as it brings a host
of new problems to address in order to ensure that the simulations are
closely approximating the execution of typical workloads on real
production clusters. Most of these problems are actually not directly
related to scheduling algorithms assessment, in the sense that the
workload and platform models should be defined independently from
the algorithm evaluations, in order to ensure a fair assessment of
the algorithms' strengths and weaknesses. These research
topics (namely platform modeling, job models and simulator calibration)
are addressed in the other subsections.</p>
        <p>We developed an open source platform simulator within
DataMove (in conjunction with the OAR development
team) to provide a widely distributable test
bed for reproducible scheduling algorithm evaluation. Our simulator,
named Batsim, allows to simulate the behavior of a computational
platform executing a workload scheduled by any given scheduling
algorithm. To obtain sound simulation results and to broaden the scope
of the experiments that can be done thanks to Batsim, we did not chose
to create a (necessarily limited) simulator from scratch, but instead
to build on top of the SimGrid simulation framework.</p>
        <p>To be open to as many batch schedulers as possible, Batsim
decouples the platform simulation and the scheduling decisions in two
clearly-separated software components communicating through a complete
and documented protocol. The Batsim component is in charge of
simulating the computational resources behaviour whereas the scheduler
component is in charge of taking scheduling decisions. The scheduler
component may be both a resource and a job management system. For
jobs, scheduling decisions can be to execute a job, to delay its
execution or simply to reject it. For resources, other decisions can
be taken, for example to change the power state of a machine i.e. to
change its speed (in order to lower its energy consumption) or to
switch it on or off. This separation of concerns also enables
interfacing with potentially any commercial RJMS, as long as the
communication protocol with Batsim is implemented. A proof of concept
is already available with the OAR RJMS.</p>
        <p>Using this test bed opens new research perspectives. It allows to test a
large range of platforms and workloads to better understand the real
behavior of our algorithms in a production setting. In turn, this
opens the possibility to tailor algorithms for a particular platform
or application, and to precisely identify the possible shortcomings of
the theoretical models used.</p>
      </subsection>
      <subsection id="uid25" level="2">
        <bodyTitle>Job and Platform Models</bodyTitle>
        <p>The central purpose of the Batsim simulator is to simulate job behaviors on a given target platform under a given resource allocation policy. Depending on the workload, a significant number of jobs are parallel applications with communications and file system accesses. It is not conceivable to simulate individually all these operations for each job on large plaforms with their associated workload due to implied simulation complexity. The challenge is to define a coarse grain job model accurate enough to reproduce parallel application behavior according to the target platform characteristics. We will explore models similar to the BSP (Bulk Synchronous Program) approach that decomposes an application in local computation supersteps ended by global communications and a global synchronization. The model parameters will be established by means of trace analysis as discussed previously, but also by instrumenting some parallel applications to capture communication patterns.
This instrumentation will have a significant impact on the concerned application performance, restricting its use to a few applications only. There are a lot of recurrent applications executed on HPC platform, this fact will help to reduce the required number of instrumentations and captures.
To assign each job a model, we are considering to adapt the concept of application signatures as proposed in.
Platform models and their calibration are also required. Large parts of these models, like those related to network, are provided by Simgrid. Other parts as the filesystem and energy models are comparatively recent and will need to be enhanced or reworked to reflect the HPC platform evolutions. These models are then generally calibrated by running suitable benchmarks.</p>
      </subsection>
      <subsection id="uid26" level="2">
        <bodyTitle>Emulation and Reproducibility</bodyTitle>
        <p>The use of coarse models in simulation implies to set aside some details. This simplification may hide system behaviors that could impact significantly and negatively the metrics we try to enhance. This issue is particularly relevant when large scale platforms are considered due to the impossibility to run tests at nominal scale on these real platforms. A common approach to circumvent this issue is the use of emulation techniques to reproduce, under certain conditions, the behavior of large platforms on smaller ones.
Emulation represents a natural complement to simulation by allowing to execute directly large parts of the actual evaluated software and system, but at the price of larger compute times and a need for more resources.
The emulation approach was chosen in to compare two job management systems from workload traces of the CURIE supercomputer (80000 cores). The challenge is to design methods and tools to emulate with sufficient accuracy the platform and the workload (data movement, I/O transfers, communication, applications interference). We will also intend to leverage emulation tools like Distem from the MADYNES team. It is also important to note that the Batsim simulator also uses emulation techniques to support the core scheduling module from actual RJMS. But the integration level is not the same when considering emulation for larger parts of the system (RJMS, compute node, network and filesystem).</p>
        <p>Replaying traces implies to prepare and manage complex software stacks including the OS, the resource management system, the distributed filesystem and the applications as well as the tools required to conduct experiments. Preparing these stacks generate specific issues, one of the major one being the support for reproducibility. We propose to further develop the concept of reconstructability to improve experiment reproducibility by capturing the build process of the complete software stack. This approach ensures reproducibility over time better than other ways
by keeping all data (original packages, build recipe and Kameleon engine) needed to build the software stack.</p>
        <p>In this context, the Grid'5000 (see Sec. <ref xlink:href="#uid47" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>) experimentation infrastructure that gives users the control on the complete software stack is a crucial tool for our research goals. We will pursue our strong implication in this infrastructure.
</p>
      </subsection>
    </subsection>
    <subsection id="uid27" level="1">
      <bodyTitle>Integration of High Performance Computing and Data Analytics</bodyTitle>
      <p>Data produced by large simulations are traditionally handled by an I/O layer that moves them from
the compute cores to the file system. Analysis of these data are performed after reading them back
from files, using some domain specific codes or some scientific visualisation libraries like VTK.
But writing and then reading back these data generates a lot of data movements and puts under pressure
the file system. To reduce these data movements, <b>the in situ analytics
paradigm proposes to process the data as closely as possible to where and when the data are
produced</b>. Some early solutions emerged either as extensions of visualisation
tools or of I/O libraries like ADIOS. But significant
progresses are still required to provide efficient and flexible high performance scientific data analysis
tools. Integrating data analytics in the HPC context will have an impact on resource allocation
strategies, analysis algorithms, data storage and access, as well as computer architectures and
software infrastructures. But this paradigm shift imposed by the machine performance also
sets the basis for a deep change on the way users work with numerical simulations.
The traditional workflow needs to be reinvented to make HPC more user-centric, more interactive
and turn HPC into a commodity tool for scientific discovery and engineering developments.
In this context DataMove aims at investigating programming environments for in situ analytics
with a specific focus on task scheduling in particular, to ensure an efficient sharing of resources with the simulation.</p>
      <subsection id="uid28" level="2">
        <bodyTitle>Programming Model and Software Architecture</bodyTitle>
        <p>In situ creates a tighter loop between the scientist and her/his simulation. As such, an in situ
framework needs to be flexible to let the user define and deploy its own set of analysis. A
manageable flexibility requires to favor simplicity and understandability, while still enabling an
efficient use of parallel resources. Visualization libraries like VTK
or Visit, as well as domain specific environments like VMD have initially been developed for traditional post-mortem
data analysis. They have been extended to support in situ processing with some simple resource
allocation strategies
but the level of performance, flexibility and
ease of use that is expected requires to rethink new environments. There is a need to develop a middleware and programming
environment taking into account in its fundations this specific context of high performance scientific
analytics.</p>
        <p>Similar needs for new data processing architectures occurred for the
emerging area of Big Data Analytics, mainly targeted to web data on
cloud-based infrastructures. Google Map/Reduce and its successors like Spark or
Stratosphere/Flink have been designed to match the specific context of
efficient analytics for large volumes of data produced on the web, on
social networks, or generated by business applications. These systems
have mainly been developed for cloud infrastructures based on commodity
architectures. They do not leverage the specifics of HPC
infrastructures. Some preliminary adaptations have been proposed for
handling scientific data in a HPC
context. However, these approaches do not support
in situ processing.</p>
        <p>Following the initial development of FlowVR, our middleware for in situ processing,
we will pursue our effort to develop a programming environment and software architecture for high
performance scientific data analytics. Like FlowVR, the map/reduce tools, as well as the machine
learning frameworks like TensorFlow, adopted a dataflow graph for
expressing analytics pipe-lines. We are convinced that this dataflow approach is both easy to
understand and yet expresses enough concurrency to enable efficient executions. The graph description
can be compiled towards lower level representations, a mechanism that is intensively used by
Stratosphere/Flink for instance. Existing in situ frameworks, including FlowVR, inherit from the
HPC way of programming with a thiner software stack and a programming model close to the machine.
Though this approach enables to program high performance applications, this is usually too low level
to enable the scientist to write its analysis pipe-line in a short amount of time. The data model, i.e. the data semantics level accessible at the framework level
for error check and optimizations, is also a fundamental aspect of such environments. The key/value store has been adopted by all map/reduce
tools. Except in some situations, it cannot be adopted as such for
scientific data. Results from numerical simulations are often more structured than web data,
associated with acceleration data structures to be processed
efficiently. We will investigate data models for scientific data building on existing approaches like Adios or DataSpaces.</p>
      </subsection>
      <subsection id="uid29" level="2">
        <bodyTitle>Resource Sharing</bodyTitle>
        <p>To alleviate the I/O bottleneck, the in situ paradigm proposes to start processing data as soon as
made available by the simulation, while still residing in the memory of the compute node. In situ
processings include data compression, indexing, computation of various types of descriptors (1D, 2D,
images, etc.). Per se, reducing data output to limit I/O related performance drops or keep the
output data size manageable is not new. Scientists have relied on solutions as simple as decreasing
the frequency of result savings. In situ processing proposes to move one step further, by providing a full
fledged processing framework enabling scientists to more easily and thoroughly manage the available
I/O budget.</p>
        <p>The most direct way to perform in situ analytics is to inline computations directly in the
simulation code. In this case, in situ processing is executed in sequence with the simulation that
is suspended meanwhile. Though this approach is direct to implement and does not require complex framework
environments, it does not enable to overlap analytics related computations and data movements with the simulation execution,
preventing to efficiently use the available resources. Instead of relying on this simple time sharing approach, several works propose to
rely on space sharing where one or several cores per node, called <i>helper cores</i>, are dedicated
to analytics. The simulation responsibility is simply to handle a copy of the relevant data to the
node-local in situ processes, both codes being executed concurrently. This approach often lead to significantly beter performance than in-simulation analytics.</p>
        <p>For a better isolation of the simulation and in situ processes, one solution consists in offloading in situ tasks from the simulation nodes towards
extra dedicated nodes, usually called <i>staging nodes</i>. These computations are said to be
performed <i>in-transit</i>. But this approach may not always be beneficial compared to processing on simulation nodes due to the costs of
moving the data from the simulation nodes to the staging nodes.</p>
        <p>FlowVR enables to mix these different resources allocation strategies for the different stages of
an analytics pile-line. Based on a component model, the scientist designs analytics workflows
by first developing processing components that are next assembled in a dataflow graph through a
Python script. At runtime the graph is instantiated according to the execution context, FlowVR
taking care of deploying the application on the target architecture, and of coordinating the
analytics workflows with the simulation execution.</p>
        <p>But today the choice of the resource allocation strategy is mostly ad-hoc and defined by the
programmer. We will investigate solutions that enable a cooperative use of the resource between the
analytics and the simulation with minimal hints from the programmer. In situ processings inherit
from the parallelization scale and data distribution adopted by the simulation, and must execute
with minimal perturbations on the simulation execution (whose actual resource usage is difficult to
know a priori). We need to develop adapted scheduling strategies that operate at compile and run
time. Because analysis are often data intensive, such solutions must take into consideration data
movements, a point that classical scheduling strategies designed first for compute intensive
applications often overlook. We expect to develop new scheduling strategies relying on the
methodologies developed in Sec. <ref xlink:href="#uid20" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. Simulations as well as analysis are iterative processes exposing a strong spatial and temporal coherency that we can take benefit of to anticipate their behavior and then take
more relevant resources allocation strategies, possibly based on advanced learning algorithms or as developed in Section <ref xlink:href="#uid15" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>.</p>
        <p>In situ analytics represent a specific workload that needs to be scheduled very closely to the simulation, but not necessarily active during the full extent of the simulation execution and that may also require to access data from previous runs (stored in the file system or on specific burst-buffers). Several users may also need to run concurrent analytics pipe-lines on shared data. This departs significantly from the traditional batch scheduling model, motivating the need for a more elastic approach to resource provisioning. These issues will be conjointly addressed with research on batch scheduling policies (Sec. <ref xlink:href="#uid15" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>).</p>
      </subsection>
      <subsection id="uid30" level="2">
        <bodyTitle>Co-Design with Data Scientists</bodyTitle>
        <p>Given the importance of users in this context, it is of primary importance
that in situ tools be co-designed with advanced users, even if such multidisciplinary collaborations are challenging and require constant long term
investments to learn and understand the specific practices and expectations of the other domain.</p>
        <p>We will tightly collaborate with scientists of some application domains, like molecular dynamics or fluid simulation,
to design, develop, deploy and assess in situ analytics scenarios, as already done
with Marc Baaden, a computational biologist from LBT.</p>
        <p>We recently extended our collaboration network. We started in 2015 a PhD
co-advised with CEA DAM to investigate in situ analytics scenarios in the context of atomistic material simulations.
CEA DAM is a French energy lab hosting one of the largest european supercomputer.
They gather physicists, numerical scientists as well as high performance computer engineers,
making it a very interesting partner for developing new scientific data analysis solutions.
We also got a national grant (2015-2018) to compute in situ statistics for multi-parametric
parallel studies with the research department of French power company EDF.
In this context we collaborate with statisticians and fluid simulation experts to define in situ
scenarios, revisit the statistic operators to be amenable to in situ processing, and define an
adapted in situ framework.</p>
      </subsection>
    </subsection>
  </domaine>
  <logiciels id="uid31">
    <bodyTitle>New Software and Platforms</bodyTitle>
    <subsection id="uid32" level="1">
      <bodyTitle>FlowVR</bodyTitle>
      <p><span class="smallcap" align="left">Scientific Description:</span> FlowVR adopts the "data-flow" paradigm, where your application is divided as a set of components exchanging messages (think of it as a directed graph). FlowVR enables to encapsulate existing codes in components, interconnect them through data channels, and deploy them on distributed computing resources. FlowVR takes care of all the heavy lifting such as application deployment and message exchange.</p>
      <p>The base entity, called a module or component, is an autonomous process, potentially multi-threaded with tools like OpenMP, TBB, or deferring computations to a GPU or Xeon Phi. This module processes data coming from input ports and write data on output ports. A module has no global insight on where the data comes from or goes to. The programming interface is designed to limit code refactoring, easing turning an existing code into a FlowVR component. The three main functions are:</p>
      <p>wait(): Blocking function call that waits for the availability of new messages on input ports.
get(): Retrieve a handle to access the message received at the previous wait() call on a given input port.
put(): Notify FlowVR that a new message on a given output port is ready for dispatch.
FlowVR manages data transfers. Intra-node communications between two components take place through a shared memory segment, avoiding copies. Once the sender has prepared the data in a shared memory segment, it simply handles a pointer to the destination that can directly access them. Inter-node communications extend this mechanism, FlowVR taking care of packing and transferring the data from the source shared memory segment to the destination shared memory segment.</p>
      <p>Assembling components to build an application consists in writing a Python script, instanciate it according to the target machine. FlowVR will process it and prepare everything so that in one command line you can deploy and start your application.</p>
      <p noindent="true"><span class="smallcap" align="left">Functional Description:</span> FlowVR adopts the "data-flow" paradigm, where your application is divided as a set of components exchanging messages (think of it as a directed graph). FlowVR enables to encapsulate existing codes in components, interconnect them through data channels, and deploy them on distributed computing resources. FlowVR takes care of all the heavy lifting such as application deployment and message exchange.</p>
      <simplelist>
        <li id="uid33">
          <p noindent="true">Participants: Bruno Raffin, Clément Ménier, Emmanuel Melin, Jean Denis Lesage, Jérémie Allard, Jérémy Jaussaud, Matthieu Dreher, Sébastien Limet, Sophie Robert and Valérie Gourantou</p>
        </li>
        <li id="uid34">
          <p noindent="true">Contact: Bruno Raffin</p>
        </li>
        <li id="uid35">
          <p noindent="true">URL: <ref xlink:href="http://flowvr.sf.net" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>flowvr.<allowbreak/>sf.<allowbreak/>net</ref></p>
        </li>
      </simplelist>
    </subsection>
    <subsection id="uid36" level="1">
      <bodyTitle>OAR</bodyTitle>
      <p><span class="smallcap" align="left">Keywords:</span> HPC - Cloud - Clusters - Resource manager - Light grid</p>
      <p noindent="true"><span class="smallcap" align="left">Scientific Description:</span> This batch system is based on a database (PostgreSQL (preferred) or MySQL), a script language (Perl) and an optional scalable administrative tool (e.g. Taktuk). It is composed of modules which interact mainly via the database and are executed as independent programs. Therefore, formally, there is no API, the system interaction is completely defined by the database schema. This approach eases the development of specific modules. Indeed, each module (such as schedulers) may be developed in any language having a database access library.</p>
      <p noindent="true"><span class="smallcap" align="left">Functional Description:</span> OAR is a versatile resource and task manager (also called a batch scheduler) for HPC clusters, and other computing infrastructures (like distributed computing experimental testbeds where versatility is a key).</p>
      <simplelist>
        <li id="uid37">
          <p noindent="true">Participants: Bruno Bzeznik, Olivier Richard and Pierre Neyron</p>
        </li>
        <li id="uid38">
          <p noindent="true">Partners: LIG - CNRS - Grid'5000 - CIMENT</p>
        </li>
        <li id="uid39">
          <p noindent="true">Contact: Olivier Richard</p>
        </li>
        <li id="uid40">
          <p noindent="true">URL: <ref xlink:href="http://oar.imag.fr" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>oar.<allowbreak/>imag.<allowbreak/>fr</ref></p>
        </li>
      </simplelist>
    </subsection>
    <subsection id="uid41" level="1">
      <bodyTitle>MELISSA</bodyTitle>
      <p>
        <i>Modular External Library for In Situ Statistical Analysis</i>
      </p>
      <p noindent="true"><span class="smallcap" align="left">Keyword:</span> Sensitivity Analysis</p>
      <p noindent="true"><span class="smallcap" align="left">Functional Description:</span> Melissa is an in situ solution for sensitivity analysis. It implements iterative algorithms to compute spatio-temporal statistic fields over results of large scale sensitivity studies. Melissa relies on a client/server architecture, composed of three main modules:</p>
      <p>Melissa Server: an independent parallel executable. It receives data from the simulations, updates iterative statistics as soon as possible, then trow data away.
Melissa API: a shared library to be linked within the simulation code. It mainly transmit simulation data to Melissa Server at each timestep. The simulations of the sensitivity analysis become the clients of Melissa Server.
Melissa Launcher: A Python script in charge of generating and managing the whole global sensitivity analysis.</p>
      <simplelist>
        <li id="uid42">
          <p noindent="true">Authors: Théophile Terraz, Bruno Raffin, Alejandro Ribes and Bertrand Iooss</p>
        </li>
        <li id="uid43">
          <p noindent="true">Partner: Edf</p>
        </li>
        <li id="uid44">
          <p noindent="true">Contact: Bruno Raffin</p>
        </li>
        <li id="uid45">
          <p noindent="true">Publications: <ref xlink:href="https://hal.inria.fr/hal-01383860" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">In Situ Statistical Analysis for Parametric Studies</ref> -
<ref xlink:href="https://hal.inria.fr/hal-01607479" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">Melissa: Large Scale In Transit Sensitivity Analysis Avoiding Intermediate Files</ref></p>
        </li>
        <li id="uid46">
          <p noindent="true">URL: <ref xlink:href="https://melissa-sa.github.io" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>melissa-sa.<allowbreak/>github.<allowbreak/>io</ref></p>
        </li>
      </simplelist>
    </subsection>
    <subsection id="uid47" level="1">
      <bodyTitle>Platforms</bodyTitle>
      <subsection id="uid48" level="2">
        <bodyTitle>Grid'5000 (<ref xlink:href="https://www.grid5000.fr/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>www.<allowbreak/>grid5000.<allowbreak/>fr/</ref>) and Meso
Center Ciment (<ref xlink:href="https://ciment.ujf-grenoble.fr" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>ciment.<allowbreak/>ujf-grenoble.<allowbreak/>fr</ref>) </bodyTitle>
        <p>We have been very active in promoting the factorization of compute
resources at a regional and national level. We have a three level
implication, locally to maintain a pool of very flexible
experimental machines (hundreds of cores), regionally through the
CIMENT meso center (Equipex Grant), and nationally by contributing
to the Grid'5000 platform, our local resources being included in
this platform. Olivier Richard is member of Grid'5000 scientific
committee and Pierre Neyron is member of the technical committee.
The OAR scheduler in particular is deployed on both infrastructures.
We are currently preparing proposals for the next generation machines within the context of the new university association (Univ. Grenoble-Alpes).</p>
      </subsection>
    </subsection>
  </logiciels>
  <resultats id="uid49">
    <bodyTitle>New Results</bodyTitle>
    <subsection id="uid50" level="1">
      <bodyTitle>Integration of High Performance Computing and Data Analytics</bodyTitle>
      <subsection id="uid51" level="2">
        <bodyTitle>I/O Survey</bodyTitle>
        <p>First contribution is a comprehensive survey on parallel I/O in the HPC context <ref xlink:href="#datamove-2018-bid0" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. As the available processing power and amount of data increase, I/O remains a central issue for the scientific community. This survey focuses on a traditional I/O stack, with a POSIX parallel file system. Through the comprehensive study of publications from the most important conferences and journals in a five-year time window, we discuss the state of the art of I/O optimization approaches, access pattern extraction techniques, and performance modeling, in addition to general aspects of parallel I/O research. This survey enables us to identify the general characteristics of the field and the main current and future research topics.</p>
      </subsection>
      <subsection id="uid52" level="2">
        <bodyTitle>Task Based In Situ Processing</bodyTitle>
        <p>One approach to bypass the I/O bottleneck is <i>in situ</i> processing, an important research topic at DataMove.
The <i>in situ</i> paradigm proposes to reduce data movement and to analyze
data while still resident in the memory of the compute node by
co-locating simulation and analytics on the same compute node. The
simplest approach consists in modifying the simulation timeloop to
directly call analytics routines. However, several works have shown
that an <i>asynchronous</i> approach where analytics and simulation run
concurrently can lead to a significantly better performance. Today, the most
efficient approach consists in running the analytics processes on a
set of dedicated cores, called helper cores, to isolate them from
the simulation processes. Simulation and analytics thus run concurrently on different cores but this static isolation can lead to underused
resources if the simulation or the analytics do not fully use all
the assigned cores.</p>
        <p>In this work performed in collaboration with CEA, we developed TINS, a task-based in situ framework
that implements a novel <i>dynamic helper core</i> strategy. TINS relies on
a work stealing scheduler and on task-based programming. Simulation
and analytics tasks are created concurrently and scheduled on a set
of worker threads created by a single instance of the work stealing
scheduler. Helper cores are assigned dynamically: some worker
threads are dedicated to analytics when analytics tasks are
available while they join the other threads for processing simulation
tasks otherwise, leading to a better resource usage. We leverage
the good compositionality properties of task-based
programming to seamlessly keep the analytics and simulation codes
well separated and a plugin system enables to develop parallel
analytics codes outside of the simulation code.</p>
        <p>TINS is implemented with the Intel Threading Building Blocks (TBB)
library that provides a task-based programming model and a work
stealing scheduler. The experiments are conducted with the hybrid
MPI+TBB ExaStamp molecular dynamics code that we associate with a set of analytics representative of
computational physics algorithms. We show up to <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mn>40</mn><mo>%</mo></mrow></math></formula> performance
improvement over various other approaches, including the standard
helper core, on experiments on up to 14,336 Broadwell cores.</p>
      </subsection>
      <subsection id="uid53" level="2">
        <bodyTitle>Stream Processing</bodyTitle>
        <p>Stream processing is the Big Data equivalent of in situ processing. It consists in analyzing on-line incoming streams of data, often produced from
sensors or social networks like Twitter. We investigated the convergence between both paradigms through different directions: how the programming environment developed specifically for stream processing can applied to the data produced by large parallel simulations <ref xlink:href="#datamove-2018-bid1" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>; Proposing a dynamics data structure to keep sorted data streams <ref xlink:href="#datamove-2018-bid2" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>; Evaluating the performance of the FlameMR framework on data produced from a parallel simulation<ref xlink:href="#datamove-2018-bid3" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. We summarize here the 2 first contributions.</p>
        <subsection id="uid54" level="3">
          <bodyTitle>Packed Memory QuadTree.</bodyTitle>
          <p>Over the past years, several in-memory big-data management systems have appeared in academia and industry. In-memory databases systems avoid the overheads related to traditional I/O disk-based systems and have made possible to perform interactive data-analysis over large amounts of data. A vast literature of systems and research strategies deals with different aspects, such as the limited storage size and a multi-level memory-hierarchy of caches. Maintaining the right data layout that favors locality of accesses is a determinant factor for the performance of in-memory processing systems. Stream processing engines like Spark or Flink support the concept of <i>window</i>, which collects the latest events without a specific data organization. It is possible to trigger the analysis upon the occurrence of a given criterion (time, volume, specific event occurrence). After a window is updated, the system shifts the processing to the next batch of events. There is a need to go one step further to keep a live window continuously updated while having a fine grain data replacement policy to control the memory footprint. The challenge is the design of dynamic data structures to absorb high rate data streams, stash away the oldest data to stay in the allowed memory budget while enabling fast queries executions to update visual representations. A possible solution is the extension of database structures like R-trees used in SpatiaLite or PostGis, or to develop dedicated frameworks like Kit based on a pyramid structure.</p>
          <p>We developed a novel self-organized cache-oblivious data structure, called PMQ, for in-memory
storage and indexing of fixed length records tagged with a spatiotemporal index.
We store the data in an array with a controlled density of gaps (<i>i.e.</i>, empty slots) that benefits from the properties of the <i>Packed Memory Arrays</i>. The empty slots guarantee that insertions can be performed with a low amortized number of data movements (<formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mi>𝑂</mi><mo>(</mo><msup><mo form="prefix">log</mo><mn>2</mn></msup><mrow><mo>(</mo><mi>N</mi><mo>)</mo></mrow><mo>)</mo></mrow></math></formula>) while enabling efficient spatiotemporal queries. During insertions, we rebalance parts of the array when required to respect density constraints, and the oldest data is stashed away when reaching the memory budget. To spatially subdivide the data, we sort the records according to their Morton index, thus ensuring spatial locality in the array while defining an implicit, recursive quadtree, which leads to efficient spatiotemporal queries. We validate PMQ for consuming a stream of tweets to answer visual and range queries. PMQ significantly outperforms the widely adopted spatial indexing data structure R-tree, typically used by relational databases, as well as the conjunction of Geohash and B<sup>+</sup>-tree, typically used by NoSQL databases.</p>
        </subsection>
        <subsection id="uid55" level="3">
          <bodyTitle>Flink based in situ Processing.</bodyTitle>
          <p>We proposed to leverage Apache Flink, a scalable stream processing engine from the
Big Data domain, in this HPC context. Flink enables
to program analyses within a simple window based map/reduce model, while
the runtime takes care of the deployment, load balancing and fault tolerance.
We build a complete in transit analytics workflow, connecting an MD
simulation to Apache Flink and to a distributed database, Apache
HBase, to persist all the desired data. To demonstrate the
expressivity of this programming model and its suitability for HPC
scientific environments, two common analytics in the Molecular Dynamics field have
been implemented. We assessed the performance of this framework,
concluding that it can handle simulations of sizes used in the
literature while providing an effective and versatile tool for
scientists to easily incorporate on-line parallel analytics in their
current workflows.</p>
        </subsection>
      </subsection>
    </subsection>
    <subsection id="uid56" level="1">
      <bodyTitle>Data Aware Batch Scheduling</bodyTitle>
      <subsection id="uid57" level="2">
        <bodyTitle>Batch Scheduling for Energy</bodyTitle>
        <p>The project COSMIC <ref xlink:href="#datamove-2018-bid4" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, <ref xlink:href="#datamove-2018-bid5" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, <ref xlink:href="#datamove-2018-bid6" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, <ref xlink:href="#datamove-2018-bid7" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, in collaboration with Myriads team in Inria Rennes-Atlantique, targets the optimization of green energy usage in Clouds. The project considers
a geographically distributed cloud, with each data center associated with a
local photovoltaic (PV) farm. The objective is to maximize the photovoltaic energy by
allocation the computing workload to the data centers according to its energy production.
The production forecasting is modeled with a truncated normal law, permitting to
consider the uncertainty of the forecast.</p>
        <p>Chapter <ref xlink:href="#datamove-2018-bid4" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> considers a simple model with homogeneous Virtual Machines submitted at unpredictable rate. This study has resulted in a scheduling algorithm for task allocation. The chapter demonstrates the optimality of
this algorithm at current time slot according to production forecast parameters.</p>
        <p>Paper <ref xlink:href="#datamove-2018-bid5" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> extends these results to heterogeneous VM. Each VM is defined by its arrival date, its execution time, its memory requirement and
its CPU usage. In this model, due to execution time durations, the possibility to
migrate running VM was considered. An algorithm is detailed in the paper that is
compared to standard algorithm through simulations.</p>
        <p>A third study <ref xlink:href="#datamove-2018-bid6" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, <ref xlink:href="#datamove-2018-bid7" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> has carefully modeled
the interactions between the Cloud and the energy supplier. Due to variability of
PV production and workload submission, each data center will alternatively inject energy into the electricity grid or purchase energy. The energy model considers
a virtual energy pool mitigating the surplus and deficit of the different data center, with reduced costs regarding the difference between electricity cost and
electricity injection tariff. The algorithm detailed in this paper outperforms
well-known round-robin approaches, as shown by simulations.</p>
      </subsection>
      <subsection id="uid58" level="2">
        <bodyTitle>Learning Methods for Batch Scheduling</bodyTitle>
        <p>Most of Job Scheduling algorithms apply greedy tasks ordering, as First Come
First Served (FCFS) or Shortest Processing time First (SPF). They give simple
methods, highly practical with certain guarantees. They are however far from
optimal. Mixed methods, combining many of this basic methods permit to improve
their performance. DataMove has developed <ref xlink:href="#datamove-2018-bid8" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> a learning method permitting to
adapt the Mixed method to benchmarks. An extensive experimental campaign has permitted to determine the possibilities of basic and mixed methods according to the benchmarks characteristics, enhancing the efficiency of mixed methods.</p>
      </subsection>
      <subsection id="uid59" level="2">
        <bodyTitle>Reproducibility</bodyTitle>
        <p>Related to batch scheduling experimentation, DataMove has led investigations on reproducibility <ref xlink:href="#datamove-2018-bid9" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. Existing approaches focus on repeatability, but this is only the first step to reproducibility: Continuing a scientific work from a previous experiment requires to be able to modify it. This ability is called reproducibility with Variation. We show that capturing the environment of execution is necessary but not sufficient ; we also need the environment of development. The variation also implies that those environments are subject to evolution, so the whole software development lifecycle needs to be considered. To take into account these evolutions, software environments need to be clearly defined, reconstructible with variation, and easy to share. In this context, we propose new way of seeing reproducibility through the scientific software development lifecycle. Each step in this lifecycle requires a software environment. We define a software environment by a set of applications and libraries, with all their dependencies, and their configurations, required to achieve a step in a scientific workflow.</p>
      </subsection>
      <subsection id="uid60" level="2">
        <bodyTitle>Online Algorithms</bodyTitle>
        <p>Rob van Stee wrote a review of 2018 online algorithms including our recent contributions on
resource augmentation <footnote id="uid61" id-text="6">Rob van Stee. 2018. SIGACT News Online Algorithms Column 34: 2018 in review. SIGACT News 49, 4 (December 2018), 36-45.</footnote>
We quote him here:</p>
        <p>
          <i>Progress was also made on scheduling to minimize weighted flow time on unrelated machines. In ESA 2016, Giorgio Lucarelli et al. <ref xlink:href="#datamove-2018-bid10" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> had considered a version where the online algorithm can reject some <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><msub><mi>ε</mi><mi>r</mi></msub><mo>&gt;</mo><mn>0</mn></mrow></math></formula> fraction (by weight) of the jobs and have machines that are <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mn>1</mn><mo>+</mo><msub><mi>ε</mi><mi>s</mi></msub></mrow></math></formula> as fast as the offline machines, for some <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><msub><mi>ε</mi><mi>s</mi></msub><mo>&gt;</mo><mn>0</mn></mrow></math></formula>. They showed that this is already enough to achieve a competitive ratio of <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mi>O</mi><mo>(</mo><mn>1</mn><mo>/</mo><mrow><mo>(</mo><msub><mi>ε</mi><mi>s</mi></msub><msub><mi>ε</mi><mi>r</mi></msub><mo>)</mo></mrow><mo>)</mo></mrow></math></formula>.</i>
        </p>
        <p>
          <i>In SPAA 2018, Giorgio Lucarelli et al.<ref xlink:href="#datamove-2018-bid11" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> (a superset of the previous authors) showed that it is in fact sufficient to reject a <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mn>2</mn><mi>ε</mi></mrow></math></formula> fraction of the total number of jobs to achieve a competitive ratio of <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mn>2</mn><mo>(</mo><mfrac><mrow><mn>1</mn><mo>+</mo><mi>ε</mi></mrow><mi>ε</mi></mfrac><mo>)</mo></mrow></math></formula> for minimizing the total flow time. This algorithm sometimes rejects a job other than the one that has just arrived. The authors show that this is necessary, as otherwise there is a lower bound of <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mi>Ω</mi><mo>(</mo><mi>Δ</mi><mo>)</mo></mrow></math></formula> even on a single machine. Here <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>Δ</mi></math></formula> is the size ratio (the ratio of largest to smallest job size). (Obviously this lower bound also holds if you cannot reject jobs at all.)</i>
        </p>
        <p>
          <i>They also consider the speed scaling model, in which machines can be sped up if additional energy is invested, and the goal is to minimize the total weighted flow time plus energy usage. If the power function of machine <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>i</mi></math></formula> is given by <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mi>P</mi><mrow><mo>(</mo><msub><mi>s</mi><mi>i</mi></msub><mrow><mo>(</mo><mi>t</mi><mo>)</mo></mrow><mo>)</mo></mrow><mo>=</mo><msub><mi>s</mi><mi>i</mi></msub><msup><mrow><mo>(</mo><mi>t</mi><mo>)</mo></mrow><mi>α</mi></msup></mrow></math></formula>, where <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><msub><mi>s</mi><mi>i</mi></msub><mrow><mo>(</mo><mi>t</mi><mo>)</mo></mrow></mrow></math></formula> is the current speed of machine <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>i</mi></math></formula>, there is an algorithm which is <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mi>O</mi><mo>(</mo><msup><mrow><mo>(</mo><mn>1</mn><mo>+</mo><mn>1</mn><mo>/</mo><mi>ε</mi><mo>)</mo></mrow><mrow><mi>α</mi><mo>/</mo><mo>(</mo><mi>α</mi><mo>-</mo><mn>1</mn><mo>)</mo><mo>)</mo></mrow></msup></mrow></math></formula>-competitive that rejects jobs of total weight at most a fraction <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>ε</mi></math></formula> of the total weight of all the jobs. They also give a positive result for jobs with hard deadlines, where the goal is to minimize the total energy usage and no job may be rejected.</i>
        </p>
        <p>
          <i>In ESA 2018, the same set of authors <ref xlink:href="#datamove-2018-bid12" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> improved/generalized these results by showing that rejection alone is sufficient for an algorithm to be competitive even for weighted flow time. They presented an <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mi>O</mi><mo>(</mo><mn>1</mn><mo>/</mo><msup><mi>ε</mi><mn>3</mn></msup><mo>)</mo></mrow></math></formula>-competitive algorithm that rejects at most <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mi>O</mi><mo>(</mo><mi>ε</mi><mo>)</mo></mrow></math></formula> of the total weight of the jobs. In this algorithm, jobs are assigned (approximately) greedily to machines, and each machine runs the jobs assigned to it using Highest Density First. A job may be rejected if it is running while much heavier jobs arrive or if it is in the queue while very many jobs arrive. The second rule simulates the resource augmentation on the speed.
</i>
        </p>
      </subsection>
    </subsection>
  </resultats>
  <contrats id="uid62">
    <bodyTitle>Bilateral Contracts and Grants with Industry</bodyTitle>
    <subsection id="uid63" level="1">
      <bodyTitle>Bilateral Contracts with Industry</bodyTitle>
      <simplelist>
        <li id="uid64">
          <p noindent="true"><b>BULL-ATOS SE (2016-2019)</b>. Two PhD grants
(Michael Mercier and Adrien Faure). Job and resource management algorithms.</p>
        </li>
        <li id="uid65">
          <p noindent="true"><b>CEA DAM (2016-2018)</b>. PhD grant support contract (PhD of Estelle Dirand, funded by CEA). In situ analysis for Molecular Simulations.</p>
        </li>
      </simplelist>
    </subsection>
  </contrats>
  <partenariat id="uid66">
    <bodyTitle>Partnerships and Cooperations</bodyTitle>
    <subsection id="uid67" level="1">
      <bodyTitle>National Initiatives</bodyTitle>
      <subsection id="uid68" level="2">
        <bodyTitle>ANR</bodyTitle>
        <simplelist>
          <li id="uid69">
            <p noindent="true"><b>ANR grant GRECO (2017-2020).</b>
Resource manager for cloud of things. Coordinator: Quarnot Computing. Partners: Quarnot Computing, Grenoble-INP, Inria.</p>
          </li>
          <li id="uid70">
            <p noindent="true"><b>ANR grant Energumen (2018-2022).</b> Resource management: malleable jobs for a better use of the resources along with energy optimization. Coordinator: Denis Trystram. Partners: Grenoble-INP, IRIT, Sorbonne Université.</p>
          </li>
        </simplelist>
      </subsection>
      <subsection id="uid71" level="2">
        <bodyTitle>Competitivity Clusters</bodyTitle>
        <simplelist>
          <li id="uid72">
            <p noindent="true"><b>PIA Avido (2015-2018)</b>. In situ analysis and visualization
for large scale numerical simulation. Coordinator: EDF SA. Partners: EDF R&amp;D, Total SA,
Kitware SAS , Université Pierre et Marie CURIE, Inria (DataMove).</p>
          </li>
          <li id="uid73">
            <p noindent="true"><b>FUI OverMind (2015-2018)</b>. Task planification and asset
management for the cartoon productions. Coordinator: Teamto Studio.
Partners: Teamto Studio, Folimage Studio, Ecole de Gobelins, Inria
(DataMove).</p>
          </li>
          <li id="uid74">
            <p noindent="true"><b>FUI IDIOM (2018-2020)</b>. Monitoring and optimization of I/Os. Coordinator DDN Storage. Partners: DDN Storage, Criteo, Quarnot, QuasarDB, CEA, Université de Bretagne Occidentale, Telecom SudParis, Inria (DataMove).</p>
          </li>
        </simplelist>
      </subsection>
      <subsection id="uid75" level="2">
        <bodyTitle>Inria</bodyTitle>
        <simplelist>
          <li id="uid76">
            <p noindent="true">Inria PRE COSMIC (exploratory research project), 2017-2019. Photovoltaic Energy Management for Distributed Cloud Platforms. Myriads, DataMove.</p>
          </li>
          <li id="uid77">
            <p noindent="true">Inria IPL HPC-BigData, 2018-2021). Convergence between HPC, Big Data and AI. Coordinator: Bruno Raffin. Partners:
the Inria teams Zenith, Kerdata, Datamove, Tadaam, SequeL, Parietal, Tau, and the external partners ATOS, ANL, IBPC, ESI-Group. See <ref xlink:href="https://project.inria.fr/hpcbigdata/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>project.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hpcbigdata/</ref></p>
          </li>
        </simplelist>
      </subsection>
    </subsection>
    <subsection id="uid78" level="1">
      <bodyTitle>European Initiatives</bodyTitle>
      <subsection id="uid79" level="2">
        <bodyTitle>Collaborations in European Programs, Except FP7 &amp; H2020</bodyTitle>
        <sanspuceslist>
          <li id="uid80">
            <p noindent="true">Program: SKŁODOWSKA-CURIE ACTIONS - Individual Fellowship</p>
          </li>
          <li id="uid81">
            <p noindent="true">Project acronym: DAMA</p>
          </li>
          <li id="uid82">
            <p noindent="true">Project title: Extreme-Scale Data Management</p>
          </li>
          <li id="uid83">
            <p noindent="true">Duration: November 2018 - October 2020</p>
          </li>
          <li id="uid84">
            <p noindent="true">Coordinator: Bruno Raffin</p>
          </li>
          <li id="uid85">
            <p noindent="true">Followship Recipient: Francieli Zanon Boito.</p>
          </li>
          <li id="uid86">
            <p noindent="true">Abstract: This project is concerned with the I/O challenges that arise from the convergence between these two
different paradigms. It is clear data analytics tools cannot simply replace their typical storage solutions for the
HPC I/O stack, centered on the abstraction of files and powered by a parallel file system, because their workload
is not well suited for that and would observe poor performance. Moreover, the separated storage infrastructure
breaks the data affinity idea in which they are built upon. Finally, even among traditional HPC applications
there is a need to minimize data movement, as it imposes high latency and increases energy consumption.</p>
          </li>
        </sanspuceslist>
      </subsection>
    </subsection>
    <subsection id="uid87" level="1">
      <bodyTitle>International Initiatives</bodyTitle>
      <subsection id="uid88" level="2">
        <bodyTitle>Inria International Labs</bodyTitle>
        <subsection id="uid89" level="3">
          <bodyTitle>JLESC</bodyTitle>
          <sanspuceslist>
            <li id="uid90">
              <p noindent="true">Title: Joint Laboratory for Extreme-Scale-Computing.</p>
            </li>
            <li id="uid91">
              <p noindent="true">International Partners:</p>
              <sanspuceslist>
                <li id="uid92">
                  <p noindent="true">University of Illinois at Urbana Champaign (USA)</p>
                </li>
                <li id="uid93">
                  <p noindent="true">Argonne National Laboratory (USA),</p>
                </li>
                <li id="uid94">
                  <p noindent="true">Barcelona Supercomputing Center (Spain),</p>
                </li>
                <li id="uid95">
                  <p noindent="true">Jülich Supercomputing Centre (Germany)</p>
                </li>
                <li id="uid96">
                  <p noindent="true">Riken Advanced Institute for Computational Science (Japan)</p>
                </li>
              </sanspuceslist>
            </li>
            <li id="uid97">
              <p noindent="true">Start year: 2009</p>
            </li>
            <li id="uid98">
              <p noindent="true">See also: <ref xlink:href="https://jlesc.github.io/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>jlesc.<allowbreak/>github.<allowbreak/>io/</ref></p>
            </li>
            <li id="uid99">
              <p noindent="true">The purpose of the Joint Laboratory for Extreme Scale Computing is to be an international, virtual organization whose goal is to enhance the ability of member organizations and investigators to make the bridge between Petascale and Extreme computing. The JLESC organizes a workshop every 6 months DataMove participates to. DataMove developed several collaborations related to in situ processing with Tom Peterka group (ANL) , the Argo exascale operating system with Swann Perarnau (ANL).</p>
            </li>
          </sanspuceslist>
        </subsection>
      </subsection>
      <subsection id="uid100" level="2">
        <bodyTitle>Participation in Other International Programs</bodyTitle>
        <subsection id="uid101" level="3">
          <bodyTitle>LICIA</bodyTitle>
          <sanspuceslist>
            <li id="uid102">
              <p noindent="true">Title: International Laboratory in High Performance and Ubiquitous Computing</p>
            </li>
            <li id="uid103">
              <p noindent="true">International Partner (Institution - Laboratory - Researcher):</p>
              <sanspuceslist>
                <li id="uid104">
                  <p noindent="true">UFRGS (Brazil)</p>
                </li>
              </sanspuceslist>
            </li>
            <li id="uid105">
              <p noindent="true">Duration: 2011 - 2018</p>
            </li>
            <li id="uid106">
              <p noindent="true">See also: <ref xlink:href="http://licia-lab.org/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>licia-lab.<allowbreak/>org/</ref></p>
            </li>
            <li id="uid107">
              <p noindent="true">The LICIA is an Internacional Laboratory and High Performance
and Ubiquitous Computing born in 2011 from the common desire of
members of Informatics Institute of the Federal University of Rio
Grande do Sul and of Laboratoire d’Informatique de Grenoble to
enhance and develop their scientific parternship that started by
the end of the 1970. LICIA is an Internacional Associated Lab of
the CNRS, a public french research institution. It has support from
several brazilian and french research funding agencies, such as
CNRS, Inria, ANR, European Union (from the french side) and CAPES,
CNPq, FAPERGS (from the Brazilian side). DataMove is deeply involved
in the animation of LICIA. Bruno Raffin is LICIA associate director.</p>
            </li>
          </sanspuceslist>
        </subsection>
      </subsection>
    </subsection>
    <subsection id="uid108" level="1">
      <bodyTitle>International Research Visitors</bodyTitle>
      <subsection id="uid109" level="2">
        <bodyTitle>Visits of International Scientists</bodyTitle>
        <sanspuceslist>
          <li id="uid110">
            <p noindent="true">Professor visit: Alba Cristina Magalhaes Alves De Melo, Professor at University of Brasilia, visited the Datamove for one month in 2018.</p>
          </li>
          <li id="uid111">
            <p noindent="true">PhD in progress: Danilo Carastan Dos Santos, Dynamic Scheduling of Tasks in High Performance Platforms with Machine Learning (Sao Paulo, Brasil). 1 year "sandwich" visit. Local adviser: Denis Trystram</p>
          </li>
        </sanspuceslist>
      </subsection>
    </subsection>
  </partenariat>
  <diffusion id="uid112">
    <bodyTitle>Dissemination</bodyTitle>
    <subsection id="uid113" level="1">
      <bodyTitle>Promoting Scientific Activities</bodyTitle>
      <subsection id="uid114" level="2">
        <bodyTitle>Scientific Events Organisation</bodyTitle>
        <subsection id="uid115" level="3">
          <bodyTitle>General Chair, Scientific Chair</bodyTitle>
          <sanspuceslist>
            <li id="uid116">
              <p noindent="true">President of the steering committee of Edu-Europar.</p>
            </li>
            <li id="uid117">
              <p noindent="true">President of the steering committee of EGPGV (Eurographics Symposium on Parallel Graphics and Visualization).</p>
            </li>
            <li id="uid118">
              <p noindent="true">Member of the steering committee of Europar.</p>
            </li>
            <li id="uid119">
              <p noindent="true">Member of the steering committee of <i>Journée de visualisation scientifique</i>.</p>
            </li>
            <li id="uid120">
              <p noindent="true">Member of the steering committee of HeteroPar.</p>
            </li>
            <li id="uid121">
              <p noindent="true">Co-chair of the First HPML Workshop collocated with SBAC-PAD Lyon , October 2018.</p>
            </li>
          </sanspuceslist>
        </subsection>
        <subsection id="uid122" level="3">
          <bodyTitle>Member of the Organizing Committees</bodyTitle>
          <sanspuceslist>
            <li id="uid123">
              <p noindent="true">Euro-Par Advisory Board Member</p>
            </li>
          </sanspuceslist>
        </subsection>
      </subsection>
      <subsection id="uid124" level="2">
        <bodyTitle>Scientific Events Selection</bodyTitle>
        <subsection id="uid125" level="3">
          <bodyTitle>Member of the Conference Program Committees</bodyTitle>
          <sanspuceslist>
            <li id="uid126">
              <p noindent="true">ISAV 2018 (Workshop on In Situ Infrastructures for Enabling Extreme-scale Analysis and Visualization) , November, Dallas, USA</p>
            </li>
            <li id="uid127">
              <p noindent="true">EGPGV 2018 (Eurographics Symposium on Parallel Graphics and Visualization), June, Brno, Czech Republic.</p>
            </li>
            <li id="uid128">
              <p noindent="true">LADV 2018 (IEEE Symposium on Large Data Analysis and Visualization), October, Berlin, Germany.</p>
            </li>
            <li id="uid129">
              <p noindent="true">IPDPS 2018 (nternational Parallel and Distributed Processing Symposium ), May, Vancouver, Canada.</p>
            </li>
            <li id="uid130">
              <p noindent="true">LATIN, April 2018, Buenos Aires, Argentina.</p>
            </li>
            <li id="uid131">
              <p noindent="true">CCgrid 2018 (18th IEEE/ACM International Symposium on Cluster, Cloud and Grid
Computing), May, Washington DC.</p>
            </li>
            <li id="uid132">
              <p noindent="true">SPAA (30th ACM Symposium on Parallelism in Algorithms and Architecture), July 2018,
Vienna, Austria.</p>
            </li>
            <li id="uid133">
              <p noindent="true">ISPDC, June 2018, Geneva, Switzerland.</p>
            </li>
            <li id="uid134">
              <p noindent="true">CONPAS (Conference d'informatique en Parallelisme, Architecture et Systeme), July 2018, Toulouse, France.</p>
            </li>
            <li id="uid135">
              <p noindent="true">HiPC 2018 (IEEE internat. Conf on High Performance Computing, Data and Analytics), December 2018, Bengaluru, India.</p>
            </li>
            <li id="uid136">
              <p noindent="true">EURO 2018 (29th European Conference On Operational Research), July, Valencia.</p>
            </li>
          </sanspuceslist>
        </subsection>
      </subsection>
      <subsection id="uid137" level="2">
        <bodyTitle>Journal</bodyTitle>
        <subsection id="uid138" level="3">
          <bodyTitle>Member of the Editorial Boards</bodyTitle>
          <sanspuceslist>
            <li id="uid139">
              <p noindent="true">Associate Editor of the Parallel Computing journal PARCO.</p>
            </li>
            <li id="uid140">
              <p noindent="true">Member of the Editorial Board of Computational Methods in Science and Technology.</p>
            </li>
            <li id="uid141">
              <p noindent="true">Member of the Editorial Board of ARIMA (revue africaine de recherche en informatique et maths appliquées).</p>
            </li>
          </sanspuceslist>
        </subsection>
      </subsection>
      <subsection id="uid142" level="2">
        <bodyTitle>Scientific Expertise</bodyTitle>
        <sanspuceslist>
          <li id="uid143">
            <p noindent="true">ANR project evaluation expert</p>
          </li>
        </sanspuceslist>
      </subsection>
      <subsection id="uid144" level="2">
        <bodyTitle>Research Administration</bodyTitle>
        <sanspuceslist>
          <li id="uid145">
            <p noindent="true">Director of Pôle MSTIC of COMUE Univ. Grenoble-Alpes.</p>
          </li>
          <li id="uid146">
            <p noindent="true">Head of the international Master program ( MOSIG1 ) at Grenoble INP (ENSIMAG)</p>
          </li>
          <li id="uid147">
            <p noindent="true">Steering committee of Grid'5000</p>
          </li>
          <li id="uid148">
            <p noindent="true">Steering committee of GRICAD</p>
          </li>
        </sanspuceslist>
      </subsection>
    </subsection>
    <subsection id="uid149" level="1">
      <bodyTitle>Teaching - Supervision - Juries</bodyTitle>
      <subsection id="uid150" level="2">
        <bodyTitle>Teaching</bodyTitle>
        <sanspuceslist>
          <li id="uid151">
            <p noindent="true">Master: Denis Trystram is responsible of the first year (M1) of the international
Master of Science in Informatics at Grenoble (MOSIG-M1). 200 hours per year in average.</p>
          </li>
          <li id="uid152">
            <p noindent="true">Master: Fanny Dufossé. 30 hours per year. Combinatorial scientific computing in Master at ENS Lyon and Algorithmic in Licence at Grenoble INP.</p>
          </li>
          <li id="uid153">
            <p noindent="true">Master: Pierre-François Dutot. 226 hours per year. Licence (first
and second year) at IUT2/UPMF (Institut Universitaire Technologique
de Univ. Grenoble-Alpes) and 9 hours Master M2R-ISC
Informatique-Systèmes-Communication at Univ. Grenoble-Alpes.</p>
          </li>
          <li id="uid154">
            <p noindent="true">Master: Grégory Mounié. 242 hours per year. Master (M1/2nd year and M2/3rd year) at
Engineering school ENSIMAG, Grenoble-INP.</p>
          </li>
          <li id="uid155">
            <p noindent="true">Master: Bruno Raffin. 28 hours per year. Parallel System. International
Master of Science in Informatics at Grenoble (MOSIG-M2).</p>
          </li>
          <li id="uid156">
            <p noindent="true">Master: Olivier Richard is responsible of the third year of the computer science department of Grenoble INP. 222 hours per year. Master at
Engineering school Polytech-Grenoble, Univ. Grenoble-Alpes.</p>
          </li>
          <li id="uid157">
            <p noindent="true">Master: Frédéric Wagner. 220 hours per year. Engineering
school ENSIMAG, Grenoble-INP (M1/2nd year and M2/3rd year).</p>
          </li>
          <li id="uid158">
            <p noindent="true">Master: Yves Denneulin. 192 hours per year. Engineering
school ENSIMAG, Grenoble-INP (M1/2nd year and M2/3rd year).</p>
          </li>
        </sanspuceslist>
      </subsection>
      <subsection id="uid159" level="2">
        <bodyTitle>Supervision</bodyTitle>
        <sanspuceslist>
          <li id="uid160">
            <p noindent="true">PhD: Estelle Dirand, Integration of High-Performance Data Analytics and IOs for Molecular Dynamics on Exascale Computer, Univ. Grenoble-Alpes. November 2018. Bruno Raffin and Laurent Colombet (CEA).</p>
          </li>
          <li id="uid161">
            <p noindent="true">PhD: Valentin Reis, Learning to Control Large-Scale Parallel Platforms, Univ. Grenoble-Alpes. October 2018. Advisers: Denis Trystram and Eric Gaussier</p>
          </li>
          <li id="uid162">
            <p noindent="true">PhD in progress: Michael Mercier, Resource Management and Job Scheduling in HPC–Cloud environments towards the Big Data era, Univ. Grenoble Alpes. Started October 2016. Advisers: Olivier Richard and Bruno Raffin.</p>
          </li>
          <li id="uid163">
            <p noindent="true">PhD in progress: Alessandro Kraemer, Scheduling in the Cloud, Univ Grenoble-Alpes and UFPR (co-tutelle). Started October 2014. Advisers: Olivier Richard and Denis Trystram.</p>
          </li>
          <li id="uid164">
            <p noindent="true">PhD in progress: Mohammed Khatiri, Tasks scheduling on heterogeneous Multicore, Univ. Grenoble-Alpes and University Mohammed First (co-tutelle), Advisers: Denis Trystram, El Mostafa DAOUDI (University Mohammed First, Oujda, Morocco)</p>
          </li>
          <li id="uid165">
            <p noindent="true">PhD in progress: Adrien Faure, Scheduling with Resource Augmentation, Advisers: Denis Trystram</p>
          </li>
          <li id="uid166">
            <p noindent="true">PhD in progress: Clément Mommessin, Scheduling on heterogeneous platforms, Advisers: Denis Trystram</p>
          </li>
          <li id="uid167">
            <p noindent="true">PhD in progress: Loris Felardos, Deep Learning for the Analytics of Molecular Systems, Advisers: Bruno Raffin, Guillaume Charpiat (Inria team Tau), Jérome Hénin (IBPC).</p>
          </li>
          <li id="uid168">
            <p noindent="true">PhD in Progress: Salah Zrigui, Learning Scheduling Strategies, Advisers: Denis Trystram and Fanny Dufossé.</p>
          </li>
        </sanspuceslist>
      </subsection>
      <subsection id="uid169" level="2">
        <bodyTitle>Juries</bodyTitle>
        <sanspuceslist>
          <li id="uid170">
            <p noindent="true">PhD Defense of Jonathan Sarton, Visualisations interactives haute-performance de donnes volumiques massives : une approche out-of-core multi-resolution basee GPUs,
28 Novembre 2018, Université de Reims Champagne-Ardenne. Reviewer</p>
          </li>
          <li id="uid171">
            <p noindent="true">PhD Defense of Adrian Perez Dieguez, Parallel Prefix Operations on Heterogeneous Platforms,
December 2018, Universidad da Coruna. Reviewer.</p>
          </li>
          <li id="uid172">
            <p noindent="true">PhD Defense of Khalil Labidi,
Parallelisation of hybrid metaheuristics for COP solving, 20 septembre 2018, Université de Tunis et Université Paris-Dauphine. President</p>
          </li>
          <li id="uid173">
            <p noindent="true">PhD Defense of Stéphane Durand, Contrôle distribué et théorie des jeux : application aux
systèmes auto-optimisants, 13 décembre 2018, Univ Grenoble Alpes. President</p>
          </li>
          <li id="uid174">
            <p noindent="true">HDR Defense of Samuel Thibault, 13 décembre 2018, University Bordeaux I. Reviewer</p>
          </li>
        </sanspuceslist>
      </subsection>
    </subsection>
    <subsection id="uid175" level="1">
      <bodyTitle>Popularization</bodyTitle>
      <subsection id="uid176" level="2">
        <bodyTitle>Interventions</bodyTitle>
        <simplelist>
          <li id="uid177">
            <p noindent="true">Talk <i>Des besoins en calcul de plus en plus performant</i> for the conference cycle "Accompagnement de l'informatique au lycée en 2018".</p>
          </li>
        </simplelist>
      </subsection>
    </subsection>
  </diffusion>
  <biblio id="bibliography" html="bibliography" numero="10" titre="Bibliography">
    
    <biblStruct id="datamove-2018-bid10" type="inproceedings" rend="refer" n="refercite:lucarelli:hal-01334219">
      <identifiant type="doi" value="10.4230/LIPIcs.ESA.2016.63"/>
      <identifiant type="hal" value="hal-01334219"/>
      <analytic>
        <title level="a">Online Non-preemptive Scheduling in a Resource Augmentation Model based on Duality</title>
        <author>
          <persName key="datamove-2018-idp136512">
            <foreName>Giorgio</foreName>
            <surname>Lucarelli</surname>
            <initial>G.</initial>
          </persName>
          <persName>
            <foreName>Nguyen</foreName>
            <surname>Kim Thang</surname>
            <initial>N.</initial>
          </persName>
          <persName>
            <foreName>Abhinav</foreName>
            <surname>Srivastav</surname>
            <initial>A.</initial>
          </persName>
          <persName key="datamove-2018-idp131136">
            <foreName>Denis</foreName>
            <surname>Trystram</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">European Symposium on Algorithms (ESA 2016)</title>
        <loc>Aarhus, Denmark</loc>
        <imprint>
          <biblScope type="volume">57</biblScope>
          <biblScope type="number">63</biblScope>
          <dateStruct>
            <month>August</month>
            <year>2016</year>
          </dateStruct>
          <biblScope type="pages">1-17</biblScope>
          <ref xlink:href="http://hal.univ-grenoble-alpes.fr/hal-01334219" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>univ-grenoble-alpes.<allowbreak/>fr/<allowbreak/>hal-01334219</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid20" type="phdthesis" rend="year" n="cite:dirand:tel-01949170">
      <identifiant type="hal" value="tel-01949170"/>
      <monogr>
        <title level="m">Integration of High-Performance Task-Based In Situ for Molecular Dynamics on Exascale Computers</title>
        <author>
          <persName key="datamove-2018-idp143968">
            <foreName>Estelle</foreName>
            <surname>Dirand</surname>
            <initial>E.</initial>
          </persName>
        </author>
        <imprint>
          <publisher>
            <orgName type="school">Université Grenoble - Alpes</orgName>
          </publisher>
          <dateStruct>
            <month>November</month>
            <year>2018</year>
          </dateStruct>
          <ref xlink:href="https://hal.archives-ouvertes.fr/tel-01949170" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>archives-ouvertes.<allowbreak/>fr/<allowbreak/>tel-01949170</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Theses</note>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid28" type="phdthesis" rend="year" n="cite:reis:tel-01965150">
      <identifiant type="hal" value="tel-01965150"/>
      <monogr>
        <title level="m">Learning to control large-scale parallel platforms</title>
        <author>
          <persName key="datamove-2018-idp156192">
            <foreName>Valentin</foreName>
            <surname>Reis</surname>
            <initial>V.</initial>
          </persName>
        </author>
        <imprint>
          <publisher>
            <orgName type="school">Université Grenoble Alpes (France)</orgName>
          </publisher>
          <dateStruct>
            <month>September</month>
            <year>2018</year>
          </dateStruct>
          <ref xlink:href="https://hal.inria.fr/tel-01965150" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>tel-01965150</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Theses</note>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid14" type="article" rend="year" n="cite:amaris:hal-01896868">
      <identifiant type="doi" value="10.1002/cpe.4647"/>
      <identifiant type="hal" value="hal-01896868"/>
      <analytic>
        <title level="a">Generic Algorithms for Scheduling Applications on Heterogeneous Platforms</title>
        <author>
          <persName>
            <foreName>Marcos</foreName>
            <surname>Amaris</surname>
            <initial>M.</initial>
          </persName>
          <persName key="datamove-2018-idp136512">
            <foreName>Giorgio</foreName>
            <surname>Lucarelli</surname>
            <initial>G.</initial>
          </persName>
          <persName key="datamove-2018-idp153744">
            <foreName>Clément</foreName>
            <surname>Mommessin</surname>
            <initial>C.</initial>
          </persName>
          <persName key="datamove-2018-idp131136">
            <foreName>Denis</foreName>
            <surname>Trystram</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-editorial-board="yes" x-international-audience="yes" id="rid00435">
        <idno type="issn">1532-0626</idno>
        <title level="j">Concurrency and Computation: Practice and Experience</title>
        <imprint>
          <dateStruct>
            <month>July</month>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">1-29</biblScope>
          <ref xlink:href="https://hal.inria.fr/hal-01896868" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-01896868</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid24" type="article" rend="year" n="cite:bampis:hal-01725140">
      <identifiant type="doi" value="10.1007/s10951-016-0500-2"/>
      <identifiant type="hal" value="hal-01725140"/>
      <analytic>
        <title level="a">Energy Efficient Scheduling and Routing via Randomized Rounding</title>
        <author>
          <persName>
            <foreName>Evripidis</foreName>
            <surname>Bampis</surname>
            <initial>E.</initial>
          </persName>
          <persName>
            <foreName>Alexander</foreName>
            <surname>Kononov</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>Dimitrios</foreName>
            <surname>Letsios</surname>
            <initial>D.</initial>
          </persName>
          <persName key="datamove-2018-idp136512">
            <foreName>Giorgio</foreName>
            <surname>Lucarelli</surname>
            <initial>G.</initial>
          </persName>
          <persName>
            <foreName>Maxim</foreName>
            <surname>Sviridenko</surname>
            <initial>M.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-editorial-board="yes" x-international-audience="yes" id="rid01258">
        <idno type="issn">1094-6136</idno>
        <title level="j">Journal of Scheduling</title>
        <imprint>
          <biblScope type="volume">21</biblScope>
          <biblScope type="number">1</biblScope>
          <dateStruct>
            <month>February</month>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">35-51</biblScope>
          <ref xlink:href="https://hal.inria.fr/hal-01725140" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-01725140</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid27" type="article" rend="year" n="cite:blazewicz:hal-01963221">
      <identifiant type="doi" value="10.1007/s10951-018-0571-3"/>
      <identifiant type="hal" value="hal-01963221"/>
      <analytic>
        <title level="a">New challenges in scheduling theory</title>
        <author>
          <persName>
            <foreName>Jacek</foreName>
            <surname>Blazewicz</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Benjamin</foreName>
            <surname>Moseley</surname>
            <initial>B.</initial>
          </persName>
          <persName>
            <foreName>Erwin</foreName>
            <surname>Pesch</surname>
            <initial>E.</initial>
          </persName>
          <persName key="datamove-2018-idp131136">
            <foreName>Denis</foreName>
            <surname>Trystram</surname>
            <initial>D.</initial>
          </persName>
          <persName>
            <foreName>Guochuan</foreName>
            <surname>Zhang</surname>
            <initial>G.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-editorial-board="yes" x-international-audience="yes" id="rid01258">
        <idno type="issn">1094-6136</idno>
        <title level="j">Journal of Scheduling</title>
        <imprint>
          <biblScope type="volume">21</biblScope>
          <biblScope type="number">6</biblScope>
          <dateStruct>
            <month>December</month>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">581-582</biblScope>
          <ref xlink:href="https://hal.archives-ouvertes.fr/hal-01963221" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>archives-ouvertes.<allowbreak/>fr/<allowbreak/>hal-01963221</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid4" type="incollection" rend="year" n="cite:camus:hal-01945821">
      <identifiant type="hal" value="hal-01945821"/>
      <analytic>
        <title level="a">The SAGITTA approach for optimizing solar energy consumption in distributed clouds with stochastic modeling</title>
        <author>
          <persName key="myriads-2018-idp159264">
            <foreName>Benjamin</foreName>
            <surname>Camus</surname>
            <initial>B.</initial>
          </persName>
          <persName key="datamove-2018-idp115392">
            <foreName>Fanny</foreName>
            <surname>Dufossé</surname>
            <initial>F.</initial>
          </persName>
          <persName key="myriads-2018-idp140720">
            <foreName>Anne-Cécile</foreName>
            <surname>Orgerie</surname>
            <initial>A.-C.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no">
        <title level="m">Smart Cities, Green Technologies, and Intelligent Transport Systems</title>
        <imprint>
          <dateStruct>
            <month>December</month>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">1-25</biblScope>
          <ref xlink:href="https://hal.archives-ouvertes.fr/hal-01945821" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>archives-ouvertes.<allowbreak/>fr/<allowbreak/>hal-01945821</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid22" type="article" rend="year" n="cite:dufosse:hal-01586245">
      <identifiant type="doi" value="10.1016/j.laa.2018.05.017"/>
      <identifiant type="hal" value="hal-01586245"/>
      <analytic>
        <title level="a">Further notes on Birkhoff-von Neumann decomposition of doubly stochastic matrices</title>
        <author>
          <persName key="datamove-2018-idp115392">
            <foreName>Fanny</foreName>
            <surname>Dufossé</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Kamer</foreName>
            <surname>Kaya</surname>
            <initial>K.</initial>
          </persName>
          <persName key="roma-2018-idp159376">
            <foreName>Ioannis</foreName>
            <surname>Panagiotas</surname>
            <initial>I.</initial>
          </persName>
          <persName key="roma-2018-idp128816">
            <foreName>Bora</foreName>
            <surname>Uçar</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-editorial-board="yes" x-international-audience="yes" id="rid01353">
        <idno type="issn">0024-3795</idno>
        <title level="j">Linear Algebra and Applications</title>
        <imprint>
          <biblScope type="volume">554</biblScope>
          <dateStruct>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">68–78</biblScope>
          <ref xlink:href="https://hal.inria.fr/hal-01586245" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-01586245</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid26" type="article" rend="year" n="cite:gaussier:hal-01963216">
      <identifiant type="doi" value="10.1109/TPDS.2018.2820699"/>
      <identifiant type="hal" value="hal-01963216"/>
      <analytic>
        <title level="a">Online Tuning of EASY-Backfilling using Queue Reordering Policies</title>
        <author>
          <persName>
            <foreName>Éric</foreName>
            <surname>Gaussier</surname>
            <initial>É.</initial>
          </persName>
          <persName key="mathrisk-2018-idp195728">
            <foreName>Jerome</foreName>
            <surname>Lelong</surname>
            <initial>J.</initial>
          </persName>
          <persName key="datamove-2018-idp156192">
            <foreName>Valentin</foreName>
            <surname>Reis</surname>
            <initial>V.</initial>
          </persName>
          <persName key="datamove-2018-idp131136">
            <foreName>Denis</foreName>
            <surname>Trystram</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-editorial-board="yes" x-international-audience="yes" id="rid00746">
        <idno type="issn">1045-9219</idno>
        <title level="j">IEEE Transactions on Parallel and Distributed Systems</title>
        <imprint>
          <biblScope type="volume">29</biblScope>
          <biblScope type="number">10</biblScope>
          <dateStruct>
            <month>October</month>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">2304-2316</biblScope>
          <ref xlink:href="https://hal.archives-ouvertes.fr/hal-01963216" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>archives-ouvertes.<allowbreak/>fr/<allowbreak/>hal-01963216</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid18" type="article" rend="year" n="cite:jourdan:hal-01716581">
      <identifiant type="doi" value="10.1007/s11590-018-1237-y"/>
      <identifiant type="hal" value="hal-01716581"/>
      <analytic>
        <title level="a">An exact algorithm for the bi-objective timing problem</title>
        <author>
          <persName>
            <foreName>Laetitia</foreName>
            <surname>Jourdan</surname>
            <initial>L.</initial>
          </persName>
          <persName>
            <foreName>Sophie</foreName>
            <surname>Jacquin</surname>
            <initial>S.</initial>
          </persName>
          <persName key="datamove-2018-idp115392">
            <foreName>Fanny</foreName>
            <surname>Dufossé</surname>
            <initial>F.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-editorial-board="yes" x-international-audience="yes" id="rid02255">
        <idno type="issn">1862-4472</idno>
        <title level="j">Optimization Letters</title>
        <imprint>
          <biblScope type="volume">12</biblScope>
          <biblScope type="number">4</biblScope>
          <dateStruct>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">903–914</biblScope>
          <ref xlink:href="https://hal.archives-ouvertes.fr/hal-01716581" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>archives-ouvertes.<allowbreak/>fr/<allowbreak/>hal-01716581</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid25" type="article" rend="year" n="cite:kedadsidhoum:hal-01516700">
      <identifiant type="doi" value="10.1142/S012905411850003X"/>
      <identifiant type="hal" value="hal-01516700"/>
      <analytic>
        <title level="a">A Family of Scheduling Algorithms for Hybrid Parallel Platforms</title>
        <author>
          <persName>
            <foreName>Safia</foreName>
            <surname>Kedad-Sidhoum</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Florence</foreName>
            <surname>Monna</surname>
            <initial>F.</initial>
          </persName>
          <persName key="datamove-2018-idp126144">
            <foreName>Grégory</foreName>
            <surname>Mounié</surname>
            <initial>G.</initial>
          </persName>
          <persName key="datamove-2018-idp131136">
            <foreName>Denis</foreName>
            <surname>Trystram</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-editorial-board="yes" x-international-audience="yes" id="rid00906">
        <idno type="issn">0129-0541</idno>
        <title level="j">International Journal of Foundations of Computer Science</title>
        <imprint>
          <biblScope type="volume">29</biblScope>
          <biblScope type="number">1</biblScope>
          <dateStruct>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">63-90</biblScope>
          <ref xlink:href="https://hal.sorbonne-universite.fr/hal-01516700" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>sorbonne-universite.<allowbreak/>fr/<allowbreak/>hal-01516700</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid12" type="article" rend="year" n="cite:lucarelli:hal-01986352">
      <identifiant type="doi" value="10.4230/LIPIcs.ESA.2018.59"/>
      <identifiant type="hal" value="hal-01986352"/>
      <analytic>
        <title level="a">Online Non-Preemptive Scheduling to Minimize Weighted Flow-time on Unrelated Machines</title>
        <author>
          <persName key="datamove-2018-idp136512">
            <foreName>Giorgio</foreName>
            <surname>Lucarelli</surname>
            <initial>G.</initial>
          </persName>
          <persName>
            <foreName>Benjamin</foreName>
            <surname>Moseley</surname>
            <initial>B.</initial>
          </persName>
          <persName>
            <foreName>Nguyen Kim</foreName>
            <surname>Thang</surname>
            <initial>N. K.</initial>
          </persName>
          <persName>
            <foreName>Abhinav</foreName>
            <surname>Srivastav</surname>
            <initial>A.</initial>
          </persName>
          <persName key="datamove-2018-idp131136">
            <foreName>Denis</foreName>
            <surname>Trystram</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-editorial-board="yes" x-international-audience="yes" id="rid02734">
        <idno type="issn">1868-8969</idno>
        <title level="j">Leibniz International Proceedings in Informatics </title>
        <imprint>
          <biblScope type="volume">112</biblScope>
          <dateStruct>
            <year>2018</year>
          </dateStruct>
          <ref xlink:href="https://hal.archives-ouvertes.fr/hal-01986352" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>archives-ouvertes.<allowbreak/>fr/<allowbreak/>hal-01986352</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid2" type="article" rend="year" n="cite:toss:hal-01876579">
      <identifiant type="doi" value="10.1016/j.cag.2018.09.005"/>
      <identifiant type="hal" value="hal-01876579"/>
      <analytic>
        <title level="a">Packed-Memory Quadtree: a cache-oblivious data structure for visual exploration of streaming spatiotemporal big data</title>
        <author>
          <persName>
            <foreName>Julio</foreName>
            <surname>Toss</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Cicero A. L.</foreName>
            <surname>Pahins</surname>
            <initial>C. A. L.</initial>
          </persName>
          <persName key="datamove-2018-idp117856">
            <foreName>Bruno</foreName>
            <surname>Raffin</surname>
            <initial>B.</initial>
          </persName>
          <persName>
            <foreName>João Luiz Dihl</foreName>
            <surname>Comba</surname>
            <initial>J. L. D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-editorial-board="yes" x-international-audience="yes" id="rid00410">
        <idno type="issn">0097-8493</idno>
        <title level="j">Computers and Graphics</title>
        <imprint>
          <biblScope type="volume">76</biblScope>
          <dateStruct>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">117-128</biblScope>
          <ref xlink:href="https://hal.archives-ouvertes.fr/hal-01876579" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>archives-ouvertes.<allowbreak/>fr/<allowbreak/>hal-01876579</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid3" type="article" rend="year" n="cite:exposito:hal-01955503">
      <identifiant type="doi" value="10.1109/ACCESS.2018.2880842"/>
      <identifiant type="hal" value="hal-01955503"/>
      <analytic>
        <title level="a">Optimization of Real-World MapReduce Applications With Flame-MR: Practical Use Cases</title>
        <author>
          <persName>
            <foreName>Jorge</foreName>
            <surname>Veiga</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Roberto R.</foreName>
            <surname>Expósito</surname>
            <initial>R. R.</initial>
          </persName>
          <persName key="datamove-2018-idp117856">
            <foreName>Bruno</foreName>
            <surname>Raffin</surname>
            <initial>B.</initial>
          </persName>
          <persName>
            <foreName>Juan</foreName>
            <surname>Tourino</surname>
            <initial>J.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-editorial-board="yes" x-international-audience="yes" id="rid02813">
        <idno type="issn">2169-3536</idno>
        <title level="j">IEEE Access</title>
        <imprint>
          <biblScope type="volume">6</biblScope>
          <dateStruct>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">69750-69762</biblScope>
          <ref xlink:href="https://hal.inria.fr/hal-01955503" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-01955503</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid0" type="article" rend="year" n="cite:zanonboito:hal-01591755">
      <identifiant type="doi" value="10.1145/3152891"/>
      <identifiant type="hal" value="hal-01591755"/>
      <analytic>
        <title level="a">A Checkpoint of Research on Parallel I/O for High Performance Computing</title>
        <author>
          <persName key="datamove-2018-idp139024">
            <foreName>Francieli</foreName>
            <surname>Zanon Boito</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Eduardo</foreName>
            <surname>Camilo Inacio</surname>
            <initial>E.</initial>
          </persName>
          <persName>
            <foreName>Jean</foreName>
            <surname>Luca Bez</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Philippe O A</foreName>
            <surname>Navaux</surname>
            <initial>P. O. A.</initial>
          </persName>
          <persName>
            <foreName>Mario A R</foreName>
            <surname>Dantas</surname>
            <initial>M. A. R.</initial>
          </persName>
          <persName key="datamove-2018-idp120768">
            <foreName>Yves</foreName>
            <surname>Denneulin</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-editorial-board="yes" x-international-audience="yes" id="rid00004">
        <idno type="issn">0360-0300</idno>
        <title level="j">ACM Computing Surveys</title>
        <imprint>
          <biblScope type="volume">51</biblScope>
          <biblScope type="number">2</biblScope>
          <dateStruct>
            <month>March</month>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">23:1-23:35</biblScope>
          <ref xlink:href="http://hal.univ-grenoble-alpes.fr/hal-01591755" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>univ-grenoble-alpes.<allowbreak/>fr/<allowbreak/>hal-01591755</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid16" type="inproceedings" rend="year" n="cite:bleuse:hal-01884542">
      <identifiant type="doi" value="10.1007/978-3-319-96983-1_15"/>
      <identifiant type="hal" value="hal-01884542"/>
      <analytic>
        <title level="a">Interference-Aware Scheduling using Geometric Constraints</title>
        <author>
          <persName>
            <foreName>Raphaël</foreName>
            <surname>Bleuse</surname>
            <initial>R.</initial>
          </persName>
          <persName key="datamove-2018-idp180864">
            <foreName>Konstantinos</foreName>
            <surname>Dogeas</surname>
            <initial>K.</initial>
          </persName>
          <persName key="datamove-2018-idp136512">
            <foreName>Giorgio</foreName>
            <surname>Lucarelli</surname>
            <initial>G.</initial>
          </persName>
          <persName key="datamove-2018-idp126144">
            <foreName>Grégory</foreName>
            <surname>Mounié</surname>
            <initial>G.</initial>
          </persName>
          <persName key="datamove-2018-idp131136">
            <foreName>Denis</foreName>
            <surname>Trystram</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-international-audience="yes" x-proceedings="yes" x-invited-conference="no" x-editorial-board="yes">
        <title level="m">Euro-Par 2018 - European Conference on Parallel Processing</title>
        <loc>Torino, Italy</loc>
        <title level="s">Euro-Par 2018: Parallel Processing</title>
        <imprint>
          <biblScope type="volume">LNCS 11014</biblScope>
          <publisher>
            <orgName>Springer</orgName>
          </publisher>
          <dateStruct>
            <month>August</month>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">205-217</biblScope>
          <ref xlink:href="http://hal.univ-grenoble-alpes.fr/hal-01884542" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>univ-grenoble-alpes.<allowbreak/>fr/<allowbreak/>hal-01884542</ref>
        </imprint>
        <meeting id="cid306382">
          <title>International Euro-Par Conference on Parallel Processing</title>
          <num>24</num>
          <abbr type="sigle">Euro-Par</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid5" type="inproceedings" rend="year" n="cite:camus:hal-01856665">
      <identifiant type="hal" value="hal-01856665"/>
      <analytic>
        <title level="a">Harnessing the geographical flexibility of distributed computing clouds for cooperative self-consumption</title>
        <author>
          <persName key="myriads-2018-idp159264">
            <foreName>Benjamin</foreName>
            <surname>Camus</surname>
            <initial>B.</initial>
          </persName>
          <persName key="myriads-2018-idp235456">
            <foreName>Anne</foreName>
            <surname>Blavette</surname>
            <initial>A.</initial>
          </persName>
          <persName key="datamove-2018-idp115392">
            <foreName>Fanny</foreName>
            <surname>Dufossé</surname>
            <initial>F.</initial>
          </persName>
          <persName key="myriads-2018-idp140720">
            <foreName>Anne-Cécile</foreName>
            <surname>Orgerie</surname>
            <initial>A.-C.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-international-audience="yes" x-proceedings="no" x-invited-conference="no" x-editorial-board="yes">
        <title level="m">ISGT-Europe 2018 - 8th IEEE PES Innovative Smart Grid Technologies Conference Europe</title>
        <loc>Sarajevo, Bosnia and Herzegovina</loc>
        <imprint>
          <dateStruct>
            <month>October</month>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">1-6</biblScope>
          <ref xlink:href="https://hal.archives-ouvertes.fr/hal-01856665" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>archives-ouvertes.<allowbreak/>fr/<allowbreak/>hal-01856665</ref>
        </imprint>
        <meeting id="cid625805">
          <title>IEEE International Conference on Innovative Smart Grid Technologies</title>
          <num>8</num>
          <abbr type="sigle">ISGT</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid6" type="inproceedings" rend="year" n="cite:camus:hal-01856660">
      <identifiant type="hal" value="hal-01856660"/>
      <analytic>
        <title level="a">Self-Consumption Optimization of Renewable Energy Production in Distributed Clouds</title>
        <author>
          <persName key="myriads-2018-idp159264">
            <foreName>Benjamin</foreName>
            <surname>Camus</surname>
            <initial>B.</initial>
          </persName>
          <persName key="myriads-2018-idp235456">
            <foreName>Anne</foreName>
            <surname>Blavette</surname>
            <initial>A.</initial>
          </persName>
          <persName key="datamove-2018-idp115392">
            <foreName>Fanny</foreName>
            <surname>Dufossé</surname>
            <initial>F.</initial>
          </persName>
          <persName key="myriads-2018-idp140720">
            <foreName>Anne-Cécile</foreName>
            <surname>Orgerie</surname>
            <initial>A.-C.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-international-audience="yes" x-proceedings="yes" x-invited-conference="no" x-editorial-board="yes">
        <title level="m">Cluster 2018 - IEEE International Conference on Cluster Computing</title>
        <loc>Belfast, United Kingdom</loc>
        <imprint>
          <publisher>
            <orgName>IEEE</orgName>
          </publisher>
          <dateStruct>
            <month>September</month>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">1-11</biblScope>
          <ref xlink:href="https://hal.archives-ouvertes.fr/hal-01856660" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>archives-ouvertes.<allowbreak/>fr/<allowbreak/>hal-01856660</ref>
        </imprint>
        <meeting id="cid81665">
          <title>IEEE International Conference on Cluster Computing</title>
          <num>2018</num>
          <abbr type="sigle">Cluster</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid7" type="inproceedings" rend="year" n="cite:camus:hal-01856657">
      <identifiant type="hal" value="hal-01856657"/>
      <analytic>
        <title level="a">Network-aware energy-efficient virtual machine management in distributed Cloud infrastructures with on-site photovoltaic production</title>
        <author>
          <persName key="myriads-2018-idp159264">
            <foreName>Benjamin</foreName>
            <surname>Camus</surname>
            <initial>B.</initial>
          </persName>
          <persName key="datamove-2018-idp115392">
            <foreName>Fanny</foreName>
            <surname>Dufossé</surname>
            <initial>F.</initial>
          </persName>
          <persName key="myriads-2018-idp235456">
            <foreName>Anne</foreName>
            <surname>Blavette</surname>
            <initial>A.</initial>
          </persName>
          <persName key="myriads-2018-idp148528">
            <foreName>Martin</foreName>
            <surname>Quinson</surname>
            <initial>M.</initial>
          </persName>
          <persName key="myriads-2018-idp140720">
            <foreName>Anne-Cécile</foreName>
            <surname>Orgerie</surname>
            <initial>A.-C.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-international-audience="yes" x-proceedings="yes" x-invited-conference="no" x-editorial-board="yes">
        <title level="m">SBAC-PAD 2018 - International Symposium on Computer Architecture and High Performance Computing</title>
        <loc>Lyon, France</loc>
        <imprint>
          <dateStruct>
            <month>September</month>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">1-8</biblScope>
          <ref xlink:href="https://hal.archives-ouvertes.fr/hal-01856657" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>archives-ouvertes.<allowbreak/>fr/<allowbreak/>hal-01856657</ref>
        </imprint>
        <meeting id="cid313009">
          <title>International Symposium on Computer Architecture and High Performance Computing</title>
          <num>30</num>
          <abbr type="sigle">SBAC-PAD</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid1" type="inproceedings" rend="year" n="cite:dirand:hal-01730910">
      <identifiant type="doi" value="10.1007/978-3-319-69953-0_10"/>
      <identifiant type="hal" value="hal-01730910"/>
      <analytic>
        <title level="a">TINS: A Task-Based Dynamic Helper Core Strategy for In Situ Analytics</title>
        <author>
          <persName key="datamove-2018-idp143968">
            <foreName>Estelle</foreName>
            <surname>Dirand</surname>
            <initial>E.</initial>
          </persName>
          <persName>
            <foreName>Laurent</foreName>
            <surname>Colombet</surname>
            <initial>L.</initial>
          </persName>
          <persName key="datamove-2018-idp117856">
            <foreName>Bruno</foreName>
            <surname>Raffin</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-international-audience="yes" x-proceedings="yes" x-invited-conference="no" x-editorial-board="yes">
        <title level="m">SCA18 - Supercomputing Frontiers Asia 2018</title>
        <loc>Singapore, Singapore</loc>
        <imprint>
          <dateStruct>
            <month>March</month>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">159-178</biblScope>
          <ref xlink:href="https://hal.inria.fr/hal-01730910" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-01730910</ref>
        </imprint>
        <meeting id="cid626013">
          <title>Supercomputing Asia</title>
          <num>2018</num>
          <abbr type="sigle">SCA</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid15" type="inproceedings" rend="year" n="cite:dufosse:hal-01740403">
      <identifiant type="doi" value="10.1137/1.9781611975215.6"/>
      <identifiant type="hal" value="hal-01740403"/>
      <analytic>
        <title level="a">Approximation algorithms for maximum matchings in undirected graphs</title>
        <author>
          <persName key="datamove-2018-idp115392">
            <foreName>Fanny</foreName>
            <surname>Dufossé</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Kamer</foreName>
            <surname>Kaya</surname>
            <initial>K.</initial>
          </persName>
          <persName key="roma-2018-idp159376">
            <foreName>Ioannis</foreName>
            <surname>Panagiotas</surname>
            <initial>I.</initial>
          </persName>
          <persName key="roma-2018-idp128816">
            <foreName>Bora</foreName>
            <surname>Uçar</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-international-audience="yes" x-proceedings="yes" x-invited-conference="no" x-editorial-board="yes">
        <title level="m">CSC 2018 - SIAM Workshop on Combinatorial Scientific Computing</title>
        <loc>Bergen, Norway</loc>
        <title level="s">Proceedings of the Seventh SIAM Workshop on Combinatorial Scientific Computing</title>
        <imprint>
          <publisher>
            <orgName>SIAM</orgName>
          </publisher>
          <dateStruct>
            <month>June</month>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">56-65</biblScope>
          <ref xlink:href="https://hal.archives-ouvertes.fr/hal-01740403" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>archives-ouvertes.<allowbreak/>fr/<allowbreak/>hal-01740403</ref>
        </imprint>
        <meeting id="cid361657">
          <title>SIAM Workshop on Combinatorial Scientific Computing</title>
          <num>2018</num>
          <abbr type="sigle">CSC</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid11" type="inproceedings" rend="year" n="cite:lucarelli:hal-01986312">
      <identifiant type="doi" value="10.1145/3210377.3210402"/>
      <identifiant type="hal" value="hal-01986312"/>
      <analytic>
        <title level="a">Online Non-preemptive Scheduling on Unrelated Machines with Rejections</title>
        <author>
          <persName key="datamove-2018-idp136512">
            <foreName>Giorgio</foreName>
            <surname>Lucarelli</surname>
            <initial>G.</initial>
          </persName>
          <persName>
            <foreName>Benjamin</foreName>
            <surname>Moseley</surname>
            <initial>B.</initial>
          </persName>
          <persName>
            <foreName>Nguyen Kim</foreName>
            <surname>Thang</surname>
            <initial>N. K.</initial>
          </persName>
          <persName>
            <foreName>Abhinav</foreName>
            <surname>Srivastav</surname>
            <initial>A.</initial>
          </persName>
          <persName key="datamove-2018-idp131136">
            <foreName>Denis</foreName>
            <surname>Trystram</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-international-audience="yes" x-proceedings="yes" x-invited-conference="no" x-editorial-board="yes">
        <title level="m">Proceedings of the 30th on Symposium on Parallelism in Algorithms and Architectures</title>
        <loc>Vienna, Austria</loc>
        <imprint>
          <publisher>
            <orgName>ACM Press</orgName>
          </publisher>
          <dateStruct>
            <month>July</month>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">291-300</biblScope>
          <ref xlink:href="https://hal.archives-ouvertes.fr/hal-01986312" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>archives-ouvertes.<allowbreak/>fr/<allowbreak/>hal-01986312</ref>
        </imprint>
        <meeting id="cid24479">
          <title>ACM Symposium on Parallelism in Algorithms and Architectures</title>
          <num>30</num>
          <abbr type="sigle">SPAA</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid9" type="inproceedings" rend="year" n="cite:mercier:hal-01891084">
      <identifiant type="hal" value="hal-01891084"/>
      <analytic>
        <title level="a">Considering the Development Workflow to Achieve Reproducibility with Variation</title>
        <author>
          <persName key="datamove-2018-idp151296">
            <foreName>Michael</foreName>
            <surname>Mercier</surname>
            <initial>M.</initial>
          </persName>
          <persName key="datamove-2018-idp146400">
            <foreName>Adrien</foreName>
            <surname>Faure</surname>
            <initial>A.</initial>
          </persName>
          <persName key="datamove-2018-idp128640">
            <foreName>Olivier</foreName>
            <surname>Richard</surname>
            <initial>O.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-international-audience="yes" x-proceedings="no" x-invited-conference="no" x-editorial-board="yes">
        <title level="m">SC 2018 - Workshop: ResCuE-HPC</title>
        <loc>Dallas, United States</loc>
        <imprint>
          <dateStruct>
            <month>November</month>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">1-5</biblScope>
          <ref xlink:href="https://hal.inria.fr/hal-01891084" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-01891084</ref>
        </imprint>
        <meeting id="cid626014">
          <title>Workshop on Reproducible, Customizable and Portable Workflows for HPC</title>
          <num>1</num>
          <abbr type="sigle">ResCuE-HPC</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid13" type="inproceedings" rend="year" n="cite:zanuz:hal-01889939">
      <identifiant type="hal" value="hal-01889939"/>
      <analytic>
        <title level="a">In-Transit Molecular Dynamics Analysis with Apache Flink</title>
        <author>
          <persName>
            <foreName>Henrique C</foreName>
            <surname>Zanúz</surname>
            <initial>H. C.</initial>
          </persName>
          <persName key="datamove-2018-idp117856">
            <foreName>Bruno</foreName>
            <surname>Raffin</surname>
            <initial>B.</initial>
          </persName>
          <persName>
            <foreName>Omar A</foreName>
            <surname>Mures</surname>
            <initial>O. A.</initial>
          </persName>
          <persName>
            <foreName>Emilio J</foreName>
            <surname>Padrón</surname>
            <initial>E. J.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-international-audience="yes" x-proceedings="yes" x-invited-conference="no" x-editorial-board="yes">
        <title level="m">ISAV 2018 - In Situ Infrastructures for Enabling Extreme-scale Analysis and Visualization</title>
        <loc>DALLAS, United States</loc>
        <imprint>
          <dateStruct>
            <month>November</month>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">1-8</biblScope>
          <ref xlink:href="https://hal.inria.fr/hal-01889939" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-01889939</ref>
        </imprint>
        <meeting id="cid624921">
          <title>Workshop on In Situ Infrastructures for Enabling Extreme-Scale Analysis and Visualization</title>
          <num>2018</num>
          <abbr type="sigle"/>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid21" type="techreport" rend="year" n="cite:dufosse:hal-01924180">
      <identifiant type="hal" value="hal-01924180"/>
      <monogr>
        <title level="m">Effective heuristics for matchings in hypergraphs</title>
        <author>
          <persName key="datamove-2018-idp115392">
            <foreName>Fanny</foreName>
            <surname>Dufossé</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Kamer</foreName>
            <surname>Kaya</surname>
            <initial>K.</initial>
          </persName>
          <persName key="roma-2018-idp159376">
            <foreName>Ioannis</foreName>
            <surname>Panagiotas</surname>
            <initial>I.</initial>
          </persName>
          <persName key="roma-2018-idp128816">
            <foreName>Bora</foreName>
            <surname>Uçar</surname>
            <initial>B.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-9224</biblScope>
          <publisher>
            <orgName type="institution">Inria Grenoble Rhône-Alpes</orgName>
          </publisher>
          <dateStruct>
            <month>November</month>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">1-18</biblScope>
          <ref xlink:href="https://hal.archives-ouvertes.fr/hal-01924180" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>archives-ouvertes.<allowbreak/>fr/<allowbreak/>hal-01924180</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid23" type="techreport" rend="year" n="cite:dufosse:hal-01743802">
      <identifiant type="hal" value="hal-01743802"/>
      <monogr>
        <title level="m">Scaling matrices and counting the perfect matchings in graphs</title>
        <author>
          <persName key="datamove-2018-idp115392">
            <foreName>Fanny</foreName>
            <surname>Dufossé</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Kamer</foreName>
            <surname>Kaya</surname>
            <initial>K.</initial>
          </persName>
          <persName key="roma-2018-idp159376">
            <foreName>Ioannis</foreName>
            <surname>Panagiotas</surname>
            <initial>I.</initial>
          </persName>
          <persName key="roma-2018-idp128816">
            <foreName>Bora</foreName>
            <surname>Uçar</surname>
            <initial>B.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-9161</biblScope>
          <publisher>
            <orgName type="institution">Inria Grenoble Rhône-Alpes</orgName>
          </publisher>
          <dateStruct>
            <month>March</month>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">1-22</biblScope>
          <ref xlink:href="https://hal.inria.fr/hal-01743802" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-01743802</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid8" type="techreport" rend="year" n="cite:legrand:hal-01896121">
      <identifiant type="hal" value="hal-01896121"/>
      <monogr>
        <title level="m">Adapting Batch Scheduling to Workload Characteristics: What can we expect From Online Learning?</title>
        <author>
          <persName key="polaris-2018-idp120992">
            <foreName>Arnaud</foreName>
            <surname>Legrand</surname>
            <initial>A.</initial>
          </persName>
          <persName key="datamove-2018-idp131136">
            <foreName>Denis</foreName>
            <surname>Trystram</surname>
            <initial>D.</initial>
          </persName>
          <persName key="datamove-2018-idp158656">
            <foreName>Salah</foreName>
            <surname>Zrigui</surname>
            <initial>S.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-9212</biblScope>
          <publisher>
            <orgName type="institution">Grenoble 1 UGA - Université Grenoble Alpe</orgName>
          </publisher>
          <dateStruct>
            <month>October</month>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">1-23</biblScope>
          <ref xlink:href="https://hal.inria.fr/hal-01896121" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-01896121</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid19" type="unpublished" rend="year" n="cite:faure:hal-01779936">
      <identifiant type="hal" value="hal-01779936"/>
      <monogr>
        <title level="m">Évaluation d'algorithmes d'ordonnancement par simulation réaliste</title>
        <author>
          <persName key="datamove-2018-idp146400">
            <foreName>Adrien</foreName>
            <surname>Faure</surname>
            <initial>A.</initial>
          </persName>
          <persName key="myriads-2018-idp166704">
            <foreName>Millian</foreName>
            <surname>Poquet</surname>
            <initial>M.</initial>
          </persName>
          <persName key="datamove-2018-idp128640">
            <foreName>Olivier</foreName>
            <surname>Richard</surname>
            <initial>O.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <month>April</month>
            <year>2018</year>
          </dateStruct>
          <ref xlink:href="https://hal.inria.fr/hal-01779936" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-01779936</ref>
        </imprint>
      </monogr>
      <note type="bnote">working paper or preprint</note>
    </biblStruct>
    
    <biblStruct id="datamove-2018-bid17" type="unpublished" rend="year" n="cite:neyron:hal-01805122">
      <identifiant type="hal" value="hal-01805122"/>
      <monogr>
        <title level="m">Grid'5000</title>
        <author>
          <persName key="datamove-2018-idp168496">
            <foreName>Pierre</foreName>
            <surname>Neyron</surname>
            <initial>P.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <month>June</month>
            <year>2018</year>
          </dateStruct>
          <ref xlink:href="https://hal.inria.fr/hal-01805122" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-01805122</ref>
        </imprint>
      </monogr>
      <note type="bnote">working paper or preprint</note>
    </biblStruct>
  </biblio>
</raweb>
