<?xml version="1.0" encoding="utf-8"?>
<raweb xmlns:xlink="http://www.w3.org/1999/xlink" xml:lang="en" year="2013">
  <identification id="roma" isproject="false">
    <shortname>ROMA</shortname>
    <projectName>Resource Optimization: Models, Algorithms, and scheduling</projectName>
    <theme-de-recherche>Distributed and High Performance Computing</theme-de-recherche>
    <domaine-de-recherche>Networks, Systems and Services, Distributed Computing</domaine-de-recherche>
    <datecreation>2012 February 01</datecreation>
    <structure_exterieure type="Labs">
      <libelle>Laboratoire de l'Informatique du Parallélisme (LIP)</libelle>
    </structure_exterieure>
    <structure_exterieure type="Organism">
      <libelle>CNRS</libelle>
    </structure_exterieure>
    <structure_exterieure type="Organism">
      <libelle>Université Claude Bernard (Lyon 1)</libelle>
    </structure_exterieure>
    <structure_exterieure type="Organism">
      <libelle>Ecole normale supérieure de Lyon</libelle>
    </structure_exterieure>
    <UR name="Grenoble"/>
    <keywords>
      <term>Scheduling</term>
      <term>Parallel And Distributed Algorithms</term>
      <term>Combinatorial Optimization</term>
      <term>Exascale Systems</term>
      <term>Fault Tolerance</term>
    </keywords>
    <moreinfo/>
  </identification>
  <team id="uid1">
    <person key="graal-2005-id18145">
      <firstname>Frédéric</firstname>
      <lastname>Vivien</lastname>
      <categoryPro>Chercheur</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Team leader, Inria, Senior Researcher</moreinfo>
      <hdr>oui</hdr>
    </person>
    <person key="roma-2013-idp140544574271440">
      <firstname>Jean-Yves</firstname>
      <lastname>L'Excellent</lastname>
      <categoryPro>Chercheur</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, Researcher</moreinfo>
      <hdr>oui</hdr>
    </person>
    <person key="graal-2005-id18473">
      <firstname>Loris</firstname>
      <lastname>Marchal</lastname>
      <categoryPro>Chercheur</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>CNRS, Researcher</moreinfo>
    </person>
    <person key="graal-2009-id59570">
      <firstname>Bora</firstname>
      <lastname>Uçar</lastname>
      <categoryPro>Chercheur</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>CNRS, Researcher</moreinfo>
    </person>
    <person key="graal-2005-id18164">
      <firstname>Anne</firstname>
      <lastname>Benoit</lastname>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>ENS Lyon and IUF, Associate Professor</moreinfo>
      <hdr>oui</hdr>
    </person>
    <person key="graal-2005-id18220">
      <firstname>Yves</firstname>
      <lastname>Robert</lastname>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>ENS Lyon and IUF, Professor</moreinfo>
      <hdr>oui</hdr>
    </person>
    <person key="scalapplix-2005-id18472">
      <firstname>Patrick</firstname>
      <lastname>Amestoy</lastname>
      <categoryPro>CollaborateurExterieur</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>INP Toulouse</moreinfo>
      <hdr>oui</hdr>
    </person>
    <person key="graal-2008-id18788">
      <firstname>Alfredo</firstname>
      <lastname>Buttari</lastname>
      <categoryPro>CollaborateurExterieur</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>CNRS</moreinfo>
    </person>
    <person key="mescal-2012-idp140606033435856">
      <firstname>Sheng</firstname>
      <lastname>Di</lastname>
      <categoryPro>PostDoc</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, since Dec. 2013, funded by Genci project</moreinfo>
    </person>
    <person key="graal-2011-idp140410991004288">
      <firstname>Guillaume</firstname>
      <lastname>Aupy</lastname>
      <categoryPro>PhD</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>ENS Lyon</moreinfo>
    </person>
    <person key="roma-2013-idp140544574293712">
      <firstname>Julien</firstname>
      <lastname>Herrmann</lastname>
      <categoryPro>PhD</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>ENS Lyon</moreinfo>
    </person>
    <person key="roma-2013-idp140544574296016">
      <firstname>Wissam M.</firstname>
      <lastname>Sid-Lakhdar</lastname>
      <categoryPro>PhD</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>ENS Lyon</moreinfo>
    </person>
    <person key="graal-2011-idp140410991039440">
      <firstname>Dounia</firstname>
      <lastname>Zaidouni</lastname>
      <categoryPro>PhD</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, funded by ANR RESCUE project</moreinfo>
    </person>
    <person key="roma-2013-idp140544574300624">
      <firstname>Enver</firstname>
      <lastname>Kayaaslan</lastname>
      <categoryPro>PostDoc</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria, since Oct. 2013</moreinfo>
    </person>
    <person key="graal-2009-id59416">
      <firstname>Evelyne</firstname>
      <lastname>Blesle</lastname>
      <categoryPro>Assistant</categoryPro>
      <research-centre>Grenoble</research-centre>
      <moreinfo>Inria</moreinfo>
    </person>
  </team>
  <presentation id="uid2">
    <bodyTitle>Overall Objectives</bodyTitle>
    <subsection id="uid3" level="1">
      <bodyTitle>Introduction</bodyTitle>
      <p>The <span class="smallcap" align="left">Roma</span> project aims at designing models, algorithms, and scheduling
strategies to optimize the execution of scientific applications.</p>
      <p>Scientists now have access to tremendous computing power. For
instance, the four most powerful computing platforms in the TOP 500
list <ref xlink:href="#roma-2013-bid0" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> each includes more than 500,000 cores and
deliver a sustained performance of more than 10 Peta FLOPS. The
volunteer computing platform BOINC <ref xlink:href="#roma-2013-bid1" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> is another example
with more than 440,000 enlisted computers and, on average, an
aggregate performance of more than 9 Peta FLOPS. Furthermore, it had
never been so easy for scientists to have access to parallel computing
resources, either through the multitude of local clusters or through
distant cloud computing platforms.</p>
      <p>Because parallel computing resources are ubiquitous, and because the
available computing power is so huge, one could believe that
scientists no longer need to worry about finding computing resources,
even less to optimize their usage. Nothing is farther from the
truth. Institutions and government agencies keep building larger and
more powerful computing platforms with a clear goal. These
platforms must allow to solve problems in reasonable timescales, which
were so far out of reach. They must also allow to solve
problems more precisely where the existing solutions are not deemed to be sufficiently
accurate. For those platforms to fulfill their purposes, their
computing power must therefore be carefully exploited and not be wasted.
This often requires an efficient management of all types of platform
resources: computation, communication, memory, storage, energy,
etc. This is often hard to achieve because of the characteristics of
new and emerging platforms. Moreover, because of technological
evolutions, new problems arise, and fully tried and tested solutions
need to be thoroughly overhauled or simply discarded and replaced.
Here are some of the difficulties that have, or
will have, to be overcome:</p>
      <simplelist>
        <li id="uid4">
          <p noindent="true">computing platforms are hierarchical: a processor includes
several cores, a node includes several processors, and the nodes
themselves are gathered into clusters. Algorithms must take
this hierarchical structure into account, in order to fully harness
the available computing power;</p>
        </li>
        <li id="uid5">
          <p noindent="true">the probability for a platform to suffer from a hardware fault automatically increases
with the number of its components. Fault-tolerance techniques become
unavoidable for large-scale platforms;</p>
        </li>
        <li id="uid6">
          <p noindent="true">the ever increasing gap between the computing power of nodes and
the bandwidths of memories and networks, in conjunction with the organization of
memories in deep hierarchies, requires to take more and more care of
the way algorithms use memory;</p>
        </li>
        <li id="uid7">
          <p noindent="true">energy considerations are unavoidable nowadays. Design specifications
for new computing platforms always include a maximal energy
consumption. The energy bill of a supercomputer may represent a
significant share of its cost over its lifespan. These issues must be
taken into account at the algorithm-design level.</p>
        </li>
      </simplelist>
      <p spacebefore="12.0pt">We are convinced that dramatic breakthroughs in algorithms and scheduling strategies
are required for the scientific computing community to overcome all
the challenges posed by new and emerging computing platforms.
This is required for
applications to be successfully deployed at very large scale, and hence for enabling the scientific computing community to push the frontiers of knowledge
as far as possible.
The <span class="smallcap" align="left">Roma</span> project-team aims at providing
fundamental algorithms, scheduling strategies, protocols, and software
packages to fulfill the needs encountered by a wide class of scientific
computing applications, including domains as diverse as geophysics,
structural mechanics, chemistry, electromagnetism, numerical
optimization, or computational fluid dynamics, to quote a few. To fulfill this goal, the <span class="smallcap" align="left">Roma</span> project-team takes a
special interest in dense and sparse linear algebra.</p>
      <p spacebefore="12.0pt">The work in the <span class="smallcap" align="left">Roma</span> team is organized along three research
themes.</p>
      <orderedlist>
        <li id="uid8">
          <p noindent="true"><b>Algorithms for probabilistic environments.</b> In this
theme, we consider problems where some of the platform
characteristics, or some of the application characteristics, are
described by probability distributions. This is in particular the case when
considering the resilience of applications in failure-prone
environments: the possibility of faults is modeled by probability distributions.</p>
        </li>
        <li id="uid9">
          <p noindent="true"><b>Platform-aware scheduling strategies.</b> In this theme, we
focus on the design of scheduling strategies that finely take into
account some platform characteristics beyond the most classical
ones, namely the computing speed of processors and accelerators,
and the communication bandwidth of network links. In the scope of
this theme, when designing scheduling strategies, we focus
either on the energy consumption or on the memory behavior. All
optimization problems under study are multi-criteria.</p>
        </li>
        <li id="uid10">
          <p noindent="true"><b>High-performance computing and linear algebra.</b> We work
on algorithms and tools for both sparse and dense linear algebra. In
sparse linear algebra, we work on most aspects of direct multifrontal
solvers for linear systems. In dense linear algebra, we focus on the
adaptation of factorization kernels to emerging and future
platforms. In addition, we also work on combinatorial scientific
computing, that is, on the design of combinatorial algorithms and
tools to solve combinatorial problems, such as those
encountered, for instance, in the preprocessing phases of solvers of
sparse linear systems.</p>
        </li>
      </orderedlist>
    </subsection>
    <subsection id="uid11" level="1">
      <bodyTitle>Highlights of the Year</bodyTitle>
      <p>Anne Benoit, Yves Robert and Frédéric Vivien published a textbook
entitled “A Guide to Algorithm Design: Paradigms, Methods, and
Complexity Analysis” <ref xlink:href="#roma-2013-bid2" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>.</p>
    </subsection>
  </presentation>
  <fondements id="uid12">
    <bodyTitle>Research Program</bodyTitle>
    <subsection id="uid13" level="1">
      <bodyTitle>Algorithms for probabilistic environments</bodyTitle>
      <p>There are two main research directions under this research theme. In
the first one, we consider the problem of the efficient execution of
applications in a failure-prone environment. Here, probability
distributions are used to describe the potential behavior of computing
platforms, namely when hardware components are subject to faults. In
the second research direction, probability distributions are used to
describe the characteristics and behavior of applications.</p>
      <subsection id="uid14" level="2">
        <bodyTitle>Application resilience</bodyTitle>
        <p>An application is resilient if it can successfully produce a correct
result in spite of potential faults in the underlying
system. Application resilience can involve a broad range of
techniques, including fault prediction, error detection, error
containment, error correction, checkpointing, replication, migration,
recovery, etc. Faults
are quite frequent in the most powerful existing supercomputers. The
Jaguar platform, which ranked third in the TOP 500 list in November
2011 <ref xlink:href="#roma-2013-bid3" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, had an average of 2.33 faults per day during
the period from August 2008 to February 2010 <ref xlink:href="#roma-2013-bid4" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. The
mean-time between faults of a platform is inversely proportional to its
number of components. Progresses will certainly be made in the coming
years with respect to the reliability of individual components.
However, designing and building high-reliability hardware components
is far more expensive than using lower reliability top-of-the-shelf
components. Furthermore, low-power components may not be available
with high-reliability. Therefore, it is feared that the progresses in
reliability will far from compensate the steady projected increase of
the number of components in the largest supercomputers. Already,
application failures have a huge computational cost. In 2008, the DARPA white
paper on “System resilience at extreme
scale” <ref xlink:href="#roma-2013-bid5" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> stated that high-end systems wasted
20% of their computing capacity on application failure and recovery.</p>
        <p>In such a context, any application using a significant fraction of a
supercomputer and running for a significant amount of time will have
to use some fault-tolerance solution. It would indeed be unacceptable
for an application failure to destroy centuries of CPU-time (some of the simulations
run on the Blue Waters platform consumed more than 2,700 years
of core computing time <ref xlink:href="#roma-2013-bid6" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> and lasted over 60
hours; the most time-consuming simulations of the US Department of
Energy (DoE) run for weeks to months on the most powerful existing
platforms <ref xlink:href="#roma-2013-bid7" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>).</p>
        <p>Our research on resilience follows two different directions. On the
one hand we design new resilience solutions, either generic
fault-tolerance solutions or algorithm-based solutions. On the other
hand we model and theoretically analyze the performance of existing
and future solutions, in order to tune their usage and help determine
which solution to use in which context.</p>
      </subsection>
      <subsection id="uid15" level="2">
        <bodyTitle>Scheduling strategies for applications with a
probabilistic behavior</bodyTitle>
        <p>Static scheduling algorithms are algorithms where all decisions are
taken before the start of the application execution. On the contrary,
in non-static algorithms, decisions may depend on events that happen
during the execution. Static scheduling algorithms are known to be
superior to dynamic and system-oriented approaches in stable
frameworks <ref xlink:href="#roma-2013-bid8" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, <ref xlink:href="#roma-2013-bid9" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, <ref xlink:href="#roma-2013-bid10" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, <ref xlink:href="#roma-2013-bid11" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, that is, when all
characteristics of platforms and applications are perfectly known,
known a priori, and do not evolve during the application execution.
In practice, the prediction of application characteristics may be
approximative or completely infeasible. For instance, the amount of
computations and of communications required to solve a given problem
in parallel may strongly depend on some input data that are hard to
analyze (this is for instance the case when solving linear systems
using full pivoting).</p>
        <p>We plan to consider applications whose characteristics change dynamically and are subject to
uncertainties. In order to benefit
nonetheless from the power of static approaches, we plan to model
application uncertainties and variations through probabilistic models,
and to design for these applications scheduling strategies that are
either static, or partially static and partially dynamic.</p>
      </subsection>
    </subsection>
    <subsection id="uid16" level="1">
      <bodyTitle>Platform-aware scheduling strategies</bodyTitle>
      <p>In this theme, we study and design scheduling strategies, focusing
either on energy consumption or on memory behavior.
In other words, when designing and evaluating these
strategies, we do not limit our view to the most classical
platform characteristics, that is, the computing speed of cores and
accelerators, and the bandwidth of communication links.</p>
      <p>In most existing studies, a single optimization objective is
considered, and the target is
some sort of absolute performance. For instance, most optimization
problems aim at the minimization of the overall execution time of the
application considered. Such an approach can lead to a very
significant waste of resources, because it does not take into account any
notion of efficiency nor of yield. For instance, it may not be
meaningful to use twice as many resources just to decrease by 10% the
execution time. In all our work, we plan to look only for algorithmic
solutions that make a “clever” usage of resources. However, looking
for the solution that optimizes a metric such as the efficiency, the
energy consumption, or the memory-peak minimization, is doomed for the
type of applications we consider. Indeed, in most cases, any optimal
solution for such a metric is a sequential solution, and sequential
solutions have prohibitive execution times.
Therefore, it becomes mandatory to consider multi-criteria approaches
where one looks for trade-offs between some user-oriented metrics that
are typically related to notions of Quality of Service—execution
time, response time, stretch, throughput, latency, reliability,
etc.—and some system-oriented metrics that guarantee that resources
are not wasted. In general, we will not look for the Pareto curve, that is, the
set of all dominating solutions for the considered
metrics. Instead, we will rather look for solutions that minimize some
given objective while satisfying some bounds, or “budgets”, on all
the other objectives.</p>
      <subsection id="uid17" level="2">
        <bodyTitle>Energy-aware algorithms</bodyTitle>
        <p>Energy-aware scheduling has proven an important issue in the past
decade, both for economical and environmental reasons. Energy issues
are obvious for battery-powered systems. They are now also important
for traditional computer systems. Indeed, the design specifications
of any new computing platform now always include an upper bound on energy
consumption. Furthermore, the energy bill of a supercomputer may
represent a significant share of its cost over its lifespan.</p>
        <p>Technically, a processor running at speed <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>s</mi></math></formula> dissipates <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msup><mi>s</mi><mi>α</mi></msup></math></formula> watts
per unit of time with <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mn>2</mn><mo>≤</mo><mi>α</mi><mo>≤</mo><mn>3</mn></mrow></math></formula> <ref xlink:href="#roma-2013-bid12" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, <ref xlink:href="#roma-2013-bid13" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, <ref xlink:href="#roma-2013-bid14" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>; hence, it consumes
<formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><msup><mi>s</mi><mi>α</mi></msup><mo>×</mo><mi>d</mi></mrow></math></formula> joules when operated during <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>d</mi></math></formula> units of
time. Therefore, energy consumption can be reduced by using speed
scaling techniques. However it was shown in <ref xlink:href="#roma-2013-bid15" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> that
reducing the speed of a processor increases the rate of transient
faults in the system. The probability of faults increases
exponentially, and this probability cannot be neglected in large-scale
computing <ref xlink:href="#roma-2013-bid16" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. In order to make up for the loss in <i>reliability</i> due to the energy efficiency, different models have
been proposed for fault tolerance: (i) <i>re-execution</i> consists in
re-executing a task that does not meet the reliability constraint <ref xlink:href="#roma-2013-bid15" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>; (ii) <i>replication</i> consists in executing the
same task on several processors simultaneously, in order to meet the
reliability constraints <ref xlink:href="#roma-2013-bid17" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>; and (iii)
<i>checkpointing</i> consists in “saving” the work done at some
certain instants, hence reducing the amount of work lost
when a failure occurs <ref xlink:href="#roma-2013-bid18" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>.</p>
        <p>Energy issues must be
taken into account at all levels, including the algorithm-design
level. We plan to both evaluate the energy consumption of existing
algorithms and to design new algorithms that minimize energy
consumption using tools such as resource selection, dynamic frequency
and voltage scaling, or powering-down of hardware components.</p>
      </subsection>
      <subsection id="uid18" level="2">
        <bodyTitle>Memory-aware algorithms</bodyTitle>
        <p>For many years, the bandwidth between memories and processors
has increased more slowly than the computing power of processors, and the
latency of memory accesses has been improved at an even slower pace.
Therefore, in the time needed for a processor to perform a floating
point operation, the amount of data transferred between the memory and the
processor has been decreasing
with each passing year. The risk is for
an application to reach a point where the time needed to solve a
problem is no longer dictated by the processor computing power but by
the memory characteristics, comparable to the <i>memory wall</i> that
limits CPU performance. In such a case, processors would be greatly
under-utilized, and a large part of the computing power of the platform
would be wasted. Moreover, with the advent of multicore processors,
the amount of memory per core has started to stagnate, if not to
decrease. This is especially harmful to memory intensive
applications. The problems related to the sizes and the bandwidths of
memories are further exacerbated on modern computing platforms because
of their deep and highly heterogeneous hierarchies. Such a hierarchy
can extend from core private caches to shared memory within a CPU, to disk
storage and even tape-based storage systems, like in the Blue Waters
supercomputer <ref xlink:href="#roma-2013-bid19" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. It may also be the case that
heterogeneous cores are used (such as hybrid CPU and GPU computing),
and that each of them has a limited memory.</p>
        <p>Because of these trends, it is becoming more and more important to
precisely take memory constraints into account when designing
algorithms. One must not only take care of the amount of memory
required to run an algorithm, but also of the way this memory is
accessed. Indeed, in some cases, rather than to minimize the amount of
memory required to solve the given problem, one will have to maximize
data reuse and, especially, to minimize the amount of data transferred
between the different levels of the memory hierarchy (minimization
of the volume of memory inputs-outputs). This is, for instance, the
case when a problem cannot be solved by just using the in-core memory
and that any solution must be out-of-core, that is, must use disks as
storage for temporary data.</p>
        <p>It is worth noting that the cost of moving data has lead to the
development of so called “communication-avoiding
algorithms” <ref xlink:href="#roma-2013-bid20" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. Our approach is orthogonal to
these efforts: in communication-avoiding algorithms, the application
is modified, in particular some redundant work is done, in order to
get rid of some communication operations, whereas in our approach, we do not modify
the application, which is provided as a task graph, but we
minimize the needed memory peak only by carefully scheduling tasks.</p>
      </subsection>
    </subsection>
    <subsection id="uid19" level="1">
      <bodyTitle>High-performance computing and linear algebra</bodyTitle>
      <p>Our work on high-performance computing and linear algebra is organized
along three research directions. The first direction is devoted to direct solvers
of sparse linear systems. The second direction is devoted to combinatorial
scientific computing, that is, the design of combinatorial algorithms
and tools that solve problems encountered in some of the other
research themes, like the problems faced in the preprocessing phases of
sparse direct solvers. The last direction deals with the adaptation of
classical dense linear algebra kernels to the architecture of future
computing platforms.</p>
      <subsection id="uid20" level="2">
        <bodyTitle>Direct solvers for sparse linear systems</bodyTitle>
        <p>The solution of sparse systems of linear equations (symmetric or
unsymmetric, often with an irregular structure, from a few hundred
thousand to a few hundred million equations) is at the heart
of many scientific applications arising in domains such as
geophysics, structural mechanics, chemistry, electromagnetism,
numerical optimization, or computational fluid dynamics, to cite
a few. The importance and diversity of
applications are a main motivation to pursue research
on sparse linear solvers. Because of this wide range of applications,
any significant progress on solvers will have a significant
impact in the world of simulation.
Research on sparse direct solvers in general is very active for the following main reasons:</p>
        <simplelist>
          <li id="uid21">
            <p noindent="true">many applications fields require large-scale simulations
that are still too big or too complicated with respect to today's
solution methods;</p>
          </li>
          <li id="uid22">
            <p noindent="true">the current evolution of architectures with massive,
hierarchical, multicore parallelism imposes to overhaul all existing
solutions, which represents a major challenge for algorithm and
software development;</p>
          </li>
          <li id="uid23">
            <p noindent="true">the evolution of numerical needs and types of simulations increase the
importance, frequency, and size of certain classes of matrices, which may benefit from a specialized processing (rather than resort
to a generic one).</p>
          </li>
        </simplelist>
        <p>Our research in the field is strongly related to the
software package <span class="smallcap" align="left">Mumps</span> (see Section <ref xlink:href="#uid29" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>).
<span class="smallcap" align="left">Mumps</span> is both an experimental
platform for academics in the field of sparse
linear algebra, and a software package that is widely used in both
academia and industry. The
software package <span class="smallcap" align="left">Mumps</span> enables us to (i) confront our research to the real world,
(ii) develop contacts and collaborations, and (iii) receive continuous
feedback from real-life applications, which is extremely critical to
validate our research work. The feedback from a large user community
also enables us to direct our long-term objectives towards meaningful
directions.</p>
        <p>In this context, we aim at designing parallel sparse direct methods that will
scale to large modern platforms, and that are able to answer new challenges
arising from applications, both
efficiently—from a resource consumption point of view—and
accurately—from a numerical point of view. For that, and even with
increasing parallelism, we do not want to sacrifice in any manner numerical
stability, based on threshold partial pivoting, one of the main originalities
of our approach (our “trademark”)
in the context of direct solvers for distributed-memory
computers; although this makes the parallelization more complicated,
applying the same pivoting strategy as in the serial case ensures
numerical robustness of our approach, which we generally measure in
terms of sparse backward error.
In order to solve the hard problems
resulting from the always-increasing demands in simulations,
special attention must also necessarily be paid to memory usage (and not only execution
time). This requires specific algorithmic choices
and scheduling techniques. From a complementary point of view, it is
also necessary to be aware of the functionality requirements from
the applications and from the users, so that robust solutions can
be proposed for a wide range of applications.</p>
        <p>Among direct methods, we rely on the multifrontal
method <ref xlink:href="#roma-2013-bid21" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, <ref xlink:href="#roma-2013-bid22" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, <ref xlink:href="#roma-2013-bid23" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>.
This method usually exhibits a good data locality and hence is efficient in cache-based systems.
The task graph associated with the multifrontal method is in the form of a tree whose characteristics
should be exploited in a parallel implementation.</p>
        <p>Our work is organized along two main research directions. In the
first one we aim at efficiently addressing new architectures that
include massive, hierarchical parallelism. In the second one, we aim
at reducing the running time complexity and the memory requirements of
direct solvers, while controlling accuracy.</p>
      </subsection>
      <subsection id="uid24" level="2">
        <bodyTitle>Combinatorial scientific computing</bodyTitle>
        <p>Combinatorial scientific computing (CSC) is a recently coined term (circa 2002)
for interdisciplinary research at the intersection of discrete mathematics,
computer science, and scientific computing. In particular, it refers to the
development, application, and analysis of combinatorial algorithms to enable
scientific computing applications. CSC's deepest roots are in the realm of
direct methods for solving sparse linear systems of equations where graph
theoretical models have been central to the exploitation of sparsity,
since the 1960s.
The general approach is to identify performance
issues in a scientific computing problem, such as memory use, parallel speed up, and/or the rate of convergence
of a method, and to develop combinatorial
algorithms and models to tackle those issues.</p>
        <p>Our target scientific computing applications are (i) the preprocessing
phases of direct methods (in particular MUMPS), iterative methods, and hybrid methods
for solving linear systems of equations; and (ii) the mapping of tasks
(mostly the sub-tasks of the mentioned solvers) onto modern computing
platforms. We focus on the development and use of graph and
hypergraph models, and related tools such as hypergraph partitioning algorithms,
to solve problems of load balancing and task mapping. We also focus on
bipartite graph matching and vertex ordering methods for reducing the memory
overhead and computational requirements of solvers. Although we direct
our attention on these models and algorithms through the lens of
linear system solvers, our solutions are general enough to be applied to some
other resource optimization problems.</p>
      </subsection>
      <subsection id="uid25" level="2">
        <bodyTitle>Dense linear algebra on post-petascale multicore platforms</bodyTitle>
        <p>The quest for efficient, yet portable, implementations of dense linear
algebra kernels (QR, LU, Cholesky) has never stopped, fueled in part by each new
technological evolution. First, the LAPACK library <ref xlink:href="#roma-2013-bid24" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>
relied on BLAS level 3 kernels (Basic Linear Algebra Subroutines) that
enable to fully harness the computing power of a single CPU. Then the
<span class="smallcap" align="left">ScaLAPACK</span> library <ref xlink:href="#roma-2013-bid25" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> built upon LAPACK to
provide a coarse-grain parallel version, where processors operate on
large block-column panels. Inter-processor communications occur
through highly tuned MPI send and receive primitives. The advent of
multi-core processors has led to a major modification in these
algorithms <ref xlink:href="#roma-2013-bid26" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, <ref xlink:href="#roma-2013-bid27" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, <ref xlink:href="#roma-2013-bid28" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. Each
processor runs several threads in parallel to keep all cores within
that processor busy. Tiled versions of the algorithms have thus been
designed: dividing large block-column panels into several tiles allows
for a decrease in the granularity down to a level where many
smaller-size tasks are spawned. In the current panel, the diagonal
tile is used to eliminate all the lower tiles in the panel. Because the
factorization of the whole panel is now broken into the elimination of
several tiles, the update operations can also be partitioned at the
tile level, which generates many tasks to feed all cores.</p>
        <p>The number of cores per processor will keep increasing in the
following years. It is projected that high-end processors will include
at least a few hundreds of cores. This evolution will require to
design new versions of libraries. Indeed, existing libraries rely on a
static distribution of the work: before the beginning of the execution
of a kernel, the location and time of the execution of all of its
component is decided. In theory, static solutions enable to precisely
optimize executions, by taking parameters like data
locality into account. At run time, these solutions proceed at the pace of the
slowest of the cores, and they thus require a perfect
load-balancing. With a few hundreds, if not a thousand, cores per
processor, some tiny differences between the computing times on the
different cores (“jitter”) are unavoidable and irremediably condemn purely static
solutions. Moreover, the increase in the number of cores per processor
once again mandates to increase the number of tasks that can be
executed in parallel.</p>
        <p>We study solutions that are part-static part-dynamic, because such
solutions have been shown to outperform purely dynamic ones <ref xlink:href="#roma-2013-bid29" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>.
On the one hand, the distribution of work among the different nodes will
still be statically defined. On the other hand, the mapping and the
scheduling of tasks inside a processor will be dynamically
defined. The main difficulty when building such a solution will be to
design lightweight dynamic schedulers that are able to guarantee both an excellent
load-balancing and a very efficient use of data locality.</p>
      </subsection>
    </subsection>
  </fondements>
  <domaine id="uid26">
    <bodyTitle>Application Domains</bodyTitle>
    <subsection id="uid27" level="1">
      <bodyTitle>Application of sparse direct solvers</bodyTitle>
      <p>Sparse direct (multifrontal) solvers in distributed-memory
environments have a wide range of applications as they are
used at the heart of many numerical methods in simulation: whether a
model uses finite elements or finite differences, or requires the
optimization of a complex linear or nonlinear function, one often
ends up solving a linear system of equations involving sparse
matrices. There are therefore a number of application fields,
among which some of the ones cited by the users of
our sparse direct solver <span class="smallcap" align="left">Mumps</span> (see
Section <ref xlink:href="#uid29" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>) are:
structural mechanics, biomechanics, medical image processing, tomography,
geophysics,
electromagnetism, fluid dynamics, econometric models, oil reservoir
simulation, magneto-hydro-dynamics, chemistry, acoustics,
glaciology, astrophysics, circuit simulation, and work on hybrid
direct-iterative methods.</p>
    </subsection>
  </domaine>
  <logiciels id="uid28">
    <bodyTitle>Software and Platforms</bodyTitle>
    <subsection id="uid29" level="1">
      <bodyTitle>MUMPS</bodyTitle>
      <participants>
        <person key="scalapplix-2005-id18472">
          <firstname>Patrick</firstname>
          <lastname>Amestoy</lastname>
        </person>
        <person key="graal-2008-id18788">
          <firstname>Alfredo</firstname>
          <lastname>Buttari</lastname>
        </person>
        <person key="roma-2013-idp140544574271440">
          <firstname>Jean-Yves</firstname>
          <lastname>L'Excellent</lastname>
          <moreinfo>correspondent</moreinfo>
        </person>
        <person key="roma-2013-idp140544574296016">
          <firstname>Wissam M.</firstname>
          <lastname>Sid-Lakhdar</lastname>
        </person>
        <person key="graal-2009-id59570">
          <firstname>Bora</firstname>
          <lastname>Uçar</lastname>
        </person>
      </participants>
      <p><span class="smallcap" align="left">Mumps</span> (for <i>MUltifrontal Massively Parallel Solver</i>)
see
<ref xlink:href="http://mumps-solver.org" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>mumps-solver.<allowbreak/>org</ref>
is a software package for the solution of large sparse systems of linear equations.
It implements a direct method, the so called multifrontal method; it is a parallel
code capable of exploiting distributed-memory computers as well as multithreaded
libraries; its main originalities
are its numerical robustness and the wide range of functionalities available.</p>
      <p>The latest public release is <span class="smallcap" align="left">Mumps</span> 4.10.0 (May 2011).</p>
      <p>The development of <span class="smallcap" align="left">Mumps</span> was initiated by the European
project PARASOL (Esprit 4, LTR project 20160, 1996-1999), whose
results and developments were public domain. Since then,
<span class="smallcap" align="left">Mumps</span> has been supported by CERFACS,
CNRS, ENS Lyon, INPT(ENSEEIHT)-IRIT,
Inria, and University of Bordeaux.
Following a contractual agreement signed by those institutes,
the next release of <span class="smallcap" align="left">Mumps</span> will be distributed under the
Cecill-C license; a technical committee was also defined,
currently composed of Patrick Amestoy, Abdou Guermouche,
and Jean-Yves L'Excellent.</p>
      <p>In the context of an ADT project (Action of Technological Development),
Maurice Brémond (from Inria “SED” service in Grenoble) also worked part-time
on the project, in particular on visualization tools helping
researchers to analyze the behaviour of a parallel MUMPS execution.</p>
      <p>More information on <span class="smallcap" align="left">Mumps</span> is available on
<ref xlink:href="http://mumps-solver.org" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>mumps-solver.<allowbreak/>org</ref>.
See also Section <ref xlink:href="#uid50" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> of this report.</p>
    </subsection>
  </logiciels>
  <resultats id="uid30">
    <bodyTitle>New Results</bodyTitle>
    <subsection id="uid31" level="1">
      <bodyTitle>Scheduling tree-shaped task graphs to minimize memory and makespan</bodyTitle>
      <p>In this work <ref xlink:href="#roma-2013-bid30" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we investigate the
execution of tree-shaped task graphs using multiple processors. Each
edge of such a tree represents a large IO file. A task can only be
executed if all input and output files fit into memory, and a file
can only be removed from memory after it has been consumed. Such
trees arise, for instance, in the multifrontal method of sparse
matrix factorization. The maximum amount of memory needed depends on
the execution order of the tasks. With one processor the objective
of the tree traversal is to minimize the required memory. This
problem was well studied and optimal polynomial algorithms were
proposed. Here, we extend the problem by considering multiple
processors, which is of obvious interest in the application area of
matrix factorization. With the multiple processors comes the
additional objective to minimize the time needed to traverse the
tree, i.e., to minimize the makespan. Not surprisingly, this problem
proves to be much harder than the sequential one. We study the
computational complexity of this problem and provide an
inapproximability result even for unit weight trees. Several
heuristics are proposed, each with a different optimization focus,
and they are analyzed in an extensive experimental evaluation using
realistic trees.
</p>
    </subsection>
    <subsection id="uid32" level="1">
      <bodyTitle>Model and complexity results for tree traversals on hybrid platforms</bodyTitle>
      <p>In this work <ref xlink:href="#roma-2013-bid31" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we study the complexity
of traversing tree-shaped workflows whose tasks require large I/O
files. We target a heterogeneous architecture with two resources of
different types, where each resource has its own memory, such as a
multicore node equipped with a dedicated accelerator (FPGA or
GPU). Tasks in the workflow are tagged with the type of resource
needed for their processing. Besides, a task can be processed on a
given resource only if all its input files and output files can be
stored in the corresponding memory. At a given execution step, the
amount of data stored in each memory strongly depends upon the
ordering in which the tasks are executed, and upon when
communications between both memories are scheduled. The objective is
to determine an efficient traversal that minimizes the maximum
amount of memory of each type needed to traverse the whole tree. In
this work, we establish the complexity of this two-memory
scheduling problem, provide inapproximability results, and show how
to determine the optimal depth-first traversal. Altogether, these
results lay the foundations for memory-aware scheduling algorithms
on heterogeneous platforms.
</p>
    </subsection>
    <subsection id="uid33" level="1">
      <bodyTitle>On the combination of silent error detection and checkpointing</bodyTitle>
      <p>In this work <ref xlink:href="#roma-2013-bid32" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we revisit traditional
checkpointing and rollback recovery strategies, with a focus on
silent data corruption errors. Contrarily to fail-stop failures,
such latent errors cannot be detected immediately, and a mechanism
to detect them must be provided. We consider two models: (i) errors
are detected after some delays following a probability distribution
(typically, an Exponential distribution); (ii) errors are detected
through some verification mechanism. In both cases, we compute the
optimal period in order to minimize the waste, i.e., the fraction of
time where nodes do not perform useful computations. In practice,
only a fixed number of checkpoints can be kept in memory, and the
first model may lead to an irrecoverable failure. In this case, we
compute the minimum period required for an acceptable risk. For the
second model, there is no risk of irrecoverable failure, owing to
the verification mechanism, but the corresponding overhead is
included in the waste. Finally, both models are instantiated using
realistic scenarios and application/architecture parameters.
</p>
    </subsection>
    <subsection id="uid34" level="1">
      <bodyTitle>Checkpointing algorithms and fault prediction</bodyTitle>
      <p>In this series of work <ref xlink:href="#roma-2013-bid33" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, <ref xlink:href="#roma-2013-bid34" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>,
we deal with the impact of fault prediction techniques on
checkpointing strategies, when the fault-prediction system provides
either prediction windows or exact predictions. We extend the
classical first-order analysis of Young and Daly in the presence of
a fault prediction system, characterized by its recall and its
precision. In this framework, we provide optimal algorithms to
decide whether and when to take predictions into account, and we
derive the optimal value of the checkpointing period. These results
allow us to analytically assess the key parameters that impact the
performance of fault predictors at very large scale.
</p>
    </subsection>
    <subsection id="uid35" level="1">
      <bodyTitle>Mapping applications on volatile resources</bodyTitle>
      <p>In this series of
work <ref xlink:href="#roma-2013-bid35" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, <ref xlink:href="#roma-2013-bid36" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, <ref xlink:href="#roma-2013-bid37" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>,
we study the execution of iterative applications on volatile
processors such as those found on desktop grids. We envision two
models, one where all tasks are assumed to be independent, and
another where all tasks are tightly coupled and keep exchanging
information throughout the iteration. These two models cover the two
extreme points of the parallelization spectrum. We develop
master-worker scheduling schemes that attempt to achieve good
trade-offs between worker speed and worker availability. Any
iteration entails the execution of a fixed number of independent
tasks or of tightly-coupled tasks. A key feature of our approach is
that we consider a communication model where the bandwidth capacity
of the master for sending application data to workers is
limited. This limitation makes the scheduling problem more difficult
both in a theoretical sense and in a practical sense. Furthermore,
we consider that a processor can be in one of three states:
available, down, or temporarily preempted by its owner. This
preempted state also complicates the scheduling problem. In
practical settings, e.g., desktop grids, master bandwidth is limited
and processors are temporarily reclaimed. Consequently, addressing
the aforementioned difficulties is necessary for successfully
deploying master-worker applications on volatile platforms. Our
first contribution is to determine the complexity of the scheduling
problems in their offline versions, i.e., when processor
availability behaviors are known in advance. Even with this
knowledge, the problems are NP-hard. Our second contribution is an
evaluation of the expectation of the time needed by a worker to
complete a set of tasks. We obtain a close formula for independent
tasks and an analytical approximation for tightly-coupled
tasks. Those evaluations rely on a Markovian assumption for the
temporal availability of processors, and are at the heart of some
heuristics that aim at favoring “reliable” processors in a
sensible manner. Our third contribution is a set of heuristics for
both models, which we evaluate in simulation. Our results provide
guidance to selecting the best strategy as a function of processor
state availability versus average task duration.
</p>
    </subsection>
    <subsection id="uid36" level="1">
      <bodyTitle>Using group replication for resilience on exascale systems</bodyTitle>
      <p>High performance computing applications must be resilient to
faults. The traditional fault-tolerance solution is
checkpoint-recovery, by which application state is saved to and
recovered from secondary storage throughout execution. It has been
shown that, even when using an optimal checkpointing strategy, the
checkpointing overhead precludes high parallel efficiency at large
scale. Additional fault-tolerance mechanisms must thus be used. Such
a mechanism is replication, i.e., multiple processors performing the
same computation so that a processor failure does not necessarily
imply an application failure. In spite of resource waste,
replication can lead to higher parallel efficiency when compared to
using only checkpoint-recovery at large scale. In this
work <ref xlink:href="#roma-2013-bid38" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we propose to execute and
checkpoint multiple application instances concurrently, an approach
we term group replication. For Exponential failures we give an upper
bound on the expected application execution time. This bound
corresponds to a particular checkpointing period that we derive. For
general failures, we propose a dynamic programming algorithm to
determine non-periodic checkpoint dates as well as an empirical
periodic checkpointing solution whose period is found via a
numerical search. Using simulation we evaluate our proposed
approaches, including comparison to the non-replication case, for
both Exponential and Weibull failure distributions. Our broad
finding is that group replication is useful in a range of realistic
application and checkpointing overhead scenarios for future exascale
platforms.
</p>
    </subsection>
    <subsection id="uid37" level="1">
      <bodyTitle>Unified model for assessing checkpointing
protocols at extreme-scale</bodyTitle>
      <p>In this work <ref xlink:href="#roma-2013-bid39" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we present a unified model
for several well-known checkpoint/restart protocols. The proposed
model is generic enough to encompass both extremes of the
checkpoint/restart space, from coordinated approaches to a variety
of uncoordinated checkpoint strategies (with message logging). We
identify a set of crucial parameters, instantiate them and compare
the expected efficiency of the fault tolerant protocols, for a given
application/platform pair. We then propose a detailed analysis of
several scenarios, including some of the most powerful currently
available HPC platforms, as well as anticipated Exascale
designs. The results of this analytical comparison are corroborated
by a comprehensive set of simulations. Altogether, they outline
comparative behaviors of checkpoint strategies at very large scale,
thereby providing insight that is hardly accessible to direct
experimentation.
</p>
    </subsection>
    <subsection id="uid38" level="1">
      <bodyTitle>Revisiting the double checkpointing algorithm</bodyTitle>
      <p>In this work <ref xlink:href="#roma-2013-bid40" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we study fast checkpointing algorithms which require distributed access to stable storage. This work revisits the approach base upon double checkpointing, and compares the blocking algorithm of Zheng, Shi, and Kalé, with the non-blocking algorithm of Ni, Meneses, and Kalé in terms of both performance and risk. We also extend the model that they have proposed to assess the impact of the overhead associated to non-blocking communications. We then provide a new peer-to-peer checkpointing algorithm, called the triple checkpointing algorithm, that can work at constant memory, and achieves both higher efficiency and better risk handling than the double checkpointing algorithm. We provide performance and risk models for all the evaluated protocols, and compare them through comprehensive simulations.
</p>
    </subsection>
    <subsection id="uid39" level="1">
      <bodyTitle>Multi-criteria checkpointing strategies: Optimizing response-time versus resource utilization</bodyTitle>
      <p>Failures are increasingly threatening the efficiency of HPC systems,
and current projections of Exascale platforms indicate that
rollback recovery, the most convenient method for providing fault
tolerance to general-purpose applications, reaches its own limits at such scales. One of
the reasons explaining this unnerving situation comes from the focus
that has been given to per-application completion time, rather than to platform
efficiency. In this work <ref xlink:href="#roma-2013-bid41" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we discuss the case of
uncoordinated rollback recovery where the idle time spent waiting
recovering processors is used to progress a different, independent
application from the system batch queue. We then propose an extended
model of uncoordinated checkpointing that can discriminate between
idle time and wasted computation. We instantiate this model in a simulator to
demonstrate that, with this strategy, uncoordinated
checkpointing per application completion time is unchanged, while
it delivers near-perfect platform efficiency.
</p>
    </subsection>
    <subsection id="uid40" level="1">
      <bodyTitle>Optimal checkpointing period: Time vs. energy</bodyTitle>
      <p>In this work <ref xlink:href="#roma-2013-bid42" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we deal with parallel scientific applications using non-blocking and periodic coordinated checkpointing to enforce resilience. We provide a model and detailed formulas for total execution time and consumed energy. We characterize the optimal period for both objectives, and we assess the range of time/energy trade-offs to be made by instantiating the model with a set of realistic scenarios for Exascale systems. We give a particular emphasis to I/O transfers, because the relative cost of communication is expected to dramatically increase, both in terms of latency and consumed energy, for future Exascale platforms.
</p>
    </subsection>
    <subsection id="uid41" level="1">
      <bodyTitle>Energy-aware checkpointing of divisible tasks with soft or hard deadlines</bodyTitle>
      <p>In this work <ref xlink:href="#roma-2013-bid43" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we aim at minimizing the energy consumption when executing a divisible workload under a bound on the total execution time, while resilience is provided through checkpointing. We discuss several variants of this multi-criteria problem. Given the workload, we need to decide how many chunks to use, what are the sizes of these chunks, and at which speed each chunk is executed. Furthermore, since a failure may occur during the execution of a chunk, we also need to decide at which speed a chunk should be re-executed in the event of a failure. The goal is to minimize the expectation of the total energy consumption, while enforcing a deadline on the execution time, that should be met either in expectation (soft deadline), or in the worst case (hard deadline). For each problem instance, we propose either an exact solution, or a function that can be optimized numerically. The different models are then compared through an extensive set of experiments.
</p>
    </subsection>
    <subsection id="uid42" level="1">
      <bodyTitle>Assessing the performance of energy-aware mappings</bodyTitle>
      <p>In this work <ref xlink:href="#roma-2013-bid44" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we aim at mapping streaming applications that can be modeled by a series-parallel graph onto a 2-dimensional tiled chip multiprocessor (CMP) architecture. The objective of the mapping is to minimize the energy consumption, using dynamic voltage and frequency scaling (DVFS) techniques, while maintaining a given level of performance, reflected by the rate of processing the data streams. This mapping problem turns out to be NP-hard, and several heuristics are proposed. We assess their performance through comprehensive simulations using the StreamIt workflow suite and randomly generated series-parallel graphs, and various CMP grid sizes.
</p>
    </subsection>
    <subsection id="uid43" level="1">
      <bodyTitle>Computing the throughput of probabilistic and replicated streaming applications</bodyTitle>
      <p>In this work <ref xlink:href="#roma-2013-bid45" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we investigate how to compute
the throughput of probabilistic and replicated streaming
applications. We are given (i) a streaming application whose
dependence graph is a linear chain; (ii) a one-to-many mapping of the
application onto a fully heterogeneous target platform, where a
processor is assigned at most one application stage, but where a stage
can be replicated onto a set of processors; and (iii) a set of random
variables modeling the computation and communication times in the
mapping. We show how to compute the throughput of the application,
i.e., the rate at which data sets can be processed, under two
execution models, the Strict model where the actions of each processor
are sequentialized, and the Overlap model where a processor can
compute and communicate in parallel. The problem is easy when
application stages are not replicated, i.e., assigned to a single
processor: in that case the throughput is dictated by the critical
hardware resource. However, when stages are replicated, i.e., assigned
to several processors, the problem becomes surprisingly complicated:
even in the deterministic case, the optimal throughput may be lower
than the smallest internal resource throughput. The first contribution
of this work is to provide a general method to compute the throughput when mapping parameters are constant or follow I.I.D. exponential laws. The second contribution is to provide bounds for the throughput when stage parameters (computation and communication times) form associated random sequences, and are N.B.U.E. (New Better than Used in Expectation) variables: the throughput is bounded from below by the exponential case and bounded from above by the deterministic case. An extensive set of simulation allows us to assess the quality of the model, and to observe the actual behavior of several distributions.
</p>
    </subsection>
    <subsection id="uid44" level="1">
      <bodyTitle>Reliability and performance optimization of pipelined real-time systems</bodyTitle>
      <p>In this work <ref xlink:href="#roma-2013-bid46" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we consider pipelined real-time systems that consist of a chain of tasks executing on a distributed platform. The processing of the tasks is pipelined: each processor executes only one interval of consecutive tasks. We are interested in minimizing both the input-output latency and the period of application mapping. For dependability reasons, we are also interested in maximizing the reliability of the system. We therefore assign several processors to each interval of tasks, so as to increase the reliability of the system. Both processors and communication links are unreliable and subject to transient failures. We assume that the arrival of the failures follows a constant parameter Poisson law, and that the failures are statistically independent events. We study several variants of this multiprocessor mapping problem, with several hypotheses on the target platform (homogeneous/heterogeneous speeds and/or failure rates). We provide NP-hardness complexity results, and optimal mapping algorithms for polynomial problem instances. Efficient heuristics are presented to solve the general case, and experimental results are provided.
</p>
    </subsection>
    <subsection id="uid45" level="1">
      <bodyTitle>Scheduling linear chain streaming applications on heterogeneous systems with failures</bodyTitle>
      <p>In this work <ref xlink:href="#roma-2013-bid47" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we study the problem of optimizing the throughput of streaming applications for heterogeneous platforms subject to failures. Applications are linear graphs of tasks (pipelines), with a type associated to each task. The challenge is to map each task onto one machine of a target platform, each machine having to be specialized to process only one task type, given that every machine is able to process all the types before being specialized in order to avoid costly setups. The objective is to maximize the throughput, i.e., the rate at which jobs can be processed when accounting for failures. Each instance can thus be performed by any machine specialized in its type and the workload of the system can be shared among a set of specialized machines. For identical machines, we prove that an optimal solution can be computed in polynomial time. However, the problem becomes NP-hard when two machines may compute the same task type at different speeds. Several polynomial time heuristics are designed for the most realistic specialized settings. Simulation results assess their efficiency, showing that the best heuristics obtain a good throughput, much better than the throughput obtained with a random mapping. Moreover, the throughput is close to the optimal solution in the particular cases where the optimal throughput can be computed.
</p>
    </subsection>
    <subsection id="uid46" level="1">
      <bodyTitle>A survey of pipelined workflow scheduling: Models and algorithms</bodyTitle>
      <p>In this survey <ref xlink:href="#roma-2013-bid48" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we consider a large class of applications that need to execute the same workflow on different data sets of identical size. Efficient execution of such applications necessitates intelligent distribution of the application components and tasks on a parallel machine, and the execution can be orchestrated by utilizing task-, data-, pipelined-, and/or replicated-parallelism. The scheduling problem that encompasses all of these techniques is called pipelined workflow scheduling, and it has been widely studied in the last decade. Multiple models and algorithms have flourished to tackle various programming paradigms, constraints, machine behaviors or optimization goals. This work surveys the field by summing up and structuring known results and approaches.
</p>
    </subsection>
    <subsection id="uid47" level="1">
      <bodyTitle>Reclaiming the energy of a schedule: Models and algorithms</bodyTitle>
      <p>In this work <ref xlink:href="#roma-2013-bid49" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we consider a task graph to be
executed on a set of processors. We assume that the mapping is given,
say by an ordered list of tasks to execute on each processor, and we
aim at optimizing the energy consumption while enforcing a prescribed
bound on the execution time. Although it is not possible to change the
allocation of a task, it is possible to change its execution speed. Rather than using a local approach such as backfilling, we consider the problem as a whole and study the impact of several speed variation models on its complexity. For continuous speeds, we give a closed-form formula for trees and series-parallel graphs, and we cast the problem into a geometric programming problem for general directed acyclic graphs. We show that the classical dynamic voltage and frequency scaling (DVFS) model with discrete modes leads to an NP-complete problem, even if the modes are regularly distributed (an important particular case in practice, which we analyze as the incremental model). On the contrary, the Vdd-hopping model that allows to switch between different supply voltages (VDD) while executing a task leads to a polynomial solution. Finally, we provide an approximation algorithm for the incremental model, which we extend for the general DVFS model.
</p>
    </subsection>
    <subsection id="uid48" level="1">
      <bodyTitle>Non-clairvoyant reduction algorithms for heterogeneous platforms</bodyTitle>
      <p>In this work <ref xlink:href="#roma-2013-bid50" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we revisit the classical problem of
the reduction collective operation in a heterogeneous environment. We
discuss and evaluate four algorithms that are non-clairvoyant, i.e.,
they do not know in advance the computation and communication costs.
On the one hand, Binomial-stat and Fibonacci-stat are static algorithms that decide in
advance which operations will be reduced, without adapting to the
environment; they were originally defined for homogeneous settings. On
the other hand, Tree-dyn and Non-Commut-Tree-dyn are fully dynamic algorithms, for
commutative or non-commutative reductions. With identical computation
costs, we show that these algorithms are approximation algorithms with
constant or asymptotic ratios. When costs are exponentially
distributed, we perform an analysis of Tree-dyn based on Markov
chains. Finally, we assess the relative performance of all four
non-clairvoyant algorithms with heterogeneous costs through a set of
simulations.
</p>
    </subsection>
    <subsection id="uid49" level="1">
      <bodyTitle>Non-linear divisible loads: There is no free lunch</bodyTitle>
      <p>Divisible Load Theory (DLT) has received a lot of attention in the
past decade. A divisible load is a perfect parallel task, that can
be split arbitrarily and executed in parallel on a set of possibly
heterogeneous resources. The success of DLT is strongly related to
the existence of many optimal resource allocation and scheduling
algorithms, what strongly differs from general scheduling
theory. Moreover, recently, close relationships have been underlined
between DLT, that provides a fruitful theoretical framework for
scheduling jobs on heterogeneous platforms, and MapReduce, that
provides a simple and efficient programming framework to deploy
applications on large scale distributed platforms.</p>
      <p>The success of both have suggested to extend their framework to
non-linear complexity tasks. In this
work <ref xlink:href="#roma-2013-bid51" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we show that both DLT and
MapReduce are better suited to workloads with linear complexity. In
particular, we prove that divisible load theory cannot directly be
applied to quadratic workloads, such as it has been proposed
recently. We precisely state the limits for classical DLT studies
and we review and propose solutions based on a careful preparation
of the dataset and clever data partitioning algorithms. In
particular, through simulations, we show the possible impact of this
approach on the volume of communications generated by MapReduce, in
the context of Matrix Multiplication and Outer Product algorithms.
</p>
    </subsection>
    <subsection id="uid50" level="1">
      <bodyTitle>Direct solvers for sparse linear systems</bodyTitle>
      <p>This work is closely related to the <span class="smallcap" align="left">Mumps</span> solver (see Section <ref xlink:href="#uid29" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>) and was performed in close collaboration with INPT (Toulouse). First, we have pursued the study of low-rank representations to speed-up
sparse direct solvers using the so called BLR (Block Low Rank) format <ref xlink:href="#roma-2013-bid52" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. This work was done in collaboration with LSTC (Livermore Software Technology Corp., USA) and in the
context of a contract with EDF which funded the PhD thesis of Clément Weisbecker at INPT.
We also worked on shared-memory parallelism <ref xlink:href="#roma-2013-bid53" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>
in the context of the PhD thesis of Wissam M. Sid-Lakhdar.
Concerning low-rank
approximations, they were experimented on geophysics
applications <ref xlink:href="#roma-2013-bid54" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> (Helmholtz equations)
in the context of a collaboration with members of the ISTerre and Geoazur laboratories.
The impact of both low-rank compression and shared-memory parallelism
was also studied on electromagnetism problems <ref xlink:href="#roma-2013-bid55" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>,
in collaboration with University of Padova (Italy) and CEDRAT.</p>
      <p>We have started the design and implementation of
a distributed-memory low-rank multifrontal solver.
When computations are faster (thanks to low-rank compression or multithreading within each node),
we observed that communications become critical; we are therefore currently studying the
limits of the communication schemes from the <span class="smallcap" align="left">Mumps</span> approach and
their possible improvements.</p>
      <p>On numerical and industrial aspects, we worked on rank detection
and null space basis computations (in collaboration with CERFACS
and Total/Hutchinson) as well as on improved parallel pivoting strategies
for symmetric indefinite systems, in collaboration
with ESI-Group (see Section <ref xlink:href="#uid62" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>).</p>
    </subsection>
    <subsection id="uid51" level="1">
      <bodyTitle>Push-relabel based algorithms for the maximum transversal problem</bodyTitle>
      <p>In this work <ref xlink:href="#roma-2013-bid56" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we investigate the push-relabel algorithm for solving the problem of finding a maximum cardinality matching in a bipartite graph in the context of the maximum transversal problem. We describe in detail an optimized yet easy-to-implement version of the algorithm and fine-tune its parameters. We also introduce new performance-enhancing techniques. On a wide range of real-world instances, we compare the push-relabel algorithm with state-of-the-art algorithms based on augmenting paths and pseudoflows. We conclude that a carefully tuned push-relabel algorithm is competitive with all known augmenting path-based algorithms, and superior to the pseudoflow-based ones.
</p>
    </subsection>
    <subsection id="uid52" level="1">
      <bodyTitle>Constructing elimination trees for sparse unsymmetric matrices</bodyTitle>
      <p>The elimination tree model for sparse unsymmetric matrices and an algorithm for constructing it have been recently proposed <ref xlink:href="#roma-2013-bid57" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, <ref xlink:href="#roma-2013-bid58" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>.
The construction algorithm has a worst-case time complexity of <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mi>Θ</mi><mo>(</mo><mi>m</mi><mi>n</mi><mo>)</mo></mrow></math></formula> for an <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mi>n</mi><mo>×</mo><mi>n</mi></mrow></math></formula> unsymmetric matrix having <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>m</mi></math></formula> off-diagonal nonzeros. In this work <ref xlink:href="#roma-2013-bid59" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>,
we propose another algorithm that has a worst-case time complexity of <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mi>𝒪</mi><mo>(</mo><mi>m</mi><mo form="prefix">log</mo><mi>n</mi><mo>)</mo></mrow></math></formula>.
We compare the two algorithms experimentally and show that both algorithms are efficient in general.
The algorithm of Eisenstat and Liu is faster in many practical cases, yet there are instances in which there is a significant difference between the running time of the two algorithms in favor of the proposed one.
</p>
    </subsection>
    <subsection id="uid53" level="1">
      <bodyTitle>Semi-matching algorithms for scheduling parallel tasks under resource constraints</bodyTitle>
      <p>In this work <ref xlink:href="#roma-2013-bid60" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we study the problem of minimum makespan scheduling when tasks are restricted to subsets of the processors (resource constraints), and require either one or multiple distinct processors to be executed (parallel tasks).
This problem is related to the minimum makespan scheduling problem on unrelated machines, as well as to the concurrent job shop problem, and it amounts to finding a semi-matching in bipartite graphs or hypergraphs. The problem is known to be NP-complete for bipartite graphs with general vertex (task) weights, and solvable in polynomial time for unweighted graphs with unit weights (i.e., unit-weight tasks).
We prove that the problem is NP-complete for hypergraphs even in the unweighted case.
We design several greedy algorithms of low complexity to solve two versions of the problem, and assess their performance through a set of exhaustive simulations.
Even though there is no approximation guarantee for these low-complexity algorithms, they return solutions close to the optimal (or a known lower bound) in average. </p>
    </subsection>
    <subsection id="uid54" level="1">
      <bodyTitle>Maximum cardinality bipartite matching algorithms on GPUs</bodyTitle>
      <p>In two studies <ref xlink:href="#roma-2013-bid61" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, <ref xlink:href="#roma-2013-bid62" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we propose, develop, and evaluate maximum cardinality matching algorithms from two different families (called push-relabel and augmenting-path based) on GPUs.
The problem of finding a maximum cardinality matching in bipartite graphs
has applications in computer science, scientific computing, bioinformatics, and other areas.
To the best of our knowledge, the proposed algorithms are the first investigation of the push-relabel and augmenting-path based on GPUs/
We compare the proposed algorithms with serial and multicore implementations from the literature on a large set of real-life problems where in majority of the cases one of our GPU-accelerated algorithms is demonstrated to be faster than both the sequential and multicore implementations.
</p>
    </subsection>
    <subsection id="uid55" level="1">
      <bodyTitle>Analysis of partitioning models and metrics in parallel sparse matrix-vector multiplication</bodyTitle>
      <p>Graph/hypergraph partitioning models and methods have been successfully used to minimize the communication among processors in several parallel computing applications.
Parallel sparse matrix-vector multiplication (SpMxV) is one of the representative applications that renders these models and methods indispensable in many scientific computing contexts.
In this work <ref xlink:href="#roma-2013-bid63" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, <ref xlink:href="#roma-2013-bid64" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we investigate the interplay of the partitioning metrics and execution times of SpMxV implementations in three libraries: Trilinos, PETSc, and an in-house one.
We carry out experiments with up to 512 processors and investigate the results with regression analysis.
Our experiments show that the partitioning metrics influence the performance greatly in a distributed memory setting.
The regression analyses demonstrate which metric is the most influential for the execution time of the libraries.
</p>
    </subsection>
    <subsection id="uid56" level="1">
      <bodyTitle>On partitioning and reordering problems in a hierarchically parallel hybrid linear solver</bodyTitle>
      <p>PDSLin is a general-purpose algebraic parallel hybrid (direct/iterative) linear solver based on the Schur complement method.
The most challenging step of the solver is the computation of a preconditioner based on the global Schur complement.
Efficient parallel computation of the preconditioner gives rise to partitioning problems with sophisticated constraints and objectives.
In this work <ref xlink:href="#roma-2013-bid65" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we identify two such problems and propose hypergraph partitioning methods to address them. The first problem is to balance the workloads associated with different subdomains to compute the preconditioner.
We first formulate an objective function and a set of constraints to model the preconditioner computation time.
Then, to address these complex constraints, we propose a recursive hypergraph bisection method.
The second problem is to improve the data locality during the parallel solution of a sparse triangular system with multiple sparse right-hand sides.
We carefully analyze the objective function and show that it can be well approximated by a standard hypergraph partitioning method.
Moreover, an ordering compatible with a post ordering of the subdomain elimination tree is shown to be very effective in preserving locality.
To evaluate the two proposed methods in practice, we present experimental results using linear systems arising from some applications of our interest.
First, we show that in comparison to a commonly-used nested graph dissection method, the proposed recursive hypergraph partitioning method reduces the preconditioner construction time, especially when the number of subdomains is moderate.
This is the desired result since PDSLin is based on a two-level parallelization to keep the number of subdomains small by assigning multiple processors to each subdomain.
We also show that our second proposed hypergraph method improves the data locality during the sparse triangular solution and reduces the solution time.
Moreover, we show that partitioning time can be greatly reduced while maintaining its quality by removing quasi-dense rows from the solution vectors.
</p>
    </subsection>
    <subsection id="uid57" level="1">
      <bodyTitle>UMPA: A Multi-objective, multi-level partitioner for communication minimization</bodyTitle>
      <p>In this work <ref xlink:href="#roma-2013-bid66" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>,
we propose a directed hypergraph model and a refinement heuristic to distribute communicating tasks among the processing units in a distributed memory setting.
The aim is to achieve load balance and minimize the maximum data sent by a processing unit.
We also take two other communication metrics into account with a tie-breaking scheme.
With this approach, task distributions causing an excessive use of network or a bottleneck processor which participates to almost all of the communication are avoided.
We show on a large number of problem instances that our model improves the maximum data sent by a processor up to 34% for parallel environments with 4, 16, 64, and 256 processing units compared to the state of the art which only minimizes the total communication volume.
</p>
    </subsection>
    <subsection id="uid58" level="1">
      <bodyTitle>A Partitioning-based divisive clustering technique for maximizing the modularity</bodyTitle>
      <p>In this work <ref xlink:href="#roma-2013-bid67" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we present a new graph clustering algorithm aimed at obtaining
clusterings of high modularity. The algorithm pursues a divisive
clustering approach and uses established graph partitioning
algorithms and techniques to compute recursive bipartitions of the
input as well as to refine clusters. Experimental evaluation shows
that the modularity scores obtained compare favorably to many
previous approaches. In the majority of test cases, the algorithm
outperformed the best known alternatives. In particular, among 13
problem instances common in the literature, the proposed algorithm
improves the best known modularity in 9 cases.
</p>
    </subsection>
    <subsection id="uid59" level="1">
      <bodyTitle>Randomized matching heuristics with quality guarantees on shared memory parallel computers</bodyTitle>
      <p>In this work <ref xlink:href="#roma-2013-bid68" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we propose two heuristics for the bipartite matching problem that are amenable to shared-memory parallelization.
The first heuristic is very intriguing from parallelization perspective.
It has no significant algorithmic synchronization overhead and no conflict resolution is needed across threads. We show that this heuristic has an approximation ratio of around 0.632.
The second heuristic is designed to obtain a larger matching by employing the well-known Karp-Sipser heuristic on a judiciously chosen subgraph of the original graph.
We show that the Karp-Sipser heuristic always finds a maximum cardinality matching in the chosen subgraph.
Although the Karp-Sipser heuristic is hard to parallelize for general graphs, we exploit the structure of the selected subgraphs to propose a specialized implementation which demonstrates a very good scalability.
Based on our experiments and theoretical evidence, we conjecture that this second heuristic obtains matchings with cardinality of at least 0.866 of the maximum cardinality.
We discuss parallel implementations of the proposed heuristics on shared memory systems. Experimental results, for demonstrating speed-ups and verifying the theoretical results in practice, are provided.
</p>
    </subsection>
    <subsection id="uid60" level="1">
      <bodyTitle>On the minimum edge cover and vertex partition by quasi-cliques problems</bodyTitle>
      <p>A <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>γ</mi></math></formula>-quasi-clique in a simple undirected graph is a set of vertices which induces a subgraph with the edge density of at least <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>γ</mi></math></formula> for <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mn>0</mn><mo>&lt;</mo><mi>γ</mi><mo>&lt;</mo><mn>1</mn></mrow></math></formula>.
A cover of a graph by <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>γ</mi></math></formula>-quasi-cliques is a set of <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>γ</mi></math></formula>-quasi-cliques where each edge of the graph is contained in at least one quasi-clique.
The minimum cover by <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>γ</mi></math></formula>-quasi-cliques problem asks for a <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>γ</mi></math></formula>-quasi-clique cover with the minimum number of quasi-cliques. A partition of a graph by <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>γ</mi></math></formula>-quasi-cliques is a set of <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>γ</mi></math></formula>-quasi-cliques where each vertex of the graph belongs to exactly one quasi-clique.
The minimum partition by <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>γ</mi></math></formula>-quasi-cliques problem asks for a vertex partition by <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>γ</mi></math></formula>-quasi-cliques with the minimum number of quasi-cliques.
In this work <ref xlink:href="#roma-2013-bid69" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we show that the decision versions of the minimum cover and partition by <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>γ</mi></math></formula>-quasi-cliques problems are NP-complete for any fixed <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>γ</mi></math></formula> satisfying <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mn>0</mn><mo>&lt;</mo><mi>γ</mi><mo>&lt;</mo><mn>1</mn></mrow></math></formula>.</p>
    </subsection>
  </resultats>
  <contrats id="uid61">
    <bodyTitle>Bilateral Contracts and Grants with Industry</bodyTitle>
    <subsection id="uid62" level="1">
      <bodyTitle>Bilateral Contracts with Industry</bodyTitle>
      <p>Related to evolutions of the <span class="smallcap" align="left">Mumps</span> solver (see Section <ref xlink:href="#uid29" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>), and in order to
continue funding two engineers while working on the
design of a consortium of industrial users, we worked on
the following contracts with industry, that were
managed by CERFACS and INPT, respectively:</p>
      <simplelist>
        <li id="uid63">
          <p noindent="true">Total/Hutchinson.
In this contract, we worked more specifically on numerical aspects related
to rank detection and null-space computations. This feature will be available
in a future version of the solver.</p>
        </li>
        <li id="uid64">
          <p noindent="true">ESI-Group. We worked on modified pivoting strategies
for hard symmetric indefinite problems. The proposed solutions could be
validated by the industrial partner. This feature will be available in
the next release of our package.</p>
        </li>
      </simplelist>
    </subsection>
  </contrats>
  <partenariat id="uid65">
    <bodyTitle>Partnerships and Cooperations</bodyTitle>
    <subsection id="uid66" level="1">
      <bodyTitle>National Initiatives</bodyTitle>
      <subsection id="uid67" level="2">
        <bodyTitle>ANR</bodyTitle>
        <descriptionlist>
          <label>ANR White Project <span class="smallcap" align="left">Rescue</span> (2010-2014), 4 years.</label>
          <li id="uid68">
            <p noindent="true">The ANR White Project <span class="smallcap" align="left">Rescue</span> was launched in November 2010, for a duration of 48 months.
It gathers three Inria partners (<span class="smallcap" align="left">Roma</span>, Grand-Large and Hiepacs) and is led by <span class="smallcap" align="left">Roma</span>.
The main objective of the project is to develop new algorithmic techniques and software
tools to solve the <i>exascale resilience problem</i>. Solving this
problem implies a departure from current approaches,
and calls for yet-to-be-discovered algorithms, protocols and software tools.</p>
            <p>This proposed research follows three main research thrusts. The first thrust deals with
novel <i>checkpoint protocols</i>. The second
thrust entails the development of novel <i>execution models</i>, i.e.,
accurate stochastic models to predict (and, in turn, optimize) the
expected performance (execution time or throughput) of large-scale
parallel scientific applications. In the third thrust, we will develop
novel <i>parallel algorithms</i> for scientific numerical kernels.</p>
          </li>
        </descriptionlist>
        <descriptionlist>
          <label>ANR Project <span class="smallcap" align="left">Solhar</span> (2013-2017), 4 years.</label>
          <li id="uid69">
            <p noindent="true">The ANR Project <span class="smallcap" align="left">Solhar</span> was launched in November 2013, for a
duration of 48 months. It gathers five academic partners (the
HiePACS, Cepage, <span class="smallcap" align="left">Roma</span> and Runtime Inria project-teams, and
CNRS-IRIT) and two industrial partners (CEA/CESTA and EADS-IW). This
project aims at studying and designing algorithms and parallel
programming models for implementing direct methods for the solution
of sparse linear systems on emerging computers equipped with
accelerators.</p>
            <p>The proposed research is organized along three distinct research
thrusts. The first objective deals with linear algebra kernels
suitable for heterogeneous computing platforms. The second one
focuses on runtime systems to provide efficient and robust
implementation of dense linear algebra algorithms. The third one is
concerned with scheduling this particular application on a
heterogeneous and dynamic environment.</p>
          </li>
        </descriptionlist>
      </subsection>
      <subsection id="uid70" level="2">
        <bodyTitle>Inria Project Lab C2S@Exa - Computer and Computational Scienecs at Exascale</bodyTitle>
        <participants>
          <person key="PASUSERID">
            <firstname>Olivier</firstname>
            <lastname>Aumage</lastname>
            <moreinfo>RUNTIME project-team, Inria Bordeaux - Sud-Ouest</moreinfo>
          </person>
          <person key="PASUSERID">
            <firstname>Jocelyne</firstname>
            <lastname>Erhel</lastname>
            <moreinfo>SAGE project-team, Inria Rennes - Bretagne Atlantique</moreinfo>
          </person>
          <person key="PASUSERID">
            <firstname>Philippe</firstname>
            <lastname>Helluy</lastname>
            <moreinfo>TONUS project-team, Inria Nancy - Grand-Est</moreinfo>
          </person>
          <person key="PASUSERID">
            <firstname>Laura</firstname>
            <lastname>Grigori</lastname>
            <moreinfo>ALPINE project-team, Inria Saclay - Île-de-France</moreinfo>
          </person>
          <person key="PASUSERID">
            <firstname>Jean-Yves</firstname>
            <lastname>L’excellent</lastname>
            <moreinfo>ROMA project-team, Inria Grenoble - Rhône-Alpes</moreinfo>
          </person>
          <person key="PASUSERID">
            <firstname>Thierry</firstname>
            <lastname>Gautier</lastname>
            <moreinfo>MOAIS project-team, Inria Grenoble - Rhône-Alpes</moreinfo>
          </person>
          <person key="PASUSERID">
            <firstname>Luc</firstname>
            <lastname>Giraud</lastname>
            <moreinfo>HIEPACS project-team, Inria Bordeaux - Sud-Ouest</moreinfo>
          </person>
          <person key="PASUSERID">
            <firstname>Michel</firstname>
            <lastname>Kern</lastname>
            <moreinfo>POMDAPI project-team, Inria Paris - Rocquencourt</moreinfo>
          </person>
          <person key="PASUSERID">
            <firstname>Stéphane</firstname>
            <lastname>Lanteri</lastname>
            <moreinfo>Coordinator of the project</moreinfo>
          </person>
          <person key="PASUSERID">
            <firstname>François</firstname>
            <lastname>Pellegrini</lastname>
            <moreinfo>BACCHUS project-team, Inria Bordeaux - Sud-Ouest</moreinfo>
          </person>
          <person key="PASUSERID">
            <firstname>Christian</firstname>
            <lastname>Perez</lastname>
            <moreinfo>AVALON project-team, Inria Grenoble - Rhône-Alpes</moreinfo>
          </person>
          <person key="graal-2005-id18145">
            <firstname>Frédéric</firstname>
            <lastname>Vivien</lastname>
            <moreinfo>ROMA project-team, Inria Grenoble - Rhône-Alpes</moreinfo>
          </person>
        </participants>
        <p>Since January 2013, the team is participating to the C2S@Exa
<ref xlink:href="http://www-sop.inria.fr/c2s_at_exa" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>www-sop.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>c2s_at_exa</ref> Inria Project Lab (IPL).
This national initiative aims at the development of numerical modeling
methodologies that fully exploit the processing capabilities of modern
massively parallel architectures in the context of a number of
selected applications related to important scientific and
technological challenges for the quality and the security of life in
our society. At the current state of the art in technologies and
methodologies, a multidisciplinary approach is required to overcome
the challenges raised by the development of highly scalable numerical
simulation software that can exploit computing platforms offering
several hundreds of thousands of cores. Hence, the main objective of
C2S@Exa is the establishment of a continuum of expertise in the
computer science and numerical mathematics domains, by gathering
researchers from Inria project-teams whose research and development
activities are tightly linked to high performance computing issues in
these domains. More precisely, this collaborative effort involves
computer scientists that are experts of programming models,
environments and tools for harnessing massively parallel systems,
algorithmists that propose algorithms and contribute to generic
libraries and core solvers in order to take benefit from all the
parallelism levels with the main goal of optimal scaling on very large
numbers of computing entities and, numerical mathematicians that are
studying numerical schemes and scalable solvers for systems of partial
differential equations in view of the simulation of very large-scale
problems.</p>
      </subsection>
    </subsection>
    <subsection id="uid71" level="1">
      <bodyTitle>European Initiatives</bodyTitle>
      <subsection id="uid72" level="2">
        <bodyTitle>FP7 Projects</bodyTitle>
        <subsection id="uid73" level="3">
          <bodyTitle>SCORPIO</bodyTitle>
          <sanspuceslist>
            <li id="uid74">
              <p noindent="true">Type: COOPERATION</p>
            </li>
            <li id="uid75">
              <p noindent="true">Instrument: Specific Targeted Research Project</p>
            </li>
            <li id="uid76">
              <p noindent="true">Duration: June 2013 - May 2016</p>
            </li>
            <li id="uid77">
              <p noindent="true">Coordinator: Nikolaos Bellas</p>
            </li>
            <li id="uid78">
              <p noindent="true">Partners: CERTH, Greece; EPFL, Switzerland; RWTH Aachen
University, Germany; The Queen’s University of Belfast, UK; IMEC,
Belgium</p>
            </li>
            <li id="uid79">
              <p noindent="true">Inria contact: Frédéric Vivien</p>
            </li>
            <li id="uid80">
              <p noindent="true">Abstract: A new computing paradigm that exploits uncertainty to design systems that are energy-efficient and scale gracefully under hardware errors by operating below the nominal operating point, in a controlled way, without inducing massive or fatal errors.</p>
            </li>
          </sanspuceslist>
        </subsection>
      </subsection>
    </subsection>
    <subsection id="uid81" level="1">
      <bodyTitle>International Initiatives</bodyTitle>
      <subsection id="uid82" level="2">
        <bodyTitle>Inria Associate Teams</bodyTitle>
        <p>The <span class="smallcap" align="left">Aloha</span> associate-team is a joint project of the <span class="smallcap" align="left">Roma</span> team and of
the Information and Computer science Department of the University of
Hawai`i (UH) at Mānoa, Honolulu, USA. Building on a vast array of
theoretical techniques and expertise developed in the field of
parallel and distributed computing, and more particularly application
<i>scheduling</i>, we tackle database questions from a fresh
perspective. To this end, this proposal includes:</p>
        <simplelist>
          <li id="uid83">
            <p noindent="true">a group that specializes in database systems research and who
has both industrial and academic experience, the group of Lipyeow
Lim (UH);</p>
          </li>
          <li id="uid84">
            <p noindent="true">a group that specializes in practical aspects of scheduling
problems and in simulation for emerging platforms and applications,
and who has a long experience of multidisciplinary research, the
group of Henri Casanova (UH);</p>
          </li>
          <li id="uid85">
            <p noindent="true">a group that specializes in the theoretical aspects of
scheduling problems and resource management (the <span class="smallcap" align="left">Roma</span> team).</p>
          </li>
        </simplelist>
        <p>The research work focuses on the following three thrusts:</p>
        <orderedlist>
          <li id="uid86">
            <p noindent="true">Online, multi-criteria query optimization</p>
          </li>
          <li id="uid87">
            <p noindent="true">Fault-Tolerance for distributed databases</p>
          </li>
          <li id="uid88">
            <p noindent="true">Query scheduling for distributed databases</p>
          </li>
        </orderedlist>
      </subsection>
    </subsection>
    <subsection id="uid89" level="1">
      <bodyTitle>International Research Visitors</bodyTitle>
      <subsection id="uid90" level="2">
        <bodyTitle>Visits of International Scientists</bodyTitle>
        <p>Ana Gainaru (from UIUC and Argonne National Laboratory) has visited our team for three weeks in October and November 2013.
She initiated a collaboration with Guillaume Aupy, Anne Benoit, Franck Cappello and Yves Robert
on scheduling I/O activity to avoid congestion and increase performance when
executing several scientific applications on large-scale platforms.</p>
      </subsection>
      <subsection id="uid91" level="2">
        <bodyTitle>Visits to International Teams</bodyTitle>
        <p>Yves Robert has been appointed as a visiting scientist by the ICL laboratory (headed by Jack Dongarra)
at the University of Tennessee Knoxville. He collaborates with several ICL researchers on high-performance linear algebra
and resilience methods at scale.</p>
      </subsection>
    </subsection>
  </partenariat>
  <diffusion id="uid92">
    <bodyTitle>Dissemination</bodyTitle>
    <subsection id="uid93" level="1">
      <bodyTitle>Scientific Animation</bodyTitle>
      <descriptionlist>
        <label>Anne Benoit</label>
        <li id="uid94">
          <p noindent="true">is an associate editor of the <i>Journal of
Parallel and Distributed Computing (JPDC)</i>. She was the workshops
co-chair of ICPP 2013. She was a member of the program
committees of the following conferences and workshops: HiPC 2013, ICPE 2013,
CCGrid 2013, IPDPS 2013, CLOSER 2013, HCW 2013, IGCC 2013.</p>
        </li>
        <label>Jean-Yves L'Excellent</label>
        <li id="uid95">
          <p noindent="true">was a member of the program committees of
Renpar'13 and ICPP'2013, where he was also local arrangements
co-chair. He co-organized the third MUMPS Users days, EDF, Clamart,
May 29-30, 2013.</p>
        </li>
        <label>Loris Marchal</label>
        <li id="uid96">
          <p noindent="true">is or was a member of the program committees of
IPDPS'2013, ICPP'2013, and IPDPS'2014.</p>
        </li>
        <label>Yves Robert</label>
        <li id="uid97">
          <p noindent="true">is an associate editor of <i>IJHPCA</i>,
<i>IJGUC</i> and <i>JOCS</i>. He was Program Chair of ICPP 2013
(Int. Conference on Parallel Processing) and of HiPC 2013
(Int. Conference on High Performance Computing). He is or was a
member of the program committees of the following conferences and
workshops: EduPar 2013, FTXS 2013, ICCS 2013, IGCC 2013, ISC tutorials 2013
ISCIS 2013 and SC 2013.</p>
        </li>
        <label>Bora Uçar</label>
        <li id="uid98">
          <p noindent="true">was the chair of the applications track of ICPP 2013.
He was a member of the program committee for IPDPS 2013, PCO 2013 (a workshop of IPDPS), and PPAM.</p>
        </li>
        <label>Frédéric Vivien</label>
        <li id="uid99">
          <p noindent="true">is an associate editor of <i>Parallel Computing</i>.
Frédéric Vivien was program vice-chair, for the algorithms track, of
IPDPS 2013, is program vice-chair, for the algorithms track, of
HiPC 2014, and is co-responsible of the stream “Algorithmes
distribués, multi-agents et calcul parallèle” for ROADEF 2014.</p>
          <p>He is or was a member of the program committee of the following
conferences and workshops: SC'14, IPDPS 2014, ComPAS'2014, PDP 2014,
SC'13, EduPDHPC, ICPP 2013, EduPar-13, PDP 2013, ROADEF 2013,
RenPar'21 - ComPAS'2013.</p>
        </li>
      </descriptionlist>
    </subsection>
    <subsection id="uid100" level="1">
      <bodyTitle>Teaching - Supervision - Juries</bodyTitle>
      <subsection id="uid101" level="2">
        <bodyTitle>Teaching</bodyTitle>
        <sanspuceslist>
          <li id="uid102">
            <p noindent="true">Licence: Anne Benoit, Systèmes et Réseaux, 48h, L3, École normale supérieure de Lyon, France.</p>
          </li>
          <li id="uid103">
            <p noindent="true">Licence: Yves Robert, Algorithmes, 48h, L3, École normale supérieure de Lyon, France.</p>
          </li>
          <li id="uid104">
            <p noindent="true">Master: Frédéric Vivien, Algorithmique et Programmation
Parallèles, 36 h, M1, École normale supérieure de Lyon, France.</p>
          </li>
          <li id="uid105">
            <p noindent="true">Master: Frédéric Vivien, Algorithms for High-Performance Computing Platforms, 36 h, M2, École normale supérieure de Lyon, France.</p>
          </li>
          <li id="uid106">
            <p noindent="true">Master: Bora Uçar, Combinatorial Scientific Computing, 36 h, M2, École normale supérieure de Lyon, France.</p>
          </li>
        </sanspuceslist>
      </subsection>
      <subsection id="uid107" level="2">
        <bodyTitle>Supervision</bodyTitle>
        <sanspuceslist>
          <li id="uid108">
            <p noindent="true">PhD in progress: Guillaume Aupy, Multi-criteria scheduling on volatile platforms, September 1, 2011, Anne Benoit and Yves Robert.</p>
          </li>
          <li id="uid109">
            <p noindent="true">PhD in progress: Dounia Zaidouni, Performance and execution models for exascale applications in failure-prone
environments, October 1, 2011, Frédéric Vivien and Yves Robert.</p>
          </li>
          <li id="uid110">
            <p noindent="true">PhD in progress: Wissam M. Sid-Lakhdar, Exploitation of multicore architectures in the resolution of sparse linear systems by multifrontal methods,
October 1, 2011, Jean-Yves L'Excellent.</p>
          </li>
          <li id="uid111">
            <p noindent="true">PhD in progress: Julien Herrmann, Numerical algorithms for large-scale platforms, September 1, 2012, Loris Marchal and Yves Robert.</p>
          </li>
        </sanspuceslist>
      </subsection>
      <subsection id="uid112" level="2">
        <bodyTitle>Juries</bodyTitle>
        <sanspuceslist>
          <li id="uid113">
            <p noindent="true">PhD: Anne Benoit was a “rapporteur” and member of the jury for the PhD defense
of Przemysław Uznański, Bordeaux, France, October 11, 2013.</p>
          </li>
          <li id="uid114">
            <p noindent="true">PhD: Jean-Yves L'Excellent was a “rapporteur” and member of the jury for the PhD defense of Sethy Montan, University Pierre et Marie Curie, France, October 17, 2013.</p>
          </li>
          <li id="uid115">
            <p noindent="true">PhD: Yves Robert was a “rapporteur” and member of the jury for the PhD defense
of Amal Khabou, University Orsay Paris XI, Saclay, France, on February 11, 2013.</p>
          </li>
          <li id="uid116">
            <p noindent="true">PhD: Yves Robert was a member of the jury for the PhD defense
of Dimitris Letsios, University of Evry Val d'Essonne, Paris, France, on October 22, 2013.</p>
          </li>
          <li id="uid117">
            <p noindent="true">Habilitation: Yves Robert chaired the jury for the <i>Habilitation à Diriger des Recherches</i>
of Laurent Lefèvre, ENS Lyon, France, November 22, 2013.</p>
          </li>
          <li id="uid118">
            <p noindent="true">PhD: Frédéric Vivien was a member of the jury for the PhD defense
of Javier Celaya, University of Zaragoza, Zaragoza, Spain,
September 6, 2013.</p>
          </li>
          <li id="uid119">
            <p noindent="true">PhD: Frédéric Vivien was an “expert” for the PhD defense of
Marco Meoni, EPFL, Lausanne, Switzerland, December 11, 2013.</p>
          </li>
          <li id="uid120">
            <p noindent="true">PhD: Bora Uçar was an “evaluator” for the PhD defense of
Bastian Onne Fagginger Auer, Department of Mathematics, Utrecht University, the Netherlands, August 26 2013.</p>
          </li>
        </sanspuceslist>
      </subsection>
    </subsection>
  </diffusion>
  <biblio id="bibliography" html="bibliography" numero="10" titre="Bibliography">
    
    <biblStruct id="roma-2013-bid2" type="book" rend="year" n="cite:benoit:hal-00908448">
      <identifiant type="hal" value="hal-00908448"/>
      <monogr x-international-audience="yes">
        <title level="m">A Guide to Algorithm Design: Paradigms, Methods, and Complexity Analysis</title>
        <title level="s">Applied Algorithms and Data Structures series</title>
        <author>
          <persName key="graal-2005-id18164">
            <foreName>Anne</foreName>
            <surname>Benoit</surname>
            <initial>A.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
        </author>
        <imprint>
          <publisher>
            <orgName>Chapman &amp; Hall/CRC</orgName>
          </publisher>
          <dateStruct>
            <month>August</month>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">380</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00908448" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00908448</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid49" type="article" rend="year" n="cite:aupy:hal-00763388">
      <identifiant type="doi" value="10.1002/cpe.2889"/>
      <identifiant type="hal" value="hal-00763388"/>
      <analytic>
        <title level="a">Reclaiming the energy of a schedule: models and algorithms</title>
        <author>
          <persName key="graal-2011-idp140410991004288">
            <foreName>Guillaume</foreName>
            <surname>Aupy</surname>
            <initial>G.</initial>
          </persName>
          <persName key="graal-2005-id18164">
            <foreName>Anne</foreName>
            <surname>Benoit</surname>
            <initial>A.</initial>
          </persName>
          <persName key="graal-2008-id18982">
            <foreName>Fanny</foreName>
            <surname>Dufossé</surname>
            <initial>F.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" id="rid00483">
        <idno type="issn">1532-0626</idno>
        <title level="j">Concurrency and Computation: Practice and Experience</title>
        <imprint>
          <biblScope type="volume">25</biblScope>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">1505-1523</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00763388" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00763388</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid73" type="article" rend="year" n="cite:aupy:hal-00908446">
      <identifiant type="doi" value="10.1016/j.jpdc.2013.10.010"/>
      <identifiant type="hal" value="hal-00908446"/>
      <analytic>
        <title level="a">Checkpointing algorithms and fault prediction</title>
        <author>
          <persName key="graal-2011-idp140410991004288">
            <foreName>Guillaume</foreName>
            <surname>Aupy</surname>
            <initial>G.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
          <persName key="graal-2011-idp140410991039440">
            <foreName>Dounia</foreName>
            <surname>Zaidouni</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" id="rid01326">
        <idno type="issn">0743-7315</idno>
        <title level="j">Journal of Parallel and Distributed Computing</title>
        <imprint>
          <dateStruct>
            <month>November</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00908446" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00908446</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid74" type="article" rend="year" n="cite:baboulin:hal-00908496">
      <identifiant type="doi" value="10.1145/2427023.2427025"/>
      <identifiant type="hal" value="hal-00908496"/>
      <analytic>
        <title level="a">Accelerating linear system solutions using randomization technique</title>
        <author>
          <persName key="grand-large-2010-id59617">
            <foreName>Marc</foreName>
            <surname>Baboulin</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>Jack</foreName>
            <surname>Dongarra</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Julien</foreName>
            <surname>Herrmann</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Stanimire</foreName>
            <surname>Tomov</surname>
            <initial>S.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" id="rid00032">
        <idno type="issn">0098-3500</idno>
        <title level="j">ACM Transactions on Mathematical Software</title>
        <imprint>
          <biblScope type="volume">39</biblScope>
          <biblScope type="number">2</biblScope>
          <dateStruct>
            <month>February</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00908496" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00908496</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid48" type="article" rend="year" n="cite:benoit:hal-00926178">
      <identifiant type="doi" value="10.1145/2501654.2501664"/>
      <identifiant type="hal" value="hal-00926178"/>
      <analytic>
        <title level="a">A Survey of Pipelined Workflow Scheduling: Models and Algorithms</title>
        <author>
          <persName key="graal-2005-id18164">
            <foreName>Anne</foreName>
            <surname>Benoit</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>V. Umit</foreName>
            <surname>Catalyurek</surname>
            <initial>V. U.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="moais-2007-id19037">
            <foreName>Erik</foreName>
            <surname>Saule</surname>
            <initial>E.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" id="rid00004">
        <idno type="issn">0360-0300</idno>
        <title level="j">ACM Computing Surveys</title>
        <imprint>
          <biblScope type="volume">45</biblScope>
          <biblScope type="number">4</biblScope>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00926178" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00926178</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid47" type="article" rend="year" n="cite:benoit:hal-00926146">
      <identifiant type="doi" value="10.1016/j.future.2012.12.015"/>
      <identifiant type="hal" value="hal-00926146"/>
      <analytic>
        <title level="a">Scheduling linear chain streaming applications on heterogeneous systems with failures</title>
        <author>
          <persName key="graal-2005-id18164">
            <foreName>Anne</foreName>
            <surname>Benoit</surname>
            <initial>A.</initial>
          </persName>
          <persName key="graal-2007-id19010">
            <foreName>Alexandru</foreName>
            <surname>Dobrila</surname>
            <initial>A.</initial>
          </persName>
          <persName key="graal-2005-id18242">
            <foreName>Jean-Marc</foreName>
            <surname>Nicod</surname>
            <initial>J.-M.</initial>
          </persName>
          <persName key="graal-2005-id18256">
            <foreName>Laurent</foreName>
            <surname>Philippe</surname>
            <initial>L.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" id="rid00695">
        <idno type="issn">0167-739X</idno>
        <title level="j">Future Generation Computer Systems</title>
        <imprint>
          <biblScope type="volume">29</biblScope>
          <biblScope type="number">5</biblScope>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">1140-1151</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00926146" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00926146</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid46" type="article" rend="year" n="cite:benoit:hal-00926123">
      <identifiant type="doi" value="10.1016/j.jpdc.2013.02.009"/>
      <identifiant type="hal" value="hal-00926123"/>
      <analytic>
        <title level="a">Reliability and performance optimization of pipelined real-time systems</title>
        <author>
          <persName key="graal-2005-id18164">
            <foreName>Anne</foreName>
            <surname>Benoit</surname>
            <initial>A.</initial>
          </persName>
          <persName key="graal-2008-id18982">
            <foreName>Fanny</foreName>
            <surname>Dufossé</surname>
            <initial>F.</initial>
          </persName>
          <persName key="popart-2005-id18078">
            <foreName>Alain</foreName>
            <surname>Girault</surname>
            <initial>A.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" id="rid01326">
        <idno type="issn">0743-7315</idno>
        <title level="j">Journal of Parallel and Distributed Computing</title>
        <imprint>
          <biblScope type="volume">73</biblScope>
          <biblScope type="number">6</biblScope>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">851-865</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00926123" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00926123</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid45" type="article" rend="year" n="cite:benoit:hal-00800083">
      <identifiant type="hal" value="hal-00800083"/>
      <analytic>
        <title level="a">Computing the throughput of probabilistic and replicated streaming applications</title>
        <author>
          <persName key="graal-2005-id18164">
            <foreName>Anne</foreName>
            <surname>Benoit</surname>
            <initial>A.</initial>
          </persName>
          <persName key="graal-2006-id18623">
            <foreName>Matthieu</foreName>
            <surname>Gallet</surname>
            <initial>M.</initial>
          </persName>
          <persName key="mescal-2005-id18078">
            <foreName>Bruno</foreName>
            <surname>Gaujal</surname>
            <initial>B.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" id="rid00110">
        <idno type="issn">0178-4617</idno>
        <title level="j">Algorithmica</title>
        <imprint>
          <dateStruct>
            <month>March</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00800083" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00800083</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct subtype="nonparu-n" id="roma-2013-bid79" type="incollection" rend="year" n="cite:benoit:hal-00763372">
      <identifiant type="hal" value="hal-00763372"/>
      <analytic>
        <title level="a">Scheduling for Large-Scale Systems</title>
        <author>
          <persName key="graal-2005-id18164">
            <foreName>Anne</foreName>
            <surname>Benoit</surname>
            <initial>A.</initial>
          </persName>
          <persName key="graal-2005-id18473">
            <foreName>Loris</foreName>
            <surname>Marchal</surname>
            <initial>L.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="graal-2009-id59570">
            <foreName>Bora</foreName>
            <surname>Uçar</surname>
            <initial>B.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <editor role="editor">
          <persName>
            <foreName>Teo</foreName>
            <surname>Gonzalez</surname>
            <initial>T.</initial>
          </persName>
          <persName>
            <foreName>Jorge L.</foreName>
            <surname>Díaz Herrera</surname>
            <initial>J. L.</initial>
          </persName>
        </editor>
        <title level="m">The Computing Handbook Set, vol. 1</title>
        <imprint>
          <publisher>
            <orgName>Chapman and Hall/CRC Press</orgName>
          </publisher>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00763372" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00763372</ref>
        </imprint>
      </monogr>
      <note type="bnote">To appear</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid44" type="article" rend="year" n="cite:benoit:hal-00926105">
      <identifiant type="doi" value="10.1142/S0129626413400033"/>
      <identifiant type="hal" value="hal-00926105"/>
      <analytic>
        <title level="a">Assessing the performance of energy-aware mappings</title>
        <author>
          <persName key="graal-2005-id18164">
            <foreName>Anne</foreName>
            <surname>Benoit</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>Rami</foreName>
            <surname>Melhem</surname>
            <initial>R.</initial>
          </persName>
          <persName key="graal-2009-id60733">
            <foreName>Paul</foreName>
            <surname>Renaud-Goud</surname>
            <initial>P.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" id="rid01649">
        <idno type="issn">0129-6264</idno>
        <title level="j">Parallel Processing Letters</title>
        <imprint>
          <biblScope type="volume">23</biblScope>
          <biblScope type="number">2</biblScope>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00926105" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00926105</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid70" type="article" rend="year" n="cite:benoit:hal-00763321">
      <identifiant type="doi" value="10.1007/s00224-012-9426-z"/>
      <identifiant type="hal" value="hal-00763321"/>
      <analytic>
        <title level="a">Static strategies for worksharing with unrecoverable interruption</title>
        <author>
          <persName key="graal-2005-id18164">
            <foreName>Anne</foreName>
            <surname>Benoit</surname>
            <initial>A.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName>
            <foreName>Arnold</foreName>
            <surname>Rosenberg</surname>
            <initial>A.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" id="rid01955">
        <idno type="issn">1432-4350</idno>
        <title level="j">Theory of Computing Systems</title>
        <imprint>
          <biblScope type="volume">53</biblScope>
          <biblScope type="number">3</biblScope>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">386-423</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00763321" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00763321</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid39" type="article" rend="year" n="cite:bosilca:hal-00908447">
      <identifiant type="doi" value="10.1002/cpe.3173"/>
      <identifiant type="hal" value="hal-00908447"/>
      <analytic>
        <title level="a">Unified Model for Assessing Checkpointing Protocols at Extreme-Scale</title>
        <author>
          <persName>
            <foreName>George</foreName>
            <surname>Bosilca</surname>
            <initial>G.</initial>
          </persName>
          <persName key="graal-2005-id18178">
            <foreName>Aurélien</foreName>
            <surname>Bouteiller</surname>
            <initial>A.</initial>
          </persName>
          <persName key="runtime-2005-id18277">
            <foreName>Élisabeth</foreName>
            <surname>Brunet</surname>
            <initial>É.</initial>
          </persName>
          <persName key="grand-large-2005-id18099">
            <foreName>Franck</foreName>
            <surname>Cappello</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Jack</foreName>
            <surname>Dongarra</surname>
            <initial>J.</initial>
          </persName>
          <persName key="grand-large-2008-id18798">
            <foreName>Amina</foreName>
            <surname>Guermouche</surname>
            <initial>A.</initial>
          </persName>
          <persName key="grand-large-2005-id18208">
            <foreName>Thomas</foreName>
            <surname>Hérault</surname>
            <initial>T.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
          <persName key="graal-2011-idp140410991039440">
            <foreName>Dounia</foreName>
            <surname>Zaidouni</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" id="rid00483">
        <idno type="issn">1532-0626</idno>
        <title level="j">Journal of Concurrency and Computation: Practice and Experience</title>
        <imprint>
          <dateStruct>
            <month>November</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00908447" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00908447</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid38" type="article" rend="year" n="cite:bougeret:hal-00881463">
      <identifiant type="doi" value="10.1177/1094342013505348"/>
      <identifiant type="hal" value="hal-00881463"/>
      <analytic>
        <title level="a">Using group replication for resilience on exascale systems</title>
        <author>
          <persName key="moais-2007-id18692">
            <foreName>Marin</foreName>
            <surname>Bougeret</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>Henri</foreName>
            <surname>Casanova</surname>
            <initial>H.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
          <persName key="graal-2011-idp140410991039440">
            <foreName>Dounia</foreName>
            <surname>Zaidouni</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" id="rid01001">
        <idno type="issn">1094-3420</idno>
        <title level="j">International Journal of High Performance Computing Applications</title>
        <imprint>
          <dateStruct>
            <month>October</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00881463" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00881463</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid35" type="article" rend="year" n="cite:casanova:hal-00923948">
      <identifiant type="hal" value="hal-00923948"/>
      <analytic>
        <title level="a">Mapping Applications on Volatile Resources</title>
        <author>
          <persName>
            <foreName>Henri</foreName>
            <surname>Casanova</surname>
            <initial>H.</initial>
          </persName>
          <persName key="graal-2008-id18982">
            <foreName>Fanny</foreName>
            <surname>Dufossé</surname>
            <initial>F.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" id="rid01001">
        <idno type="issn">1094-3420</idno>
        <title level="j">International Journal of High Performance Computing Applications</title>
        <imprint>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00923948" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00923948</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid66" type="incollection" rend="year" n="cite:catalyurek:hal-00763563">
      <identifiant type="doi" value="10.1090/conm/588/11704"/>
      <identifiant type="hal" value="hal-00763563"/>
      <analytic>
        <title level="a">UMPA: A Multi-objective, multi-level partitioner for communication minimization</title>
        <author>
          <persName>
            <foreName>V. Umit</foreName>
            <surname>Catalyurek</surname>
            <initial>V. U.</initial>
          </persName>
          <persName>
            <foreName>Mehmet</foreName>
            <surname>Deveci</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>Kamer</foreName>
            <surname>Kaya</surname>
            <initial>K.</initial>
          </persName>
          <persName key="graal-2009-id59570">
            <foreName>Bora</foreName>
            <surname>Uçar</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <editor role="editor">
          <persName>
            <foreName>David A.</foreName>
            <surname>Bader</surname>
            <initial>D. A.</initial>
          </persName>
          <persName>
            <foreName>Henning</foreName>
            <surname>Meyerhenke</surname>
            <initial>H.</initial>
          </persName>
          <persName>
            <foreName>Peters</foreName>
            <surname>Sanders</surname>
            <initial>P.</initial>
          </persName>
          <persName>
            <foreName>Dorothea</foreName>
            <surname>Wagner</surname>
            <initial>D.</initial>
          </persName>
        </editor>
        <title level="m">Graph Partitioning and Graph Clustering 2012</title>
        <title level="s">Contemporary Mathematics</title>
        <imprint>
          <biblScope type="volume">588</biblScope>
          <publisher>
            <orgName>AMS</orgName>
          </publisher>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">53-66</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00763563" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00763563</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid67" type="incollection" rend="year" n="cite:catalyurek:hal-00763559">
      <identifiant type="doi" value="10.1090/conm/588/11712"/>
      <identifiant type="hal" value="hal-00763559"/>
      <analytic>
        <title level="a">A Partitioning-based divisive clustering technique for maximizing the modularity</title>
        <author>
          <persName>
            <foreName>V. Umit</foreName>
            <surname>Catalyurek</surname>
            <initial>V. U.</initial>
          </persName>
          <persName>
            <foreName>Kamer</foreName>
            <surname>Kaya</surname>
            <initial>K.</initial>
          </persName>
          <persName key="graal-2011-idp140410990993920">
            <foreName>Johannes</foreName>
            <surname>Langguth</surname>
            <initial>J.</initial>
          </persName>
          <persName key="graal-2009-id59570">
            <foreName>Bora</foreName>
            <surname>Uçar</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <editor role="editor">
          <persName>
            <foreName>D. A.</foreName>
            <surname>Bader</surname>
            <initial>D. A.</initial>
          </persName>
          <persName>
            <foreName>H.</foreName>
            <surname>Meyerhenke</surname>
            <initial>H.</initial>
          </persName>
          <persName>
            <foreName>P.</foreName>
            <surname>Sanders</surname>
            <initial>P.</initial>
          </persName>
          <persName>
            <foreName>D.</foreName>
            <surname>Wagner</surname>
            <initial>D.</initial>
          </persName>
        </editor>
        <title level="m">Graph Partitioning and Graph Clustering 2012</title>
        <title level="s">Contemporary Mathematics</title>
        <imprint>
          <biblScope type="volume">588</biblScope>
          <publisher>
            <orgName>AMS</orgName>
          </publisher>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">171-186</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00763559" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00763559</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid72" type="article" rend="year" n="cite:dongarra:hal-00809770">
      <identifiant type="doi" value="10.1016/j.parco.2013.01.003"/>
      <identifiant type="hal" value="hal-00809770"/>
      <analytic>
        <title level="a">Hierarchical QR factorization algorithms for multi-core clusters</title>
        <author>
          <persName>
            <foreName>Jack</foreName>
            <surname>Dongarra</surname>
            <initial>J.</initial>
          </persName>
          <persName key="scalapplix-2006-id18605">
            <foreName>Mathieu</foreName>
            <surname>Faverge</surname>
            <initial>M.</initial>
          </persName>
          <persName key="grand-large-2005-id18208">
            <foreName>Thomas</foreName>
            <surname>Hérault</surname>
            <initial>T.</initial>
          </persName>
          <persName key="graal-2008-id19057">
            <foreName>Mathias</foreName>
            <surname>Jacquelin</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>Julien</foreName>
            <surname>Langou</surname>
            <initial>J.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" id="rid01648">
        <idno type="issn">0167-8191</idno>
        <title level="j">Parallel Computing</title>
        <imprint>
          <biblScope type="volume">39</biblScope>
          <biblScope type="number">4-5</biblScope>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">212-232</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00809770" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00809770</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid56" type="article" rend="year" n="cite:kaya:hal-00763920">
      <identifiant type="doi" value="10.1016/j.cor.2012.12.009"/>
      <identifiant type="hal" value="hal-00763920"/>
      <analytic>
        <title level="a">Push-relabel based algorithms for the maximum transversal problem</title>
        <author>
          <persName>
            <foreName>Kamer</foreName>
            <surname>Kaya</surname>
            <initial>K.</initial>
          </persName>
          <persName key="graal-2011-idp140410990993920">
            <foreName>Johannes</foreName>
            <surname>Langguth</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Fredrik</foreName>
            <surname>Manne</surname>
            <initial>F.</initial>
          </persName>
          <persName key="graal-2009-id59570">
            <foreName>Bora</foreName>
            <surname>Uçar</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" id="rid00469">
        <idno type="issn">0305-0548</idno>
        <title level="j">Computers &amp; Operations Research</title>
        <imprint>
          <biblScope type="volume">40</biblScope>
          <biblScope type="number">5</biblScope>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">1266-1275</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00763920" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00763920</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid59" type="article" rend="year" n="cite:kaya:inria-00567970">
      <identifiant type="doi" value="10.1137/110825443"/>
      <identifiant type="hal" value="inria-00567970"/>
      <analytic>
        <title level="a">Constructing elimination trees for sparse unsymmetric matrices</title>
        <author>
          <persName>
            <foreName>Kamer</foreName>
            <surname>Kaya</surname>
            <initial>K.</initial>
          </persName>
          <persName key="graal-2009-id59570">
            <foreName>Bora</foreName>
            <surname>Uçar</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" id="rid01827">
        <idno type="issn">0895-4798</idno>
        <title level="j">SIAM Journal on Matrix Analysis and Applications</title>
        <imprint>
          <biblScope type="volume">34</biblScope>
          <biblScope type="number">2</biblScope>
          <dateStruct>
            <month>April</month>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">345-354</biblScope>
          <ref xlink:href="http://hal.inria.fr/inria-00567970" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>inria-00567970</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct subtype="nonparu-n" id="roma-2013-bid71" type="article" rend="year" n="cite:prasad:hal-00764026">
      <identifiant type="hal" value="hal-00764026"/>
      <analytic>
        <title level="a">Literacy for all in parallel and distributed computing: guidelines for an undergraduate core curriculum</title>
        <author>
          <persName>
            <foreName>Sushil</foreName>
            <surname>Prasad</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Anshul</foreName>
            <surname>Gupta</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>Krishna</foreName>
            <surname>Kant</surname>
            <initial>K.</initial>
          </persName>
          <persName>
            <foreName>Andrew</foreName>
            <surname>Lumsdaine</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>David</foreName>
            <surname>Padua</surname>
            <initial>D.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName>
            <foreName>Arnold</foreName>
            <surname>Rosenberg</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>Alan</foreName>
            <surname>Sussman</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>Charles</foreName>
            <surname>Weems</surname>
            <initial>C.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" id="rid02461111111111112">
        <idno type="issn">2277-6702</idno>
        <title level="j">CSI Journal of Computing</title>
        <imprint>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00764026" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00764026</ref>
        </imprint>
      </monogr>
      <note type="bnote">To appear</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid55" type="inproceedings" rend="year" n="cite:amestoy:hal-00924660">
      <identifiant type="hal" value="hal-00924660"/>
      <analytic>
        <title level="a">Shared memory parallelism and low-rank approximation techniques applied to direct solvers in FEM simulation (regular paper)</title>
        <author>
          <persName key="scalapplix-2005-id18472">
            <foreName>Patrick</foreName>
            <surname>Amestoy</surname>
            <initial>P.</initial>
          </persName>
          <persName>
            <foreName>Olivier</foreName>
            <surname>Boiteau</surname>
            <initial>O.</initial>
          </persName>
          <persName key="graal-2008-id18788">
            <foreName>Alfredo</foreName>
            <surname>Buttari</surname>
            <initial>A.</initial>
          </persName>
          <persName key="graal-2009-id60051">
            <foreName>Guillaume</foreName>
            <surname>Joslin</surname>
            <initial>G.</initial>
          </persName>
          <persName key="graal-2005-id18131">
            <foreName>Jean-Yves</foreName>
            <surname>L'Excellent</surname>
            <initial>J.-Y.</initial>
          </persName>
          <persName>
            <foreName>Wissam M.</foreName>
            <surname>Sid-Lakhdar</surname>
            <initial>W. M.</initial>
          </persName>
          <persName key="roma-2012-idp140458935000112">
            <foreName>Clement</foreName>
            <surname>Weisbecker</surname>
            <initial>C.</initial>
          </persName>
          <persName>
            <foreName>Michele</foreName>
            <surname>Forzan</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>Cristian</foreName>
            <surname>Pozza</surname>
            <initial>C.</initial>
          </persName>
          <persName>
            <foreName>Valène</foreName>
            <surname>Pellissier</surname>
            <initial>V.</initial>
          </persName>
          <persName>
            <foreName>Rémy</foreName>
            <surname>Perrin</surname>
            <initial>R.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">IEEE International Conference on the Computation of Electromagnetic Fields (COMPUMAG)</title>
        <loc>Budapest, Hungary</loc>
        <imprint>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00924660" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00924660</ref>
        </imprint>
        <meeting id="cid49732">
          <title>Conference on the Computation of Electromagnetic Fields</title>
          <num>2013</num>
          <abbr type="sigle">Compumag</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid42" type="inproceedings" rend="year" n="cite:aupy:hal-00926199">
      <identifiant type="hal" value="hal-00926199"/>
      <analytic>
        <title level="a">Optimal Checkpointing Period: Time vs. Energy</title>
        <author>
          <persName key="graal-2011-idp140410991004288">
            <foreName>Guillaume</foreName>
            <surname>Aupy</surname>
            <initial>G.</initial>
          </persName>
          <persName key="graal-2005-id18164">
            <foreName>Anne</foreName>
            <surname>Benoit</surname>
            <initial>A.</initial>
          </persName>
          <persName key="grand-large-2005-id18208">
            <foreName>Thomas</foreName>
            <surname>Hérault</surname>
            <initial>T.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName>
            <foreName>Jack</foreName>
            <surname>Dongarra</surname>
            <initial>J.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Performance Modeling, Benchmarking and Simulation of High Performance Computer Systems</title>
        <loc>Denver, United States</loc>
        <imprint>
          <dateStruct>
            <month>November</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00926199" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00926199</ref>
        </imprint>
        <meeting id="cid624073">
          <title>International Workshop on Performance Modeling, Benchmarking and Simulation of High Performance Computer Systems</title>
          <num>4</num>
          <abbr type="sigle">PMBS</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid32" type="inproceedings" rend="year" n="cite:aupy:hal-00847620">
      <identifiant type="hal" value="hal-00847620"/>
      <analytic>
        <title level="a">On the Combination of Silent Error Detection and Checkpointing</title>
        <author>
          <persName key="graal-2011-idp140410991004288">
            <foreName>Guillaume</foreName>
            <surname>Aupy</surname>
            <initial>G.</initial>
          </persName>
          <persName key="graal-2005-id18164">
            <foreName>Anne</foreName>
            <surname>Benoit</surname>
            <initial>A.</initial>
          </persName>
          <persName key="grand-large-2005-id18208">
            <foreName>Thomas</foreName>
            <surname>Hérault</surname>
            <initial>T.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
          <persName key="graal-2011-idp140410991039440">
            <foreName>Dounia</foreName>
            <surname>Zaidouni</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">PRDC - The 19th IEEE Pacific Rim International Symposium on Dependable Computing - 2013</title>
        <loc>Vancouver, Canada</loc>
        <imprint>
          <publisher>
            <orgName>IEEE</orgName>
          </publisher>
          <dateStruct>
            <month>December</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00847620" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00847620</ref>
        </imprint>
        <meeting id="cid357066">
          <title>Pacific Rim International Symposium on Dependable Computing</title>
          <num>19</num>
          <abbr type="sigle">PRDC</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid43" type="inproceedings" rend="year" n="cite:aupy:hal-00857244">
      <identifiant type="hal" value="hal-00857244"/>
      <analytic>
        <title level="a">Energy-aware checkpointing of divisible tasks with soft or hard deadlines</title>
        <author>
          <persName key="graal-2011-idp140410991004288">
            <foreName>Guillaume</foreName>
            <surname>Aupy</surname>
            <initial>G.</initial>
          </persName>
          <persName key="graal-2005-id18164">
            <foreName>Anne</foreName>
            <surname>Benoit</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>Rami</foreName>
            <surname>Melhem</surname>
            <initial>R.</initial>
          </persName>
          <persName key="graal-2009-id60733">
            <foreName>Paul</foreName>
            <surname>Renaud-Goud</surname>
            <initial>P.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">IGCC - 4th International Green Computing Conference - 2013</title>
        <loc>Arlington, United States</loc>
        <imprint>
          <dateStruct>
            <month>February</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00857244" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00857244</ref>
        </imprint>
        <meeting id="cid624032">
          <title>IEEE International Green Computing Conference</title>
          <num>4</num>
          <abbr type="sigle">IEEE IGCC</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid75" type="inproceedings" rend="year" n="cite:aupy:hal-00844492">
      <identifiant type="hal" value="hal-00844492"/>
      <analytic>
        <title level="a">Implementing a systolic algorithm for QR factorization on multicore clusters with PaRSEC</title>
        <author>
          <persName key="graal-2011-idp140410991004288">
            <foreName>Guillaume</foreName>
            <surname>Aupy</surname>
            <initial>G.</initial>
          </persName>
          <persName key="scalapplix-2006-id18605">
            <foreName>Mathieu</foreName>
            <surname>Faverge</surname>
            <initial>M.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName>
            <foreName>Jakub</foreName>
            <surname>Kurzak</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Piotr</foreName>
            <surname>Luszczek</surname>
            <initial>P.</initial>
          </persName>
          <persName>
            <foreName>Jack</foreName>
            <surname>Dongarra</surname>
            <initial>J.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">PROPER 2013 - 6th Workshop on Productivity and Performance</title>
        <loc>Aachen, Germany</loc>
        <imprint>
          <dateStruct>
            <month>August</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00844492" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00844492</ref>
        </imprint>
        <meeting id="cid623589">
          <title>Workshop on Productivity and Performance</title>
          <num>6</num>
          <abbr type="sigle">PROPER</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid33" type="inproceedings" rend="year" n="cite:aupy:hal-00847622">
      <identifiant type="hal" value="hal-00847622"/>
      <analytic>
        <title level="a">Checkpointing strategies with prediction windows</title>
        <author>
          <persName key="graal-2011-idp140410991004288">
            <foreName>Guillaume</foreName>
            <surname>Aupy</surname>
            <initial>G.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
          <persName key="graal-2011-idp140410991039440">
            <foreName>Dounia</foreName>
            <surname>Zaidouni</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">PRDC - The 19th IEEE Pacific Rim International Symposium on Dependable Computing - 2013</title>
        <loc>Vancouver, Canada</loc>
        <imprint>
          <publisher>
            <orgName>IEEE</orgName>
          </publisher>
          <dateStruct>
            <month>December</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00847622" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00847622</ref>
        </imprint>
        <meeting id="cid357066">
          <title>Pacific Rim International Symposium on Dependable Computing</title>
          <num>19</num>
          <abbr type="sigle">PRDC</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid51" type="inproceedings" rend="year" n="cite:beaumont:hal-00771640">
      <identifiant type="hal" value="hal-00771640"/>
      <analytic>
        <title level="a">Non Linear Divisible Loads: There is No Free Lunch</title>
        <author>
          <persName key="scalapplix-2005-id18245">
            <foreName>Olivier</foreName>
            <surname>Beaumont</surname>
            <initial>O.</initial>
          </persName>
          <persName key="cepage-2007-id18382">
            <foreName>Hubert</foreName>
            <surname>Larchevêque</surname>
            <initial>H.</initial>
          </persName>
          <persName key="graal-2005-id18473">
            <foreName>Loris</foreName>
            <surname>Marchal</surname>
            <initial>L.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">IPDPS 2013, 27th IEEE International Parallel &amp; Distributed Processing Symposium</title>
        <loc>Boston, United States</loc>
        <imprint>
          <publisher>
            <orgName type="organisation">IEEE</orgName>
          </publisher>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00771640" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00771640</ref>
        </imprint>
        <meeting id="cid87817">
          <title>IEEE International Parallel and Distributed Processing Symposium</title>
          <num>27</num>
          <abbr type="sigle">IPDPS</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid50" type="inproceedings" rend="year" n="cite:benoit:hal-00926093">
      <identifiant type="hal" value="hal-00926093"/>
      <analytic>
        <title level="a">Non-clairvoyant reduction algorithms for heterogeneous platforms</title>
        <author>
          <persName key="graal-2005-id18164">
            <foreName>Anne</foreName>
            <surname>Benoit</surname>
            <initial>A.</initial>
          </persName>
          <persName key="algorille-2005-id18342">
            <foreName>Louis-Claude</foreName>
            <surname>Canon</surname>
            <initial>L.-C.</initial>
          </persName>
          <persName key="graal-2005-id18473">
            <foreName>Loris</foreName>
            <surname>Marchal</surname>
            <initial>L.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">HeteroPar'2013, in conjunction with Euro-Par 2013</title>
        <loc>Aachen, Germany</loc>
        <imprint>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00926093" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00926093</ref>
        </imprint>
        <meeting id="cid322121">
          <title>International Workshop on Algorithms, Models and Tools for Parallel Computing on Heterogeneous Networks</title>
          <num>11</num>
          <abbr type="sigle">HeteroPar</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid60" type="inproceedings" rend="year" n="cite:benoit:hal-00738393">
      <identifiant type="doi" value="10.1109/IPDPSW.2013.30"/>
      <identifiant type="hal" value="hal-00738393"/>
      <analytic>
        <title level="a">Semi-matching algorithms for scheduling parallel tasks under resource constraints</title>
        <author>
          <persName key="graal-2005-id18164">
            <foreName>Anne</foreName>
            <surname>Benoit</surname>
            <initial>A.</initial>
          </persName>
          <persName key="graal-2011-idp140410990993920">
            <foreName>Johannes</foreName>
            <surname>Langguth</surname>
            <initial>J.</initial>
          </persName>
          <persName key="graal-2009-id59570">
            <foreName>Bora</foreName>
            <surname>Uçar</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">IEEE International Symposium on Parallel &amp; Distributed Processing, Workshops and Phd Forum</title>
        <loc>Cambridge, MA, United States</loc>
        <imprint>
          <publisher>
            <orgName>IEEE Computer Society</orgName>
          </publisher>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">1744-1753</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00738393" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00738393</ref>
        </imprint>
        <meeting id="cid87817">
          <title>IEEE International Parallel and Distributed Processing Symposium</title>
          <num>27</num>
          <abbr type="sigle">IPDPS</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid41" type="inproceedings" rend="year" n="cite:bouteiller:hal-00926606">
      <identifiant type="doi" value="10.1007/978-3-642-40047-6_43"/>
      <identifiant type="hal" value="hal-00926606"/>
      <analytic>
        <title level="a">Multi-criteria checkpointing strategies: response-time versus resource utilization</title>
        <author>
          <persName key="graal-2005-id18178">
            <foreName>Aurélien</foreName>
            <surname>Bouteiller</surname>
            <initial>A.</initial>
          </persName>
          <persName key="grand-large-2005-id18099">
            <foreName>Franck</foreName>
            <surname>Cappello</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Jack</foreName>
            <surname>Dongarra</surname>
            <initial>J.</initial>
          </persName>
          <persName key="grand-large-2008-id18798">
            <foreName>Amina</foreName>
            <surname>Guermouche</surname>
            <initial>A.</initial>
          </persName>
          <persName key="grand-large-2005-id18208">
            <foreName>Thomas</foreName>
            <surname>Hérault</surname>
            <initial>T.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <editor role="editor">
          <persName>
            <foreName>Srpinger</foreName>
            <surname>Verlag</surname>
            <initial>S.</initial>
          </persName>
        </editor>
        <title level="m">Euro-Par 2013</title>
        <loc>Aachen, Germany</loc>
        <title level="s">LNCS</title>
        <imprint>
          <biblScope type="volume">8097</biblScope>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">420-431</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00926606" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00926606</ref>
        </imprint>
        <meeting id="cid306382">
          <title>International Euro-Par Conference on Parallel Processing</title>
          <num>19</num>
          <abbr type="sigle">Euro-Par</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid36" type="inproceedings" rend="year" n="cite:casanova:hal-00763376">
      <identifiant type="hal" value="hal-00763376"/>
      <analytic>
        <title level="a">Mapping tightly-coupled applications on volatile resources</title>
        <author>
          <persName>
            <foreName>Henri</foreName>
            <surname>Casanova</surname>
            <initial>H.</initial>
          </persName>
          <persName key="graal-2008-id18982">
            <foreName>Fanny</foreName>
            <surname>Dufossé</surname>
            <initial>F.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">PDP'2013, the 21st Euromicro Int. Conf. on Parallel, Distributed, and Network-Based Processing</title>
        <loc>Belfast, United Kingdom</loc>
        <imprint>
          <publisher>
            <orgName>IEEE Computer Society Press</orgName>
          </publisher>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00763376" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00763376</ref>
        </imprint>
        <meeting id="cid64853">
          <title>Euromicro International Conference on Parallel, Distributed and Network-Based Processing</title>
          <num>21</num>
          <abbr type="sigle">PDP</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid37" type="inproceedings" rend="year" n="cite:casanova:hal-00788606">
      <identifiant type="hal" value="hal-00788606"/>
      <analytic>
        <title level="a">Scheduling Tightly-Coupled Applications on Heterogeneous Desktop Grids</title>
        <author>
          <persName>
            <foreName>Henri</foreName>
            <surname>Casanova</surname>
            <initial>H.</initial>
          </persName>
          <persName key="graal-2008-id18982">
            <foreName>Fanny</foreName>
            <surname>Dufossé</surname>
            <initial>F.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">HCW 2013 - 22nd International Heterogeneity in Computing Workshop</title>
        <loc>Boston, United States</loc>
        <imprint>
          <dateStruct>
            <month>May</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00788606" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00788606</ref>
        </imprint>
        <meeting id="cid307023">
          <title>International Heterogeneous Computing Workshop</title>
          <num>22</num>
          <abbr type="sigle">HCW</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid77" type="inproceedings" rend="year" n="cite:casanova:hal-00923953">
      <identifiant type="hal" value="hal-00923953"/>
      <analytic>
        <title level="a">Cost-Optimal Execution of Boolean Query Trees with Shared Streams</title>
        <author>
          <persName>
            <foreName>Henri</foreName>
            <surname>Casanova</surname>
            <initial>H.</initial>
          </persName>
          <persName>
            <foreName>Lipyeow</foreName>
            <surname>Lim</surname>
            <initial>L.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
          <persName key="graal-2011-idp140410991039440">
            <foreName>Dounia</foreName>
            <surname>Zaidouni</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">28th IEEE International Parallel &amp; Distributed Processing Symposium</title>
        <loc>Phoenix, United States</loc>
        <imprint>
          <publisher>
            <orgName>IEEE</orgName>
          </publisher>
          <dateStruct>
            <month>May</month>
            <year>2014</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00923953" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00923953</ref>
        </imprint>
        <meeting id="cid87817">
          <title>IEEE International Parallel and Distributed Processing Symposium</title>
          <num>28</num>
          <abbr type="sigle">IPDPS</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid61" type="inproceedings" rend="year" n="cite:deveci:hal-00923464">
      <identifiant type="doi" value="10.1109/ICPP.2013.11"/>
      <identifiant type="hal" value="hal-00923464"/>
      <analytic>
        <title level="a">A Push-Relabel-Based Maximum Cardinality Bipartite Matching Algorithm on GPUs</title>
        <author>
          <persName>
            <foreName>Mehmet</foreName>
            <surname>Deveci</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>Kamer</foreName>
            <surname>Kaya</surname>
            <initial>K.</initial>
          </persName>
          <persName key="graal-2009-id59570">
            <foreName>Bora</foreName>
            <surname>Uçar</surname>
            <initial>B.</initial>
          </persName>
          <persName>
            <foreName>V. Umit</foreName>
            <surname>Catalyurek</surname>
            <initial>V. U.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">42nd International Conference on Parallel Processing</title>
        <loc>Lyon, France</loc>
        <imprint>
          <publisher>
            <orgName>IEEE Computer Society</orgName>
          </publisher>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">21 - 29</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00923464" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00923464</ref>
        </imprint>
        <meeting id="cid295154">
          <title>International Conference on Parallel Processing</title>
          <num>42</num>
          <abbr type="sigle">ICPP</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid62" type="inproceedings" rend="year" n="cite:deveci:hal-00923449">
      <identifiant type="doi" value="10.1007/978-3-642-40047-6_84"/>
      <identifiant type="hal" value="hal-00923449"/>
      <analytic>
        <title level="a">GPU accelerated maximum cardinality matching algorithms for bipartite graphs</title>
        <author>
          <persName>
            <foreName>Mehmet</foreName>
            <surname>Deveci</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>Kamer</foreName>
            <surname>Kaya</surname>
            <initial>K.</initial>
          </persName>
          <persName key="graal-2009-id59570">
            <foreName>Bora</foreName>
            <surname>Uçar</surname>
            <initial>B.</initial>
          </persName>
          <persName>
            <foreName>V. Umit</foreName>
            <surname>Catalyurek</surname>
            <initial>V. U.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <editor role="editor">
          <persName>
            <foreName>Felix</foreName>
            <surname>Wolf</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Bernd</foreName>
            <surname>Mohr</surname>
            <initial>B.</initial>
          </persName>
          <persName>
            <foreName>Dieter</foreName>
            <surname>an Mey</surname>
            <initial>D.</initial>
          </persName>
        </editor>
        <title level="m">Euro-Par 2013</title>
        <loc>Aachen, Germany</loc>
        <imprint>
          <publisher>
            <orgName>Springer</orgName>
          </publisher>
          <dateStruct>
            <month>August</month>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">850-861</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00923449" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00923449</ref>
        </imprint>
        <meeting id="cid306382">
          <title>International Euro-Par Conference on Parallel Processing</title>
          <num>19</num>
          <abbr type="sigle">Euro-Par</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid76" type="inproceedings" rend="year" n="cite:di:hal-00847635">
      <identifiant type="doi" value="10.1145/2503210.2503217"/>
      <identifiant type="hal" value="hal-00847635"/>
      <analytic>
        <title level="a">Optimization of Cloud Task Processing with Checkpoint-Restart Mechanism</title>
        <author>
          <persName key="mescal-2012-idp140606033435856">
            <foreName>Sheng</foreName>
            <surname>Di</surname>
            <initial>S.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
          <persName key="grand-large-2005-id18314">
            <foreName>Derrick</foreName>
            <surname>Kondo</surname>
            <initial>D.</initial>
          </persName>
          <persName>
            <foreName>Cho-Li</foreName>
            <surname>Wang</surname>
            <initial>C.-L.</initial>
          </persName>
          <persName key="grand-large-2005-id18099">
            <foreName>Franck</foreName>
            <surname>Cappello</surname>
            <initial>F.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">SC13 - Supercomputing - 2013</title>
        <loc>Denver, United States</loc>
        <imprint>
          <publisher>
            <orgName>ACM</orgName>
          </publisher>
          <dateStruct>
            <month>November</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00847635" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00847635</ref>
        </imprint>
        <meeting id="cid19985">
          <title>ACM International Conference on Supercomputing</title>
          <num>2013</num>
          <abbr type="sigle">ICS</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid40" type="inproceedings" rend="year" n="cite:dongarra:hal-00925168">
      <identifiant type="hal" value="hal-00925168"/>
      <analytic>
        <title level="a">Revisiting the double checkpointing algorithm</title>
        <author>
          <persName>
            <foreName>Jack</foreName>
            <surname>Dongarra</surname>
            <initial>J.</initial>
          </persName>
          <persName key="grand-large-2005-id18208">
            <foreName>Thomas</foreName>
            <surname>Hérault</surname>
            <initial>T.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">APDCM 2013</title>
        <loc>Boston, United States</loc>
        <imprint>
          <publisher>
            <orgName type="organisation">IEEE</orgName>
          </publisher>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00925168" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00925168</ref>
        </imprint>
        <meeting id="cid373416">
          <title>Workshop on Advances in Parallel and Distributed Computational Models</title>
          <num>15</num>
          <abbr type="sigle">APDCM</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid78" type="inproceedings" rend="year" n="cite:faverge:hal-00930238">
      <identifiant type="hal" value="hal-00930238"/>
      <analytic>
        <title level="a">Designing LU-QR hybrid solvers for performance and stability</title>
        <author>
          <persName key="scalapplix-2006-id18605">
            <foreName>Mathieu</foreName>
            <surname>Faverge</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>Julien</foreName>
            <surname>Herrmann</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Julien</foreName>
            <surname>Langou</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Bradley</foreName>
            <surname>Lowery</surname>
            <initial>B.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName>
            <foreName>Jack</foreName>
            <surname>Dongarra</surname>
            <initial>J.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">IEEE International Parallel &amp; Distributed Processing Symposium</title>
        <loc>Phoenix, United States</loc>
        <imprint>
          <dateStruct>
            <month>December</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00930238" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00930238</ref>
        </imprint>
        <meeting id="cid87817">
          <title>IEEE International Parallel and Distributed Processing Symposium</title>
          <num>27</num>
          <abbr type="sigle">IPDPS</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid31" type="inproceedings" rend="year" n="cite:herrmann:hal-00926502">
      <identifiant type="hal" value="hal-00926502"/>
      <analytic>
        <title level="a">Model and complexity results for tree traversals on hybrid platforms</title>
        <author>
          <persName>
            <foreName>Julien</foreName>
            <surname>Herrmann</surname>
            <initial>J.</initial>
          </persName>
          <persName key="graal-2005-id18473">
            <foreName>Loris</foreName>
            <surname>Marchal</surname>
            <initial>L.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">HeteroPar - International Workshop on Algorithms, Models and Tools for Parallel Computing on Heterogeneous Platforms</title>
        <loc>Aachen, Germany</loc>
        <imprint>
          <dateStruct>
            <month>August</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00926502" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00926502</ref>
        </imprint>
        <meeting id="cid322121">
          <title>International Workshop on Algorithms, Models and Tools for Parallel Computing on Heterogeneous Networks</title>
          <num>11</num>
          <abbr type="sigle">HeteroPar</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct subtype="nonparu-n" id="roma-2013-bid63" type="inproceedings" rend="year" n="cite:kaya:hal-00923454">
      <identifiant type="hal" value="hal-00923454"/>
      <analytic>
        <title level="a">Analysis of Partitioning Models and Metrics in Parallel Sparse Matrix-Vector Multiplication</title>
        <author>
          <persName>
            <foreName>Kamer</foreName>
            <surname>Kaya</surname>
            <initial>K.</initial>
          </persName>
          <persName key="graal-2009-id59570">
            <foreName>Bora</foreName>
            <surname>Uçar</surname>
            <initial>B.</initial>
          </persName>
          <persName>
            <foreName>V. Umit</foreName>
            <surname>Catalyurek</surname>
            <initial>V. U.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">10th PPAM - Parallel Processing and Applied Mathematics</title>
        <loc>Varsovie, Poland</loc>
        <imprint>
          <publisher>
            <orgName>Springer</orgName>
          </publisher>
          <dateStruct>
            <year>2014</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00923454" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00923454</ref>
        </imprint>
        <meeting id="cid295329">
          <title>International Conference on Parallel Processing and Applied Mathematics</title>
          <num>11</num>
          <abbr type="sigle">PPAM</abbr>
        </meeting>
      </monogr>
      <note type="bnote">to appear</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid30" type="inproceedings" rend="year" n="cite:marchal:hal-00788612">
      <identifiant type="hal" value="hal-00788612"/>
      <analytic>
        <title level="a">Scheduling tree-shaped task graphs to minimize memory and makespan</title>
        <author>
          <persName key="graal-2005-id18473">
            <foreName>Loris</foreName>
            <surname>Marchal</surname>
            <initial>L.</initial>
          </persName>
          <persName key="roma-2012-idp140458935022000">
            <foreName>Oliver</foreName>
            <surname>Sinnen</surname>
            <initial>O.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">IPDPS 2013 - 27th IEEE International Parallel &amp; Distributed Processing Symposium</title>
        <loc>Boston, United States</loc>
        <imprint>
          <dateStruct>
            <month>May</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00788612" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00788612</ref>
        </imprint>
        <meeting id="cid87817">
          <title>IEEE International Parallel and Distributed Processing Symposium</title>
          <num>27</num>
          <abbr type="sigle">IPDPS</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid54" type="inproceedings" rend="year" n="cite:weisbecker:hal-00924638">
      <identifiant type="doi" value="10.1190/segam2013-0603.1"/>
      <identifiant type="hal" value="hal-00924638"/>
      <analytic>
        <title level="a">3D frequency-domain seismic modeling with a Block Low-Rank algebraic multifrontal direct solver</title>
        <author>
          <persName key="roma-2012-idp140458935000112">
            <foreName>Clement</foreName>
            <surname>Weisbecker</surname>
            <initial>C.</initial>
          </persName>
          <persName key="scalapplix-2005-id18472">
            <foreName>Patrick R.</foreName>
            <surname>Amestoy</surname>
            <initial>P. R.</initial>
          </persName>
          <persName>
            <foreName>Olivier</foreName>
            <surname>Boiteau</surname>
            <initial>O.</initial>
          </persName>
          <persName>
            <foreName>Romain</foreName>
            <surname>Brossier</surname>
            <initial>R.</initial>
          </persName>
          <persName key="graal-2008-id18788">
            <foreName>Alfredo</foreName>
            <surname>Buttari</surname>
            <initial>A.</initial>
          </persName>
          <persName key="graal-2005-id18131">
            <foreName>Jean-Yves</foreName>
            <surname>L'Excellent</surname>
            <initial>J.-Y.</initial>
          </persName>
          <persName key="caiman-2006-id18311">
            <foreName>Stéphane</foreName>
            <surname>Operto</surname>
            <initial>S.</initial>
          </persName>
          <persName key="caiman-2005-id18253">
            <foreName>Jean</foreName>
            <surname>Virieux</surname>
            <initial>J.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">SEG Technical Program Expanded Abstracts, SEG annual meeting</title>
        <loc>Houston, Texas, United States</loc>
        <imprint>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00924638" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00924638</ref>
        </imprint>
        <meeting id="cid360928">
          <title>Society of Exploration Geophysicists International Exposition and Annual Meeting</title>
          <num>2013</num>
          <abbr type="sigle"/>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid65" type="inproceedings" rend="year" n="cite:yamazaki:hal-00923447">
      <identifiant type="hal" value="hal-00923447"/>
      <analytic>
        <title level="a">On Partitioning and Reordering Problems in a Hierarchically Parallel Hybrid Linear Solver</title>
        <author>
          <persName>
            <foreName>Ichitaro</foreName>
            <surname>Yamazaki</surname>
            <initial>I.</initial>
          </persName>
          <persName key="comore-2010-id59770">
            <foreName>Xiaoye S.</foreName>
            <surname>Li</surname>
            <initial>X. S.</initial>
          </persName>
          <persName key="roma-2012-idp140458934997424">
            <foreName>François-Henry</foreName>
            <surname>Rouet</surname>
            <initial>F.-H.</initial>
          </persName>
          <persName key="graal-2009-id59570">
            <foreName>Bora</foreName>
            <surname>Uçar</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">2013 IEEE 27th International Parallel and Distributed Processing Symposium Workshops &amp; PhD Forum (IPDPSW)</title>
        <loc>Cambridge, MA, United States</loc>
        <imprint>
          <publisher>
            <orgName>IEEE Computer Society</orgName>
          </publisher>
          <publisher>
            <orgName type="organisation">IEEE</orgName>
          </publisher>
          <dateStruct>
            <month>May</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00923447" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00923447</ref>
        </imprint>
        <meeting id="cid87817">
          <title>IEEE International Parallel and Distributed Processing Symposium</title>
          <num>27</num>
          <abbr type="sigle">IPDPS</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid52" subtype="nonparu-n" type="techreport" rend="year" n="cite:amestoy:hal-00776859">
      <identifiant type="hal" value="hal-00776859"/>
      <monogr>
        <title level="m">Improving multifrontal methods by means of block low-rank representations</title>
        <author>
          <persName key="scalapplix-2005-id18472">
            <foreName>Patrick R.</foreName>
            <surname>Amestoy</surname>
            <initial>P. R.</initial>
          </persName>
          <persName>
            <foreName>Cleve</foreName>
            <surname>Ashcraft</surname>
            <initial>C.</initial>
          </persName>
          <persName>
            <foreName>Olivier</foreName>
            <surname>Boiteau</surname>
            <initial>O.</initial>
          </persName>
          <persName key="graal-2008-id18788">
            <foreName>Alfredo</foreName>
            <surname>Buttari</surname>
            <initial>A.</initial>
          </persName>
          <persName key="graal-2005-id18131">
            <foreName>Jean-Yves</foreName>
            <surname>L'Excellent</surname>
            <initial>J.-Y.</initial>
          </persName>
          <persName key="roma-2012-idp140458935000112">
            <foreName>Clement</foreName>
            <surname>Weisbecker</surname>
            <initial>C.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-8199</biblScope>
          <publisher>
            <orgName type="institution">Inria</orgName>
          </publisher>
          <dateStruct>
            <month>January</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00776859" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00776859</ref>
        </imprint>
      </monogr>
      <note type="bnote">Submitted for publication to SIAM</note>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid88" type="techreport" rend="year" n="cite:aupy:hal-00878938">
      <identifiant type="hal" value="hal-00878938"/>
      <monogr>
        <title level="m">Optimal Checkpointing Period: Time vs. Energy</title>
        <author>
          <persName key="graal-2011-idp140410991004288">
            <foreName>Guillaume</foreName>
            <surname>Aupy</surname>
            <initial>G.</initial>
          </persName>
          <persName key="graal-2005-id18164">
            <foreName>Anne</foreName>
            <surname>Benoit</surname>
            <initial>A.</initial>
          </persName>
          <persName key="grand-large-2005-id18208">
            <foreName>Thomas</foreName>
            <surname>Hérault</surname>
            <initial>T.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName>
            <foreName>Jack</foreName>
            <surname>Dongarra</surname>
            <initial>J.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-8387</biblScope>
          <publisher>
            <orgName type="institution">Inria</orgName>
          </publisher>
          <dateStruct>
            <month>October</month>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">19</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00878938" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00878938</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid86" type="techreport" rend="year" n="cite:aupy:hal-00836871">
      <identifiant type="hal" value="hal-00836871"/>
      <monogr>
        <title level="m">On the Combination of Silent Error Detection and Checkpointing</title>
        <author>
          <persName key="graal-2011-idp140410991004288">
            <foreName>Guillaume</foreName>
            <surname>Aupy</surname>
            <initial>G.</initial>
          </persName>
          <persName key="graal-2005-id18164">
            <foreName>Anne</foreName>
            <surname>Benoit</surname>
            <initial>A.</initial>
          </persName>
          <persName key="grand-large-2005-id18208">
            <foreName>Thomas</foreName>
            <surname>Hérault</surname>
            <initial>T.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
          <persName key="graal-2011-idp140410991039440">
            <foreName>Dounia</foreName>
            <surname>Zaidouni</surname>
            <initial>D.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-8319</biblScope>
          <publisher>
            <orgName type="institution">Inria</orgName>
          </publisher>
          <dateStruct>
            <month>June</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00836871" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00836871</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid81" type="techreport" rend="year" n="cite:aupy:hal-00788641">
      <identifiant type="hal" value="hal-00788641"/>
      <monogr>
        <title level="m">Energy-aware checkpointing of divisible tasks with soft or hard deadlines</title>
        <author>
          <persName key="graal-2011-idp140410991004288">
            <foreName>Guillaume</foreName>
            <surname>Aupy</surname>
            <initial>G.</initial>
          </persName>
          <persName key="graal-2005-id18164">
            <foreName>Anne</foreName>
            <surname>Benoit</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>Rami</foreName>
            <surname>Melhem</surname>
            <initial>R.</initial>
          </persName>
          <persName key="graal-2009-id60733">
            <foreName>Paul</foreName>
            <surname>Renaud-Goud</surname>
            <initial>P.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-8238</biblScope>
          <publisher>
            <orgName type="institution">Inria</orgName>
          </publisher>
          <dateStruct>
            <month>February</month>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">33</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00788641" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00788641</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid89" type="techreport" rend="year" n="cite:aupy:hal-00879248">
      <identifiant type="hal" value="hal-00879248"/>
      <monogr>
        <title level="m">Implementing a Systolic Algorithm for QR Factorization on Multicore Clusters with PaRSEC</title>
        <author>
          <persName key="graal-2011-idp140410991004288">
            <foreName>Guillaume</foreName>
            <surname>Aupy</surname>
            <initial>G.</initial>
          </persName>
          <persName key="scalapplix-2006-id18605">
            <foreName>Mathieu</foreName>
            <surname>Faverge</surname>
            <initial>M.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName>
            <foreName>Jakub</foreName>
            <surname>Kurzak</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Piotr</foreName>
            <surname>Luszczek</surname>
            <initial>P.</initial>
          </persName>
          <persName>
            <foreName>Jack</foreName>
            <surname>Dongarra</surname>
            <initial>J.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-8390</biblScope>
          <publisher>
            <orgName type="institution">Inria</orgName>
          </publisher>
          <dateStruct>
            <month>November</month>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">16</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00879248" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00879248</ref>
        </imprint>
      </monogr>
      <note type="bnote">Published in ProPer'13</note>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid34" subtype="nonparu-n" type="techreport" rend="year" n="cite:aupy:hal-00788313">
      <identifiant type="hal" value="hal-00788313"/>
      <monogr>
        <title level="m">Checkpointing algorithms and fault prediction</title>
        <author>
          <persName key="graal-2011-idp140410991004288">
            <foreName>Guillaume</foreName>
            <surname>Aupy</surname>
            <initial>G.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
          <persName key="graal-2011-idp140410991039440">
            <foreName>Dounia</foreName>
            <surname>Zaidouni</surname>
            <initial>D.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-8237</biblScope>
          <publisher>
            <orgName type="institution">Inria</orgName>
          </publisher>
          <dateStruct>
            <month>February</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00788313" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00788313</ref>
        </imprint>
      </monogr>
      <note type="bnote">Accepted to be published in JPDC</note>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid82" type="techreport" rend="year" n="cite:aupy:hal-00789109">
      <identifiant type="hal" value="hal-00789109"/>
      <monogr>
        <title level="m">Checkpointing strategies with prediction windows</title>
        <author>
          <persName key="graal-2011-idp140410991004288">
            <foreName>Guillaume</foreName>
            <surname>Aupy</surname>
            <initial>G.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
          <persName key="graal-2011-idp140410991039440">
            <foreName>Dounia</foreName>
            <surname>Zaidouni</surname>
            <initial>D.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-8239</biblScope>
          <publisher>
            <orgName type="institution">Inria</orgName>
          </publisher>
          <dateStruct>
            <month>February</month>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">44</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00789109" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00789109</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid85" type="techreport" rend="year" n="cite:aupy:hal-00836629">
      <identifiant type="hal" value="hal-00836629"/>
      <monogr>
        <title level="m">Comments on ”Improving the computing efficiency of HPC systems using a combination of proactive and preventive checkpoint”</title>
        <author>
          <persName key="graal-2011-idp140410991004288">
            <foreName>Guillaume</foreName>
            <surname>Aupy</surname>
            <initial>G.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
          <persName key="graal-2011-idp140410991039440">
            <foreName>Dounia</foreName>
            <surname>Zaidouni</surname>
            <initial>D.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-8318</biblScope>
          <publisher>
            <orgName type="institution">Inria</orgName>
          </publisher>
          <dateStruct>
            <month>June</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00836629" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00836629</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid83" type="techreport" rend="year" n="cite:aupy:hal-00819036">
      <identifiant type="hal" value="hal-00819036"/>
      <monogr>
        <title level="m">Co-Scheduling Algorithms for High-Throughput Workload Execution</title>
        <author>
          <persName key="graal-2011-idp140410991004288">
            <foreName>Guillaume</foreName>
            <surname>Aupy</surname>
            <initial>G.</initial>
          </persName>
          <persName>
            <foreName>Manu</foreName>
            <surname>Shantharam</surname>
            <initial>M.</initial>
          </persName>
          <persName key="graal-2005-id18164">
            <foreName>Anne</foreName>
            <surname>Benoit</surname>
            <initial>A.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName>
            <foreName>Padma</foreName>
            <surname>Raghavan</surname>
            <initial>P.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-8293</biblScope>
          <publisher>
            <orgName type="institution">Inria</orgName>
          </publisher>
          <dateStruct>
            <month>April</month>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">21</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00819036" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00819036</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid84" type="techreport" rend="year" n="cite:benoit:hal-00832102">
      <identifiant type="hal" value="hal-00832102"/>
      <monogr>
        <title level="m">Non-clairvoyant reduction algorithms for heterogeneous platforms</title>
        <author>
          <persName key="graal-2005-id18164">
            <foreName>Anne</foreName>
            <surname>Benoit</surname>
            <initial>A.</initial>
          </persName>
          <persName key="algorille-2005-id18342">
            <foreName>Louis-Claude</foreName>
            <surname>Canon</surname>
            <initial>L.-C.</initial>
          </persName>
          <persName key="graal-2005-id18473">
            <foreName>Loris</foreName>
            <surname>Marchal</surname>
            <initial>L.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-8315</biblScope>
          <publisher>
            <orgName type="institution">Inria</orgName>
          </publisher>
          <dateStruct>
            <month>June</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00832102" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00832102</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid87" type="techreport" rend="year" n="cite:casanova:hal-00869340">
      <identifiant type="hal" value="hal-00869340"/>
      <monogr>
        <title level="m">Cost-Optimal Execution of Trees of Boolean Operators with Shared Streams</title>
        <author>
          <persName>
            <foreName>Henri</foreName>
            <surname>Casanova</surname>
            <initial>H.</initial>
          </persName>
          <persName>
            <foreName>Lipyeow</foreName>
            <surname>Lim</surname>
            <initial>L.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
          <persName key="graal-2011-idp140410991039440">
            <foreName>Dounia</foreName>
            <surname>Zaidouni</surname>
            <initial>D.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-8373</biblScope>
          <publisher>
            <orgName type="institution">Inria</orgName>
          </publisher>
          <dateStruct>
            <month>October</month>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">39</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00869340" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00869340</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid64" type="techreport" rend="year" n="cite:catalyurek:hal-00821523">
      <identifiant type="hal" value="hal-00821523"/>
      <monogr>
        <title level="m">On analysis of partitioning models and metrics in parallel sparse matrix-vector multiplication</title>
        <author>
          <persName>
            <foreName>V. Umit</foreName>
            <surname>Catalyurek</surname>
            <initial>V. U.</initial>
          </persName>
          <persName>
            <foreName>Kamer</foreName>
            <surname>Kaya</surname>
            <initial>K.</initial>
          </persName>
          <persName key="graal-2009-id59570">
            <foreName>Bora</foreName>
            <surname>Uçar</surname>
            <initial>B.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-8301</biblScope>
          <publisher>
            <orgName type="institution">Inria</orgName>
          </publisher>
          <dateStruct>
            <month>May</month>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">25</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00821523" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00821523</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid68" type="techreport" rend="year" n="cite:dufosse:hal-00877211">
      <identifiant type="hal" value="hal-00877211"/>
      <monogr>
        <title level="m">Randomized matching heuristics with quality guarantees on shared memory parallel computers</title>
        <author>
          <persName key="graal-2008-id18982">
            <foreName>Fanny</foreName>
            <surname>Dufossé</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Kamer</foreName>
            <surname>Kaya</surname>
            <initial>K.</initial>
          </persName>
          <persName key="graal-2009-id59570">
            <foreName>Bora</foreName>
            <surname>Uçar</surname>
            <initial>B.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-8386 ; Rapport LAAS n°13578</biblScope>
          <publisher>
            <orgName type="institution">Inria</orgName>
          </publisher>
          <dateStruct>
            <month>October</month>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">28</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00877211" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00877211</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid80" type="techreport" rend="year" n="cite:herrmann:hal-00787753">
      <identifiant type="hal" value="hal-00787753"/>
      <monogr>
        <title level="m">Tree traversals with task-memory affinities</title>
        <author>
          <persName>
            <foreName>Julien</foreName>
            <surname>Herrmann</surname>
            <initial>J.</initial>
          </persName>
          <persName key="graal-2005-id18473">
            <foreName>Loris</foreName>
            <surname>Marchal</surname>
            <initial>L.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-8226</biblScope>
          <publisher>
            <orgName type="institution">Inria</orgName>
          </publisher>
          <dateStruct>
            <month>February</month>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">31</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00787753" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00787753</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid91" type="techreport" rend="year" n="cite:herrmann:hal-00944336">
      <identifiant type="hal" value="hal-00944336"/>
      <monogr>
        <title level="m">Memory-aware list scheduling for hybrid platforms</title>
        <author>
          <persName>
            <foreName>Julien</foreName>
            <surname>Herrmann</surname>
            <initial>J.</initial>
          </persName>
          <persName key="graal-2005-id18473">
            <foreName>Loris</foreName>
            <surname>Marchal</surname>
            <initial>L.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-8461</biblScope>
          <publisher>
            <orgName type="institution">Inria</orgName>
          </publisher>
          <dateStruct>
            <month>February</month>
            <year>2014</year>
          </dateStruct>
          <biblScope type="pages">30</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00944336" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00944336</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid90" type="techreport" rend="year" n="cite:kaya:hal-00932882">
      <identifiant type="hal" value="hal-00932882"/>
      <monogr>
        <title level="m">Fill-in reduction in sparse matrix factorizations using hypergraphs</title>
        <author>
          <persName>
            <foreName>Oguz</foreName>
            <surname>Kaya</surname>
            <initial>O.</initial>
          </persName>
          <persName>
            <foreName>Enver</foreName>
            <surname>Kayaaslan</surname>
            <initial>E.</initial>
          </persName>
          <persName key="graal-2009-id59570">
            <foreName>Bora</foreName>
            <surname>Uçar</surname>
            <initial>B.</initial>
          </persName>
          <persName key="hiepacs-2009-id59582">
            <foreName>Iain S.</foreName>
            <surname>Duff</surname>
            <initial>I. S.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-8448</biblScope>
          <publisher>
            <orgName type="institution">Inria</orgName>
          </publisher>
          <dateStruct>
            <month>January</month>
            <year>2014</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00932882" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00932882</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid69" type="techreport" rend="year" n="cite:kaya:hal-00795429">
      <identifiant type="hal" value="hal-00795429"/>
      <monogr>
        <title level="m">On the minimum edge cover and vertex partition by quasi-cliques problems</title>
        <author>
          <persName>
            <foreName>Oguz</foreName>
            <surname>Kaya</surname>
            <initial>O.</initial>
          </persName>
          <persName>
            <foreName>Enver</foreName>
            <surname>Kayaaslan</surname>
            <initial>E.</initial>
          </persName>
          <persName key="graal-2009-id59570">
            <foreName>Bora</foreName>
            <surname>Uçar</surname>
            <initial>B.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-8255</biblScope>
          <publisher>
            <orgName type="institution">Inria</orgName>
          </publisher>
          <dateStruct>
            <month>February</month>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00795429" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00795429</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid53" type="techreport" rend="year" n="cite:lexcellent:hal-00786055">
      <identifiant type="hal" value="hal-00786055"/>
      <monogr>
        <title level="m">Introduction of shared-memory parallelism in a distributed-memory multifrontal solver</title>
        <author>
          <persName key="graal-2005-id18131">
            <foreName>Jean-Yves</foreName>
            <surname>L'Excellent</surname>
            <initial>J.-Y.</initial>
          </persName>
          <persName key="graal-2011-idp140410991034064">
            <foreName>Mohamed W.</foreName>
            <surname>Sid-Lakhdar</surname>
            <initial>M. W.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-8227</biblScope>
          <publisher>
            <orgName type="institution">Inria</orgName>
          </publisher>
          <dateStruct>
            <month>February</month>
            <year>2013</year>
          </dateStruct>
          <biblScope type="pages">35</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00786055" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00786055</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid17" type="inproceedings" rend="foot" n="footcite:Assayad11">
      <analytic>
        <title level="a">Tradeoff exploration between reliability power consumption and execution time</title>
        <author>
          <persName>
            <foreName>Ismail</foreName>
            <surname>Assayad</surname>
            <initial>I.</initial>
          </persName>
          <persName key="popart-2005-id18078">
            <foreName>Alain</foreName>
            <surname>Girault</surname>
            <initial>A.</initial>
          </persName>
          <persName key="espresso-2005-id18200">
            <foreName>Hamoudi</foreName>
            <surname>Kalla</surname>
            <initial>H.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of SAFECOMP, the Conf. on Computer Safety, Reliability and Security</title>
        <loc>Washington, DC, USA</loc>
        <imprint>
          <dateStruct>
            <year>2011</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid12" type="inproceedings" rend="foot" n="footcite:pow3IPDPS">
      <analytic>
        <title level="a">Energy-aware partitioning for multiprocessor real-time systems</title>
        <author>
          <persName>
            <foreName>H.</foreName>
            <surname>Aydin</surname>
            <initial>H.</initial>
          </persName>
          <persName>
            <foreName>Q.</foreName>
            <surname>Yang</surname>
            <initial>Q.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">IPDPS'03, the IEEE Int. Parallel and Distributed Processing Symposium</title>
        <imprint>
          <dateStruct>
            <year>2003</year>
          </dateStruct>
          <biblScope type="pages">113–121</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid13" type="article" rend="foot" n="footcite:BKP07">
      <identifiant type="doi" value="10.1145/1206035.1206038"/>
      <analytic>
        <title level="a">Speed Scaling to Manage Energy and Temperature</title>
        <author>
          <persName>
            <foreName>Nikhil</foreName>
            <surname>Bansal</surname>
            <initial>N.</initial>
          </persName>
          <persName>
            <foreName>Tracy</foreName>
            <surname>Kimbrel</surname>
            <initial>T.</initial>
          </persName>
          <persName>
            <foreName>Kirk</foreName>
            <surname>Pruhs</surname>
            <initial>K.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">Journal of the ACM</title>
        <imprint>
          <biblScope type="volume">54</biblScope>
          <biblScope type="number">1</biblScope>
          <dateStruct>
            <year>2007</year>
          </dateStruct>
          <biblScope type="pages">1 – 39</biblScope>
          <ref xlink:href="http://doi.acm.org/10.1145/1206035.1206038" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>doi.<allowbreak/>acm.<allowbreak/>org/<allowbreak/>10.<allowbreak/>1145/<allowbreak/>1206035.<allowbreak/>1206038</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid8" type="article" rend="foot" n="footcite:j107">
      <analytic>
        <title level="a">Scheduling concurrent bag-of-tasks applications on heterogeneous platforms</title>
        <author>
          <persName key="graal-2005-id18164">
            <foreName>Anne</foreName>
            <surname>Benoit</surname>
            <initial>A.</initial>
          </persName>
          <persName key="graal-2005-id18473">
            <foreName>Loris</foreName>
            <surname>Marchal</surname>
            <initial>L.</initial>
          </persName>
          <persName key="graal-2005-id18500">
            <foreName>Jean-François</foreName>
            <surname>Pineau</surname>
            <initial>J.-F.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes">
        <title level="j">IEEE Transactions on Computers</title>
        <imprint>
          <biblScope type="volume">59</biblScope>
          <biblScope type="number">2</biblScope>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <biblScope type="pages">202-217</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid25" type="book" rend="foot" n="footcite:Scalapack97">
      <monogr>
        <title level="m">ScaLAPACK Users' Guide</title>
        <author>
          <persName>
            <foreName>L. S.</foreName>
            <surname>Blackford</surname>
            <initial>L. S.</initial>
          </persName>
          <persName key="imara-2008-id18673">
            <foreName>J.</foreName>
            <surname>Choi</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>A.</foreName>
            <surname>Cleary</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>E.</foreName>
            <surname>D'Azevedo</surname>
            <initial>E.</initial>
          </persName>
          <persName>
            <foreName>J.</foreName>
            <surname>Demmel</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>I.</foreName>
            <surname>Dhillon</surname>
            <initial>I.</initial>
          </persName>
          <persName>
            <foreName>Jack</foreName>
            <surname>Dongarra</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>S.</foreName>
            <surname>Hammarling</surname>
            <initial>S.</initial>
          </persName>
          <persName key="cristal-2005-id18425">
            <foreName>G.</foreName>
            <surname>Henry</surname>
            <initial>G.</initial>
          </persName>
          <persName>
            <foreName>A.</foreName>
            <surname>Petitet</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>K.</foreName>
            <surname>Stanley</surname>
            <initial>K.</initial>
          </persName>
          <persName>
            <foreName>D.</foreName>
            <surname>Walker</surname>
            <initial>D.</initial>
          </persName>
          <persName>
            <foreName>R. C.</foreName>
            <surname>Whaley</surname>
            <initial>R. C.</initial>
          </persName>
        </author>
        <imprint>
          <publisher>
            <orgName>SIAM</orgName>
          </publisher>
          <dateStruct>
            <year>1997</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid24" type="techreport" rend="foot" n="footcite:lawn41">
      <monogr>
        <title level="m">Installation Guide for LAPACK</title>
        <author>
          <persName>
            <foreName>Susan</foreName>
            <surname>Blackford</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Jack</foreName>
            <surname>Dongarra</surname>
            <initial>J.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">41</biblScope>
          <publisher>
            <orgName type="institution">LAPACK Working Note</orgName>
          </publisher>
          <dateStruct>
            <month>June</month>
            <year>1999</year>
          </dateStruct>
        </imprint>
      </monogr>
      <note type="bnote">originally released March 1992</note>
      <note type="typdoc">Technical report</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid6" type="booklet" rend="foot" n="footcite:bluewatersdec12">
      <monogr>
        <title level="m">Blue Waters Newsletter</title>
        <imprint>
          <dateStruct>
            <month>dec</month>
            <year>2012</year>
          </dateStruct>
          <ref xlink:href="http://cgi.ncsa.illinois.edu/BlueWaters/pdfs/bw-newsletter-1212.pdf" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>cgi.<allowbreak/>ncsa.<allowbreak/>illinois.<allowbreak/>edu/<allowbreak/>BlueWaters/<allowbreak/>pdfs/<allowbreak/>bw-newsletter-1212.<allowbreak/>pdf</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid19" type="misc" rend="foot" n="footcite:bluewatersdata">
      <monogr>
        <title level="m">Blue Waters Resources</title>
        <imprint>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="https://bluewaters.ncsa.illinois.edu/data" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>bluewaters.<allowbreak/>ncsa.<allowbreak/>illinois.<allowbreak/>edu/<allowbreak/>data</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid1" type="misc" rend="foot" n="footcite:boinc">
      <monogr>
        <title level="m">The BOINC project</title>
        <imprint>
          <dateStruct>
            <year>2013</year>
          </dateStruct>
          <ref xlink:href="http://boinc.berkeley.edu/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>boinc.<allowbreak/>berkeley.<allowbreak/>edu/</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid26" type="article" rend="foot" n="footcite:Buttari2008">
      <analytic>
        <title level="a">Parallel tiled QR factorization for multicore architectures</title>
        <author>
          <persName key="graal-2008-id18788">
            <foreName>Alfredo</foreName>
            <surname>Buttari</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>Julien</foreName>
            <surname>Langou</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Jakub</foreName>
            <surname>Kurzak</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Jack</foreName>
            <surname>Dongarra</surname>
            <initial>J.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">Concurrency: Practice and Experience</title>
        <imprint>
          <biblScope type="volume">20</biblScope>
          <biblScope type="number">13</biblScope>
          <dateStruct>
            <year>2008</year>
          </dateStruct>
          <biblScope type="pages">1573-1590</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid14" type="inproceedings" rend="foot" n="footcite:pow3ICPP">
      <analytic>
        <title level="a">Multiprocessor energy-efficient scheduling for real-time tasks</title>
        <author>
          <persName>
            <foreName>J.-J.</foreName>
            <surname>Chen</surname>
            <initial>J.-J.</initial>
          </persName>
          <persName>
            <foreName>T.-W.</foreName>
            <surname>Kuo</surname>
            <initial>T.-W.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">ICPP'05, the Int. Conference on Parallel Processing</title>
        <imprint>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">13–20</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid29" type="inproceedings" rend="foot" n="footcite:6267853">
      <identifiant type="doi" value="10.1109/IPDPS.2012.53"/>
      <analytic>
        <title level="a">Hybrid Static/dynamic Scheduling for Already Optimized Dense Matrix Factorization</title>
        <author>
          <persName key="grand-large-2008-id18846">
            <foreName>S.</foreName>
            <surname>Donfack</surname>
            <initial>S.</initial>
          </persName>
          <persName key="sage-2005-id18153">
            <foreName>Laura</foreName>
            <surname>Grigori</surname>
            <initial>L.</initial>
          </persName>
          <persName>
            <foreName>W.D.</foreName>
            <surname>Gropp</surname>
            <initial>W.</initial>
          </persName>
          <persName>
            <foreName>L. V.</foreName>
            <surname>Kale</surname>
            <initial>L. V.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Parallel Distributed Processing Symposium (IPDPS), 2012 IEEE 26th International</title>
        <imprint>
          <dateStruct>
            <year>2012</year>
          </dateStruct>
          <biblScope type="pages">496-507</biblScope>
          <ref xlink:href="http://dx.doi.org/10.1109/IPDPS.2012.53" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>dx.<allowbreak/>doi.<allowbreak/>org/<allowbreak/>10.<allowbreak/>1109/<allowbreak/>IPDPS.<allowbreak/>2012.<allowbreak/>53</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid9" type="article" rend="foot" n="footcite:j103">
      <analytic>
        <title level="a">Revisiting Matrix Product on Master-Worker Platforms</title>
        <author>
          <persName>
            <foreName>Jack</foreName>
            <surname>Dongarra</surname>
            <initial>J.</initial>
          </persName>
          <persName key="graal-2005-id18500">
            <foreName>Jean-François</foreName>
            <surname>Pineau</surname>
            <initial>J.-F.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName>
            <foreName>Zhiao</foreName>
            <surname>Shi</surname>
            <initial>Z.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">International Journal of Foundations of Computer Science</title>
        <imprint>
          <biblScope type="volume">19</biblScope>
          <biblScope type="number">6</biblScope>
          <dateStruct>
            <year>2008</year>
          </dateStruct>
          <biblScope type="pages">1317-1336</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid10" type="inproceedings" rend="foot" n="footcite:c136">
      <analytic>
        <title level="a">Matrix Product on Heterogeneous Master-Worker Platforms</title>
        <author>
          <persName>
            <foreName>Jack</foreName>
            <surname>Dongarra</surname>
            <initial>J.</initial>
          </persName>
          <persName key="graal-2005-id18500">
            <foreName>Jean-François</foreName>
            <surname>Pineau</surname>
            <initial>J.-F.</initial>
          </persName>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">13th ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming</title>
        <loc>Salt Lake City, Utah</loc>
        <imprint>
          <dateStruct>
            <month>February</month>
            <year>2008</year>
          </dateStruct>
          <biblScope type="pages">53–62</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid21" type="article" rend="foot" n="footcite:dure:83">
      <analytic>
        <title level="a">The multifrontal solution of indefinite sparse symmetric linear systems</title>
        <author>
          <persName key="hiepacs-2009-id59582">
            <foreName>Iain S.</foreName>
            <surname>Duff</surname>
            <initial>I. S.</initial>
          </persName>
          <persName>
            <foreName>John K.</foreName>
            <surname>Reid</surname>
            <initial>J. K.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">"ACM Transactions on Mathematical Software"</title>
        <imprint>
          <biblScope type="volume">9</biblScope>
          <dateStruct>
            <year>1983</year>
          </dateStruct>
          <biblScope type="pages">302-325</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid22" type="article" rend="foot" n="footcite:dure:84">
      <analytic>
        <title level="a">The multifrontal solution of unsymmetric sets of linear systems</title>
        <author>
          <persName key="hiepacs-2009-id59582">
            <foreName>Iain S.</foreName>
            <surname>Duff</surname>
            <initial>I. S.</initial>
          </persName>
          <persName>
            <foreName>John K.</foreName>
            <surname>Reid</surname>
            <initial>J. K.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">SIAM Journal on Scientific and Statistical Computing</title>
        <imprint>
          <biblScope type="volume">5</biblScope>
          <dateStruct>
            <year>1984</year>
          </dateStruct>
          <biblScope type="pages">633-641</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid57" type="article" rend="foot" n="footcite:eili:05">
      <analytic>
        <title level="a">The theory of elimination trees for sparse unsymmetric matrices</title>
        <author>
          <persName>
            <foreName>Stanley C.</foreName>
            <surname>Eisenstat</surname>
            <initial>S. C.</initial>
          </persName>
          <persName>
            <foreName>Joseph W. H.</foreName>
            <surname>Liu</surname>
            <initial>J. W. H.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">SIAM Journal on Matrix Analysis and Applications</title>
        <imprint>
          <biblScope type="volume">26</biblScope>
          <biblScope type="number">3</biblScope>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">686–705</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid58" type="article" rend="foot" n="footcite:eili:08">
      <analytic>
        <title level="a">Algorithmic aspects of elimination trees for sparse unsymmetric matrices</title>
        <author>
          <persName>
            <foreName>Stanley C.</foreName>
            <surname>Eisenstat</surname>
            <initial>S. C.</initial>
          </persName>
          <persName>
            <foreName>Joseph W. H.</foreName>
            <surname>Liu</surname>
            <initial>J. W. H.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">SIAM Journal on Matrix Analysis and Applications</title>
        <imprint>
          <biblScope type="volume">29</biblScope>
          <biblScope type="number">4</biblScope>
          <dateStruct>
            <year>2008</year>
          </dateStruct>
          <biblScope type="pages">1363–1381</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid7" type="misc" rend="foot" n="footcite:DOEFaultManagement">
      <monogr>
        <title level="m">Final report of the Department of Energy Fault Management Workshop</title>
        <imprint>
          <dateStruct>
            <month>December</month>
            <year>2012</year>
          </dateStruct>
          <ref xlink:href="http://science.energy.gov/~/media/ascr/pdf/program-documents/docs/FaultManagement-wrkshpRpt-v4-final.pdf" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>science.<allowbreak/>energy.<allowbreak/>gov/<allowbreak/>~/<allowbreak/>media/<allowbreak/>ascr/<allowbreak/>pdf/<allowbreak/>program-documents/<allowbreak/>docs/<allowbreak/>FaultManagement-wrkshpRpt-v4-final.<allowbreak/>pdf</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid20" type="inproceedings" rend="foot" n="footcite:ca-gauss-sc08">
      <analytic>
        <title level="a">Communication avoiding Gaussian elimination</title>
        <author>
          <persName key="sage-2005-id18153">
            <foreName>Laura</foreName>
            <surname>Grigori</surname>
            <initial>L.</initial>
          </persName>
          <persName>
            <foreName>James W.</foreName>
            <surname>Demmel</surname>
            <initial>J. W.</initial>
          </persName>
          <persName key="grand-large-2007-id18580">
            <foreName>Hua</foreName>
            <surname>Xiang</surname>
            <initial>H.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of the 2008 ACM/IEEE conference on Supercomputing</title>
        <loc>Piscataway, NJ, USA</loc>
        <title level="s">SC '08</title>
        <imprint>
          <publisher>
            <orgName>IEEE Press</orgName>
          </publisher>
          <dateStruct>
            <year>2008</year>
          </dateStruct>
          <biblScope type="pages">29:1</biblScope>
          <ref xlink:href="http://dl.acm.org/citation.cfm?id=1413370.1413400" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>dl.<allowbreak/>acm.<allowbreak/>org/<allowbreak/>citation.<allowbreak/>cfm?id=1413370.<allowbreak/>1413400</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid28" type="inproceedings" rend="foot" n="footcite:Hadri_ipdps_2010">
      <analytic>
        <title level="a">Tile QR Factorization with Parallel Panel Processing for Multicore Architectures</title>
        <author>
          <persName>
            <foreName>Bilel</foreName>
            <surname>Hadri</surname>
            <initial>B.</initial>
          </persName>
          <persName>
            <foreName>Hatem</foreName>
            <surname>Ltaief</surname>
            <initial>H.</initial>
          </persName>
          <persName key="graal-2005-id18388">
            <foreName>Emmanuel</foreName>
            <surname>Agullo</surname>
            <initial>E.</initial>
          </persName>
          <persName>
            <foreName>Jack</foreName>
            <surname>Dongarra</surname>
            <initial>J.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">IPDPS'10, the 24st IEEE Int. Parallel and Distributed Processing Symposium</title>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid23" type="article" rend="foot" n="footcite:liu:92">
      <analytic>
        <title level="a">The multifrontal method for sparse matrix solution: Theory and Practice</title>
        <author>
          <persName>
            <foreName>Joseph W. H.</foreName>
            <surname>Liu</surname>
            <initial>J. W. H.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">SIAM Review</title>
        <imprint>
          <biblScope type="volume">34</biblScope>
          <dateStruct>
            <year>1992</year>
          </dateStruct>
          <biblScope type="pages">82–109</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid18" type="article" rend="foot" n="footcite:Melhem03CP">
      <analytic>
        <title level="a">The Interplay of Power Management and Fault Recovery in Real-Time Systems</title>
        <author>
          <persName>
            <foreName>Rami</foreName>
            <surname>Melhem</surname>
            <initial>R.</initial>
          </persName>
          <persName>
            <foreName>Daniel</foreName>
            <surname>Mossé</surname>
            <initial>D.</initial>
          </persName>
          <persName>
            <foreName>Elmootazbellah</foreName>
            <surname>Elnozahy</surname>
            <initial>E.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">IEEE Transactions on Computers</title>
        <imprint>
          <biblScope type="volume">53</biblScope>
          <biblScope type="number">2</biblScope>
          <dateStruct>
            <year>2004</year>
          </dateStruct>
          <biblScope type="pages">217-231</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid16" type="inproceedings" rend="foot" n="footcite:Oliner04">
      <analytic>
        <title level="a">Fault-aware job scheduling for bluegene/l systems</title>
        <author>
          <persName>
            <foreName>A. J.</foreName>
            <surname>Oliner</surname>
            <initial>A. J.</initial>
          </persName>
          <persName>
            <foreName>R. K.</foreName>
            <surname>Sahoo</surname>
            <initial>R. K.</initial>
          </persName>
          <persName>
            <foreName>J. E.</foreName>
            <surname>Moreira</surname>
            <initial>J. E.</initial>
          </persName>
          <persName>
            <foreName>M.</foreName>
            <surname>Gupta</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>A.</foreName>
            <surname>Sivasubramaniam</surname>
            <initial>A.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">IPDPS'04, the IEEE Int. Parallel and Distributed Processing Symposium</title>
        <imprint>
          <dateStruct>
            <year>2004</year>
          </dateStruct>
          <biblScope type="pages">64–73</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid27" type="article" rend="foot" n="footcite:Quintana:2009">
      <analytic>
        <title level="a">Programming Matrix Algorithms-by-Blocks for Thread-Level Parallelism</title>
        <author>
          <persName>
            <foreName>G.</foreName>
            <surname>Quintana-Ortí</surname>
            <initial>G.</initial>
          </persName>
          <persName>
            <foreName>E.S.</foreName>
            <surname>Quintana-Ortí</surname>
            <initial>E.</initial>
          </persName>
          <persName>
            <foreName>R. A.</foreName>
            <surname>van de Geijn</surname>
            <initial>R. A.</initial>
          </persName>
          <persName>
            <foreName>F. G. Van</foreName>
            <surname>Zee</surname>
            <initial>F. G. V.</initial>
          </persName>
          <persName>
            <foreName>Ernie</foreName>
            <surname>Chan</surname>
            <initial>E.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">ACM Transactions on Mathematical Software</title>
        <imprint>
          <biblScope type="volume">36</biblScope>
          <biblScope type="number">3</biblScope>
          <dateStruct>
            <year>2009</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid11" type="incollection" rend="foot" n="footcite:c149">
      <analytic>
        <title level="a">Algorithmic Issues in Grid Computing</title>
        <author>
          <persName key="graal-2005-id18220">
            <foreName>Yves</foreName>
            <surname>Robert</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="graal-2005-id18145">
            <foreName>Frédéric</foreName>
            <surname>Vivien</surname>
            <initial>F.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Algorithms and Theory of Computation Handbook</title>
        <imprint>
          <publisher>
            <orgName>Chapman and Hall/CRC Press</orgName>
          </publisher>
          <dateStruct>
            <year>2009</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid5" type="misc" rend="foot" n="footcite:DarpaExaResilience">
      <monogr>
        <title level="m">System Resilience at Extreme Scale: white paper</title>
        <imprint>
          <dateStruct>
            <year>2008</year>
          </dateStruct>
          <ref xlink:href="http://institute.lanl.gov/resilience/docs/IBM%20Mootaz%20White%20Paper%20System%20Resilience.pdf" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>institute.<allowbreak/>lanl.<allowbreak/>gov/<allowbreak/>resilience/<allowbreak/>docs/<allowbreak/>IBM%20Mootaz%20White%20Paper%20System%20Resilience.<allowbreak/>pdf</ref>
        </imprint>
      </monogr>
      <note type="bnote">DARPA</note>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid3" type="misc" rend="foot" n="footcite:top500nov11">
      <monogr>
        <title level="m">Top500 List - November 2011</title>
        <imprint>
          <dateStruct>
            <year>2011</year>
          </dateStruct>
          <ref xlink:href="http://www.top500.org/list/2011/11/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>www.<allowbreak/>top500.<allowbreak/>org/<allowbreak/>list/<allowbreak/>2011/<allowbreak/>11/</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid0" type="misc" rend="foot" n="footcite:top500nov12">
      <monogr>
        <title level="m">Top500 List - November 2012</title>
        <imprint>
          <dateStruct>
            <year>2012</year>
          </dateStruct>
          <ref xlink:href="http://www.top500.org/list/2012/11/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>www.<allowbreak/>top500.<allowbreak/>org/<allowbreak/>list/<allowbreak/>2012/<allowbreak/>11/</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid4" type="inproceedings" rend="foot" n="footcite:6264677">
      <identifiant type="doi" value="10.1109/DSNW.2012.6264677"/>
      <analytic>
        <title level="a">A scalable double in-memory checkpoint and restart scheme towards exascale</title>
        <author>
          <persName>
            <foreName>Gengbin</foreName>
            <surname>Zheng</surname>
            <initial>G.</initial>
          </persName>
          <persName>
            <foreName>Xiang</foreName>
            <surname>Ni</surname>
            <initial>X.</initial>
          </persName>
          <persName>
            <foreName>L. V.</foreName>
            <surname>Kale</surname>
            <initial>L. V.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Dependable Systems and Networks Workshops (DSN-W)</title>
        <imprint>
          <dateStruct>
            <year>2012</year>
          </dateStruct>
          <ref xlink:href="http://dx.doi.org/10.1109/DSNW.2012.6264677" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>dx.<allowbreak/>doi.<allowbreak/>org/<allowbreak/>10.<allowbreak/>1109/<allowbreak/>DSNW.<allowbreak/>2012.<allowbreak/>6264677</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="roma-2013-bid15" type="inproceedings" rend="foot" n="footcite:Zhu04EEM">
      <analytic>
        <title level="a">The effects of energy management on reliability in real-time embedded systems</title>
        <author>
          <persName>
            <foreName>Dakai</foreName>
            <surname>Zhu</surname>
            <initial>D.</initial>
          </persName>
          <persName>
            <foreName>Rami</foreName>
            <surname>Melhem</surname>
            <initial>R.</initial>
          </persName>
          <persName>
            <foreName>Daniel</foreName>
            <surname>Mossé</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proc. of IEEE/ACM Int. Conf. on Computer-Aided Design (ICCAD)</title>
        <imprint>
          <dateStruct>
            <year>2004</year>
          </dateStruct>
          <biblScope type="pages">35–40</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
  </biblio>
</raweb>
