<?xml version="1.0" encoding="utf-8"?>
<raweb xmlns:xlink="http://www.w3.org/1999/xlink" xml:lang="en" year="2018">
  <identification id="links" isproject="true">
    <shortname>LINKS</shortname>
    <projectName>Linking Dynamic Data</projectName>
    <theme-de-recherche>Data and Knowledge Representation and Processing</theme-de-recherche>
    <domaine-de-recherche>Perception, Cognition and Interaction</domaine-de-recherche>
    <urlTeam>http://team.inria.fr/links/</urlTeam>
    <structure_exterieure type="Labs">
      <libelle>Centre de Recherche en Informatique, Signal et Automatique de Lille</libelle>
    </structure_exterieure>
    <structure_exterieure type="Organism">
      <libelle>CNRS</libelle>
    </structure_exterieure>
    <structure_exterieure type="Organism">
      <libelle>Université Charles de Gaulle (Lille 3)</libelle>
    </structure_exterieure>
    <structure_exterieure type="Organism">
      <libelle>Université des sciences et technologies de Lille (Lille 1)</libelle>
    </structure_exterieure>
    <header_dates_team>Creation of the Team: 2013 January 01, updated into Project-Team: 2016 June 01</header_dates_team>
    <LeTypeProjet>Project-Team</LeTypeProjet>
    <keywordsSdN>
      <term>A2.1. - Programming Languages</term>
      <term>A2.1.1. - Semantics of programming languages</term>
      <term>A2.1.4. - Functional programming</term>
      <term>A2.1.6. - Concurrent programming</term>
      <term>A2.4. - Formal method for verification, reliability, certification</term>
      <term>A2.4.1. - Analysis</term>
      <term>A2.4.2. - Model-checking</term>
      <term>A2.4.3. - Proofs</term>
      <term>A3.1. - Data</term>
      <term>A3.1.1. - Modeling, representation</term>
      <term>A3.1.2. - Data management, quering and storage</term>
      <term>A3.1.3. - Distributed data</term>
      <term>A3.1.4. - Uncertain data</term>
      <term>A3.1.5. - Control access, privacy</term>
      <term>A3.1.6. - Query optimization</term>
      <term>A3.1.7. - Open data</term>
      <term>A3.1.8. - Big data (production, storage, transfer)</term>
      <term>A3.1.9. - Database</term>
      <term>A3.2.1. - Knowledge bases</term>
      <term>A3.2.2. - Knowledge extraction, cleaning</term>
      <term>A3.2.3. - Inference</term>
      <term>A3.2.4. - Semantic Web</term>
      <term>A4.7. - Access control</term>
      <term>A4.8. - Privacy-enhancing technologies</term>
      <term>A7. - Theory of computation</term>
      <term>A7.2. - Logic in Computer Science</term>
      <term>A9.1. - Knowledge</term>
      <term>A9.2. - Machine learning</term>
      <term>A9.7. - AI algorithmics</term>
      <term>A9.8. - Reasoning</term>
    </keywordsSdN>
    <keywordsSecteurs>
      <term>B6.1. - Software industry</term>
      <term>B6.3.1. - Web</term>
      <term>B6.3.4. - Social Networks</term>
      <term>B6.5. - Information systems</term>
      <term>B9.5.1. - Computer science</term>
      <term>B9.5.6. - Data science</term>
      <term>B9.10. - Privacy</term>
    </keywordsSecteurs>
    <UR name="Lille"/>
  </identification>
  <team id="uid1">
    <person key="links-2018-idp158976">
      <firstname>Joachim</firstname>
      <lastname>Niehren</lastname>
      <categoryPro>Chercheur</categoryPro>
      <research-centre>Lille</research-centre>
      <moreinfo>Team leader, Inria, Senior Researcher</moreinfo>
      <hdr>oui</hdr>
    </person>
    <person key="links-2018-idp161888">
      <firstname>Iovka</firstname>
      <lastname>Boneva</lastname>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Lille</research-centre>
      <moreinfo>Université de Lille, Associate Professor</moreinfo>
    </person>
    <person key="links-2018-idp164416">
      <firstname>Florent</firstname>
      <lastname>Capelli</lastname>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Lille</research-centre>
      <moreinfo>Université de Lille, Associate Professor</moreinfo>
    </person>
    <person key="links-2018-idp166944">
      <firstname>Aurélien</firstname>
      <lastname>Lemay</lastname>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Lille</research-centre>
      <moreinfo>Université de Lille, Associate Professor</moreinfo>
      <hdr>oui</hdr>
    </person>
    <person key="links-2018-idp169856">
      <firstname>Charles</firstname>
      <lastname>Paperman</lastname>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Lille</research-centre>
      <moreinfo>Université de Lille, Associate Professor</moreinfo>
    </person>
    <person key="links-2018-idp172384">
      <firstname>Sylvain</firstname>
      <lastname>Salvati</lastname>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Lille</research-centre>
      <moreinfo>Université de Lille, Professor</moreinfo>
      <hdr>oui</hdr>
    </person>
    <person key="links-2018-idp175280">
      <firstname>Slawomir</firstname>
      <lastname>Staworko</lastname>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Lille</research-centre>
      <moreinfo>Université de Lille, Associate Professor</moreinfo>
      <hdr>oui</hdr>
    </person>
    <person key="links-2018-idp178192">
      <firstname>Sophie</firstname>
      <lastname>Tison</lastname>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Lille</research-centre>
      <moreinfo>Université de Lille, Professor</moreinfo>
      <hdr>oui</hdr>
    </person>
    <person key="links-2018-idp181088">
      <firstname>Nicolas</firstname>
      <lastname>Bacquey</lastname>
      <categoryPro>PostDoc</categoryPro>
      <research-centre>Lille</research-centre>
      <moreinfo>Inria, until Aug 2018</moreinfo>
    </person>
    <person key="links-2018-idp183552">
      <firstname>Bruno</firstname>
      <lastname>Guillon</lastname>
      <categoryPro>PostDoc</categoryPro>
      <research-centre>Lille</research-centre>
      <moreinfo>Inria, from Nov 2018</moreinfo>
    </person>
    <person key="links-2018-idp186016">
      <firstname>Nicolas</firstname>
      <lastname>Crosetti</lastname>
      <categoryPro>PhD</categoryPro>
      <research-centre>Lille</research-centre>
      <moreinfo>Inria, from Oct 2018</moreinfo>
    </person>
    <person key="links-2018-idp188448">
      <firstname>Dimitri</firstname>
      <lastname>Gallois</lastname>
      <categoryPro>PhD</categoryPro>
      <research-centre>Lille</research-centre>
      <moreinfo>Université de Lille</moreinfo>
    </person>
    <person key="links-2018-idp190912">
      <firstname>Paul</firstname>
      <lastname>Gallot</lastname>
      <categoryPro>PhD</categoryPro>
      <research-centre>Lille</research-centre>
      <moreinfo>Inria</moreinfo>
    </person>
    <person key="links-2018-idp193344">
      <firstname>Jose Martin</firstname>
      <lastname>Lozano</lastname>
      <categoryPro>PhD</categoryPro>
      <research-centre>Lille</research-centre>
      <moreinfo>Université de Lille</moreinfo>
    </person>
    <person key="links-2018-idp195808">
      <firstname>Momar</firstname>
      <lastname>Sakho</lastname>
      <categoryPro>PhD</categoryPro>
      <research-centre>Lille</research-centre>
      <moreinfo>Inria</moreinfo>
    </person>
    <person key="links-2018-idp198240">
      <firstname>Jeremie</firstname>
      <lastname>Dusart</lastname>
      <categoryPro>Technique</categoryPro>
      <research-centre>Lille</research-centre>
      <moreinfo>Inria</moreinfo>
    </person>
    <person key="links-2018-idp200704">
      <firstname>Nathalie</firstname>
      <lastname>Bonte</lastname>
      <categoryPro>Assistant</categoryPro>
      <research-centre>Lille</research-centre>
      <moreinfo>Inria</moreinfo>
    </person>
    <person key="links-2018-idp203168">
      <firstname>Rustam</firstname>
      <lastname>Azimov</lastname>
      <categoryPro>Visiteur</categoryPro>
      <research-centre>Lille</research-centre>
      <moreinfo>Saint Petersburg University, from Aug 2018 until Nov 2018</moreinfo>
    </person>
    <person key="links-2018-idp205680">
      <firstname>Herminio</firstname>
      <lastname>Garcia Gonzalez</lastname>
      <categoryPro>Visiteur</categoryPro>
      <research-centre>Lille</research-centre>
      <moreinfo>Oviedo University, from Sep 2018 until Dec 2018</moreinfo>
    </person>
  </team>
  <presentation id="uid2">
    <bodyTitle>Overall Objectives</bodyTitle>
    <subsection id="uid3" level="1">
      <bodyTitle>Overall Objectives</bodyTitle>
      <p>We will develop algorithms for answering
logical querying on heterogeneous linked data collections in hybrid formats,
distributed programming languages for managing dynamic linked data
collections and workflows based on queries and mappings, and symbolic
machine learning algorithms that can link datasets by inferring appropriate
queries and mappings.</p>
    </subsection>
    <subsection id="uid4" level="1">
      <bodyTitle>Presentation</bodyTitle>
      <p>The following three paragraphs summarize our main research objectives.</p>
      <descriptionlist>
        <label>
          <i>Querying Heterogeneous Linked Data</i>
        </label>
        <li id="uid5">
          <p noindent="true"> We will develop new kinds of schema mappings for semi-structured
datasets in hybrid formats including graph databases, RDF collections, and
relational databases. These induce recursive queries on linked data collections
for which we will investigate evaluation algorithms, containment problems,
and concrete applications.</p>
        </li>
        <label>
          <i>Managing Dynamic Linked Data</i>
        </label>
        <li id="uid6">
          <p noindent="true"> In order to manage dynamic linked
data collections and workflows, we will develop distributed data-centric
programming languages with streams and parallelism, based on novel algorithms for
incremental query answering, study the propagation of updates of dynamic data
through schema mappings, and investigate static analysis methods for
linked data workflows.</p>
        </li>
        <label>
          <i>Linking Data Graphs</i>
        </label>
        <li id="uid7">
          <p noindent="true"> Finally, we will develop symbolic
machine learning algorithms, for inferring queries and
mappings between linked data collections in various graphs formats
from annotated examples.</p>
        </li>
      </descriptionlist>
    </subsection>
  </presentation>
  <fondements id="uid8">
    <bodyTitle>Research Program</bodyTitle>
    <subsection id="uid9" level="1">
      <bodyTitle>Background</bodyTitle>
      <p>The main objective of <span class="smallcap" align="left">Links</span> is to develop methods for
querying and managing linked data collections. Even though
open linked data is the most prominent example, we will focus
on hybrid linked data collections, which are collections of
semi-structured datasets in hybrid formats: graph-based,
<span class="smallcap" align="left">rdf</span>, relational, and <span class="smallcap" align="left">NoSQL</span>. The elements of these datasets
may be linked, either by pointers or by additional relations
between the elements of the different datasets, for instance
the “same-as” or “member-of” relations as in <span class="smallcap" align="left">rdf</span>.</p>
      <p>The advantage of traditional data models
is that there exist powerful querying methods and technologies that one
might want to preserve. In particular, they come with
powerful schemas that constraint the possible manners in
which knowledge is represented to a finite number
of patterns. The exhaustiveness of these patterns is
essential for writing of queries that cover all possible cases.
Pattern violations are excluded by schema validation.
In contrast, <span class="smallcap" align="left">rdf</span> schema languages such as <span class="smallcap" align="left">rdfs</span> can only enrich
the relations of a dataset by new relations, which also helps for
query writing, but which cannot constraint the number of possible
patterns, so that they do not come with any reasonable notion
of schema validation.</p>
      <p>The main weakness of traditional formats, however, is that they do not scale
to large data collections as stored on the Web, while the <span class="smallcap" align="left">rdf</span> data models
scales well to very big collections such as linked open data. Therefore, our
objective is to study mixed data collections, some of which may be in <span class="smallcap" align="left">rdf</span> format, in which we can lift the advantages of smaller datasets in traditional
formats to much larger linked data collections. Such data collections are typically distributed over the internet, that some data sources
have rigid query facilities that cannot be easily adapted or extended.</p>
      <p>The main assumption that we impose in order to enable
the logical approach, is that the given linked data
collection must be correct in most dimensions. This means that
all datasets are well-formed with respect to their available
constraints and schemas, and clean with respect to the data values in
most of the components of the relations in the datasets.
One of the challenges is to integrate good quality <span class="smallcap" align="left">rdf</span> datasets into
this setting, another is to clean the incorrect data in those
dimensions that are less proper. It remains to be investigated
in how far these assumptions can be maintained in realistic
applications, and how much they can be weakened otherwise.</p>
      <p>For querying linked data collections,
the main problems are to resolve the heterogeneity of data formats and schemas,
to understand the efficiency and expressiveness of recursive queries,
that can follow links repeatedly, to answer queries under constraints,
and to optimize query answering algorithms based on static analysis.
When linked data is dynamically created, exchanged, or updated,
the problems are how to process linked data incrementally, and how to manage
linked data collections that change dynamically. In any case (static
and dynamic) one needs to find appropriate schema mappings for linking
semi-structured datasets. We will study how to automatize parts of
this search process by developing symbolic machine learning techniques for
linked data collections.</p>
    </subsection>
    <subsection id="uid10" level="1">
      <bodyTitle>Querying Heterogeneous
Linked Data</bodyTitle>
      <p>Our main objective is to query collections of linked datasets. In the static setting, we consider
two kinds of links: explicit links between elements of the datasets, such as equalities
or pointers, and logical links between relations of different datasets such as schema mappings.
In the dynamic setting, we permit a third kind of links that point to
“intentional” relations computable from a description, such
as the application of a Web service or the application of
a schema mapping.</p>
      <p>We believe that collections of linked datasets are usually too big to ensure a global
knowledge of all datasets. Therefore, schema mappings and constraints should
remain between pairs of datasets. Our main goal is to be able to pose a query on a collection of
datasets, while accounting for the possible recursive effects of schema mappings.
For illustration, consider a ring of datasets <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>D</mi><mn>1</mn></msub></math></formula>, <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>D</mi><mn>2</mn></msub></math></formula>, <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>D</mi><mn>3</mn></msub></math></formula>
linked by schema mappings <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>M</mi><mn>1</mn></msub></math></formula>, <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>M</mi><mn>2</mn></msub></math></formula>, <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>M</mi><mn>3</mn></msub></math></formula> that tell us how to
complete a database <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>D</mi><mi>i</mi></msub></math></formula> by new elements from the next database in the cycle.</p>
      <p>The mappings <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>M</mi><mi>i</mi></msub></math></formula> induce three intentional datasets <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>I</mi><mn>1</mn></msub></math></formula>, <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>I</mi><mn>2</mn></msub></math></formula>, and <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>I</mi><mn>3</mn></msub></math></formula>, such
that <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>I</mi><mi>i</mi></msub></math></formula> contains all elements from <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>D</mi><mi>i</mi></msub></math></formula> and all elements
implied by <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>M</mi><mi>i</mi></msub></math></formula> from the next intentional dataset in the ring:</p>
      <formula type="display">
        <math xmlns="http://www.w3.org/1998/Math/MathML" mode="display" overflow="scroll">
          <mrow>
            <msub>
              <mi>I</mi>
              <mn>1</mn>
            </msub>
            <mo>=</mo>
            <msub>
              <mi>D</mi>
              <mn>1</mn>
            </msub>
            <mo>∪</mo>
            <msub>
              <mi>M</mi>
              <mn>1</mn>
            </msub>
            <mrow>
              <mo>(</mo>
              <msub>
                <mi>I</mi>
                <mn>2</mn>
              </msub>
              <mo>)</mo>
            </mrow>
            <mo>,</mo>
            <mspace width="1.em"/>
            <msub>
              <mi>I</mi>
              <mn>2</mn>
            </msub>
            <mo>=</mo>
            <msub>
              <mi>D</mi>
              <mn>2</mn>
            </msub>
            <mo>∪</mo>
            <msub>
              <mi>M</mi>
              <mn>2</mn>
            </msub>
            <mrow>
              <mo>(</mo>
              <msub>
                <mi>I</mi>
                <mn>3</mn>
              </msub>
              <mo>)</mo>
            </mrow>
            <mo>,</mo>
            <mspace width="1.em"/>
            <msub>
              <mi>I</mi>
              <mn>3</mn>
            </msub>
            <mo>=</mo>
            <msub>
              <mi>D</mi>
              <mn>3</mn>
            </msub>
            <mo>∪</mo>
            <msub>
              <mi>M</mi>
              <mn>3</mn>
            </msub>
            <mrow>
              <mo>(</mo>
              <msub>
                <mi>I</mi>
                <mn>1</mn>
              </msub>
              <mo>)</mo>
            </mrow>
          </mrow>
        </math>
      </formula>
      <p noindent="true">Clearly, the global information collected by the intentional
datasets depends recursively on all three original datasets <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>D</mi><mi>i</mi></msub></math></formula>.
Queries to the global information can now be specified as
standard queries to the intentional databases <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>I</mi><mi>i</mi></msub></math></formula>. However,
we will never materialize the intentional databases <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>I</mi><mi>i</mi></msub></math></formula>.
Instead, we can rewrite queries on one of the intentional datasets <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>I</mi><mi>i</mi></msub></math></formula>
to recursive queries on the union of the original
datasets <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>D</mi><mn>1</mn></msub></math></formula>, <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>D</mi><mn>2</mn></msub></math></formula>, and <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>D</mi><mn>3</mn></msub></math></formula> with their links and relations. Therefore, a query answering algorithm is needed
for recursive queries, that chases the “links” between the <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>D</mi><mi>i</mi></msub></math></formula> in order to
compute the part of <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><msub><mi>I</mi><mi>i</mi></msub></math></formula> needed for the purpose of query answering.</p>
      <p>This illustrates that we must account for the graph data models when dealing with linked data collections whose elements are
linked, and that query languages for such graphs must provide
recursion in order to chase links. Therefore, we will
have to study graph databases with recursive queries,
such as <span class="smallcap" align="left">rdf</span> graphs with <span class="smallcap" align="left">sparql</span> queries, but also
other classes of graph databases and queries.</p>
      <p>We study schemas and mappings between datasets with different
kinds of data models
and the complexity of evaluating recursive queries over graphs.
In order to use schema mapping for efficiently querying the different
datasets,
we need to optimize the queries by taking into account the mappings.
Therefore, we will study
static analysis of schema mappings and
recursive queries.
Finally, we develop concrete applications in which our
fundamental techniques can be applied.</p>
    </subsection>
    <subsection id="uid11" level="1">
      <bodyTitle>Managing Dynamic Linked Data</bodyTitle>
      <p>With the quick growth of the information technology on the Web, more
and more Web data gets created dynamically every day, for instance by smartphones,
industrial machines, users of social networks, and all kinds
of sensors. Therefore, large amounts of dynamic data need to
be exchanged and managed by various data-centric web services, such
as online shops, online newspapers, and social networks.</p>
      <p>Dynamic data is often created by the application of some kind
of service on the Web. This kind of data is intentional in the
same spirit as the intentional data specified by the application
of a schema mapping, or the application of some query to the
hidden Web. Therefore, we will consider a third kind of links
in the dynamic setting, that map to intentional data
specified by whatever kind of function application. Such a function
can be defined in data-centric programming languages,
in the style of Active <tt>XML</tt>, <span class="smallcap" align="left">xslt</span>, and <span class="smallcap" align="left">NoSQL</span> languages.</p>
      <p>The dynamicity of data adds a further dimension to the
challenges for linked data collections that we described
before, while all the difficulties remain valid. One of the
new aspects is that intentional data may be produced incrementally,
as for instance when exchanged over data streams. Therefore, one needs
incremental algorithms able to evaluate queries on
incomplete linked data collections, that are extended
or updated incrementally. Note that incremental data
may be produced without end, such as a Twitter stream,
so that one cannot wait for its completion. Instead,
one needs to query and manage dynamic data with
as low latency as possible. Furthermore, all static
analysis problems are to be re-investigated in
the presence of dynamic data.</p>
      <p>Another aspect of dynamic data is distribution over the Web,
and thus parallel processing as in the cloud. This raises
the typical problems coming with data distribution:
huge data sources cannot be moved without very high costs,
while data must be replicated for providing efficient
parallel access. This makes it difficult, if not impossible,
to update replicated data consistently. Therefore, the
consistency assumption has been removed by <span class="smallcap" align="left">NoSQL</span> databases for instance, while parallel algorithmic
is limited to naive parallelization (i.e. map/reduce)
where only few data needs to be exchanged.</p>
      <p>We will investigate incremental query evaluation for
distributed data-centered programming languages
for linked data collections,
dynamic updates as needed for linked data
management,
and static analysis for linked data
workflows.</p>
    </subsection>
    <subsection id="uid12" level="1">
      <bodyTitle>Linking Graphs</bodyTitle>
      <p>When datasets from independent sources are not linked with existing
schema mappings, we would like to investigate symbolic machine learning solutions for
inferring such mappings in order to define meaningful links between
data from separate sources. This problem can be
studied for various kinds of linked data collections. Before
presenting the precise objectives, we will illustrate
our approach on the example of linking data in two independent
graphs: an address book of a research institute containing
detailed personnel information and a (global) bibliographic database
containing information on papers and their authors.</p>
      <p>We remind that a schema allows to identify a collection of types each
grouping objects from the same semantic class e.g., the collection of
all persons in the address book and the collection of all authors in
the bibliography database. As a schema is often lacking or underspecified in graph data models, we intend to investigate inference methods
based on structural similarity of graph fragments used to describe
objects from the same class in a given document e.g., in the
bibliographic database every author has a name and a number of
affiliations, while a paper has a title and a number of
authors. Furthermore, our inference methods will attempt to identify,
for every type, a set of possible keys, where by key we understand a
collection of attributes of an object that uniquely identifies such an
object in its semantic class. For instance, for a person in the
address book two examples of a key are the name of the person and the
office phone number of that person.</p>
      <p>In the next step, we plan to investigate employing existing entity
linkage solutions
to identify pairs of types from different databases whose instances
should be linked using compatible keys. For instance, persons in the
address book should be linked with authors in the bibliographical
database using the name as the compatible key. Linking the same
objects (represented in different ways) in two databases can be viewed
as an instance of a mapping between the two databases. Such mapping
is, however, discriminatory because it typically maps objects from a
specific subset of objects of given types. For instance, the mapping
implied by linking persons in the address book with authors in the
bibliographic database involves in fact researchers, a subgroup of
personnel of the research institute, and authors affiliated with the
research institute. Naturally, a subset of objects of a given type, or
a subtype, can be viewed as a result of a query on the set of all
objects, which on very basic level illustrates how learning data
mappings can be reduced to learning queries.</p>
      <p>While basic mappings link objects of the same type, more general
mappings define how the same type of information is represented in two
different databases. For instance, the email address and the postal
address of an individual may be represented in one way in the address
book and in another way in the bibliographic databases, and naturally,
the query asking for the email address and the postal address of a
person identified by a given name will differ from one database to the
other. While queries used in the context of linking objects of
compatible types are essentially unary, queries used in the context of
linking information are <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>n</mi></math></formula>-ary and we plan to approach inference of
general database mappings by investigating and employing algorithms
for inference of <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>n</mi></math></formula>-ary queries.</p>
      <p>An important goal in this research is elaborating a formal definition
of <i>learnability</i> (feasibility of inference) of a given class of
concepts (schemas of queries). We plan to following the example of
Gold (1967), which requires not only the existence of an
efficient algorithm that infers concepts consistent with the given
input but the ability to infer every concept from the given class with
a sufficiently informative input. Naturally, learnability depends on
two parameters. The first parameter is the class of concepts i.e., a
class of schema and a class of queries, from which the goal concept is
to be inferred. The second parameter is the type of input that an
inference algorithm is given. This can be a set of examples of a
concept e.g., instances of <span class="smallcap" align="left">rdf</span> databases for which we wish to
construct a schema or a selection of nodes that a goal query is to
select. Alternatively, a more general interactive scenario can be used
where the learning algorithm inquires the user about the goal concept
e.g., by asking to indicate whether a given node is to be selected or
not (as membership queries of Angluin (1987)). In general, the richer the input is, the
richer class of concepts can be handled, however, the richer class of
queries is to be handled, the higher computational cost is to be
expected. The primary task is to find a good compromise and identify
classes of concepts that are of high practical value, allow efficient
inference with possibly simple type of input.</p>
      <p>The main open problem for graph-shaped data studied by Links
are how to infer queries, schemas, and schema-mappings for
graph-structured data.</p>
    </subsection>
  </fondements>
  <domaine id="uid13">
    <bodyTitle>Application Domains</bodyTitle>
    <subsection id="uid14" level="1">
      <bodyTitle>Linked Data Integration</bodyTitle>
      <p>There are many contexts in which integrating linked data is interesting.
We advocate here one possible scenario, namely that of integrating business linked data to feed what is called Business Intelligence.
The latter consists of a set of theories and methodologies that transform raw data into meaningful and useful information for business purposes (from Wikipedia).
In the past decade, most of the enterprise data was proprietary, thus residing within the enterprise repository, along with the knowledge derived from that data.
Today's' enterprises and businessmen need to face the problem of information explosion, due to the Internet's ability to rapidly convey large amounts of information throughout the world via end-user applications and tools.
Although linked data collections exist by bridging the gap between enterprise data and external resources, they are not sufficient to
support the various tasks of Business Intelligence. To make a concrete example, concepts in an enterprise repository need to be matched
with concepts in Wikipedia and this can be done via pointers or equalities. However, more complex logical statements (i.e. mappings) need to be conceived to
map a portion of a local database to a portion of an <span class="smallcap" align="left">rdf</span> graph, such as a subgraph in Wikipedia or in a social network, e.g. LinkedIn.
Such mappings would then enrich the amount of knowledge shared within the enterprise and let more complex queries be evaluated.
As an example, businessmen with the aid of business intelligence tools need to make complex sentimental analysis on the potential
clients and for such a reason, such tools must be able to pose complex queries, that exploit the previous logical mappings to
guide their analysis.
Moreover, the external resources may be rapidly evolving thus leading to revisit the current state of business intelligence within the enterprise.
</p>
    </subsection>
    <subsection id="uid15" level="1">
      <bodyTitle>Data Cleaning</bodyTitle>
      <p>The second example of application of our proposal concerns scientists who want to quickly inspect relevant literature and datasets. In such a case, local knowledge that comes from a local repository of publications belonging to a research institute (e.g. HAL) need to be integrated with other Web-based repositories, such as DBLP, Google Scholar, ResearchGate and even Wikipedia. Indeed, the local repository may be incomplete or contain semantic ambiguities, such as mistaken or missing conference venues, mistaken long names for the publication venues and journals, missing explanation of research keywords, and opaque keywords.
We envision a publication management system that exploits both links between database elements, namely pointers to external resources and logical links. The latter can be complex relationships between local portions of data and remote resources, encoded as schema mappings. There are different tasks that such a scenario could entail such as (i) cleaning the errors with links to correct data e.g. via mappings from HAL to DBLP for the publications errors, and via mappings from HAL to Wikipedia for opaque keywords, (ii) thoroughly enrich the list of publications of a given research institute, and (iii) support complex queries on the corrected data combined with logical mappings.</p>
    </subsection>
    <subsection id="uid16" level="1">
      <bodyTitle>Real Time Complex Event Processing</bodyTitle>
      <p>Complex event processing serves for monitoring nested word streams
in real time. Complex event streams are gaining popularity
with social networks such as with Facebook and Twitter, and thus
should be supported by distributed databases on the Web. Since
this is not yet the case, there remains much space
for future industrial transfer related to Links' second axis
on dynamic linked data.
</p>
    </subsection>
  </domaine>
  <highlights id="uid17">
    <bodyTitle>Highlights of the Year</bodyTitle>
    <subsection id="uid18" level="1">
      <bodyTitle>Highlights of the Year</bodyTitle>
      <p>
        <b>Containment for RDF Schemas</b>
      </p>
      <p>The ShEx language for defining RDF schemas was proposed and
developed earlier by the Links team in cooperation with the W3C.
Slawek Staworko et al. now studied the
containment problem for ShEx schemas for RDF documents.
They showed at <b>PODS</b> <ref xlink:href="#links-2018-bid0" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> – the best
database theory conference – that the problem is decidable, but <tt>co-NEXP</tt>-hard. This is
joined work with P. Wieczorek from the University of Wrazlaw.</p>
      <p>
        <b>Foundations of AI: Knowledge Compilation</b>
      </p>
      <p>Florent Capelli et al. showed at
<b>STACS</b> <ref xlink:href="#links-2018-bid1" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> – a top conferences in
theoretical computer science –
a new knowledge compilation procedure for quantified boolean formulas allowing
to decide the satisfiability quantified boolean
formulas with bounded tree width in polynomial time. This can be applied in particular to first-order
database queries with quantifiers. This is joined work with S. Mengel
from the CNRS in Lens.</p>
      <p>
        <b>Foundations of AI: Constrained Topologial Sort</b>
      </p>
      <p>Charles Paperman et al. showed at <b>ICALP</b> <ref xlink:href="#links-2018-bid2" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>
– a top conferences in theoretical computer science –
how to compute efficiently topological sorts of graphs under regular
constraints. The problem was initially introduced in the
context of preferential query answer for uncertain databases,
where on usually wants to sort the query
answers by some preferences, that are known only
partially. It becomes then
crucial to look for total orders on the answer set satisfying regular constraints
that specify the preferences.
Finding such an order for regular constraints was know to
be infeasible in general.
In this article, a class of regular constraints is identified
for which this problem becomes tractable. A (partial)
decidable dichotomy theorem is proven drawing the frontier between
the kind of constraints which are feasible from those which are
not. This is joined work with A. Amarilli from Telecom
Paristech.
</p>
    </subsection>
  </highlights>
  <logiciels id="uid19">
    <bodyTitle>New Software and Platforms</bodyTitle>
    <subsection id="uid20" level="1">
      <bodyTitle>ShEx validator</bodyTitle>
      <p>
        <i>Validation of Shape Expression schemas</i>
      </p>
      <p noindent="true"><span class="smallcap" align="left">Keywords:</span> Data management - RDF</p>
      <p noindent="true"><span class="smallcap" align="left">Functional Description:</span> Shape Expression schemas is a formalism for defining constraints on RDF graphs. This software allows to check whether a graph satisfies a Shape Expressions schema.</p>
      <p><span class="smallcap" align="left">Release Functional Description:</span> ShExJava now uses the Commons RDF API and so support RDF4J, Jena, JSON-LD-Java, OWL API and Apache Clerezza. It can parse ShEx schema in the ShEcC, ShEJ, ShExR formats and can serialize a schema in ShExJ.</p>
      <p>To validate data against a ShExSchema using ShExJava, you have two different algorithms:
- the refine algorithm: compute once and for all the typing for the whole graph
- the recursive algorithm: compute only the typing required to answer a validate(node,ShapeLabel) call and forget the results.</p>
      <simplelist>
        <li id="uid21">
          <p noindent="true">Contact: Iovka Boneva</p>
        </li>
        <li id="uid22">
          <p noindent="true">URL: <ref xlink:href="http://shexjava.lille.inria.fr/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>shexjava.<allowbreak/>lille.<allowbreak/>inria.<allowbreak/>fr/</ref></p>
        </li>
      </simplelist>
    </subsection>
    <subsection id="uid23" level="1">
      <bodyTitle>gMark</bodyTitle>
      <p>
        <i>gMark: schema-driven graph and query generation</i>
      </p>
      <p noindent="true"><span class="smallcap" align="left">Keywords:</span> Semantic Web - Data base</p>
      <p noindent="true"><span class="smallcap" align="left">Functional Description:</span> gMark allow the generation of graph databases and an associated set of query from a schema of the graph.gMark is based on the following principles:
- great flexibility in the schema definition
- ability to generate big size graphs
- ability to generate recursive queries
- ability to generate queries with a desired selectivity</p>
      <simplelist>
        <li id="uid24">
          <p noindent="true">Contact: Aurélien Lemay</p>
        </li>
        <li id="uid25">
          <p noindent="true">URL: <ref xlink:href="https://github.com/graphMark/gmark" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>github.<allowbreak/>com/<allowbreak/>graphMark/<allowbreak/>gmark</ref></p>
        </li>
      </simplelist>
    </subsection>
    <subsection id="uid26" level="1">
      <bodyTitle>SmartHal</bodyTitle>
      <p><span class="smallcap" align="left">Keyword:</span> Bibliography</p>
      <p noindent="true"><span class="smallcap" align="left">Functional Description:</span> SmartHal is a better tool for querying the HAL bibliography database, while is based on Haltool queries. The idea is that a Haltool query returns an XML document that can be queried further. In order to do so, SmartHal provides a new query language. Its queries are conjunctions of Haltool queries (for a list of laboratories or authors) with expressive Boolean queries by which answers of Haltool queries can be refined. These Boolean refinement queries are automatically translated to XQuery and executed by Saxon. A java application for extraction from the command line is available. On top of this, we have build a tool for producing the citation lists for the evaluation report of the LIFL, which can be easily adapter to other Labs.</p>
      <simplelist>
        <li id="uid27">
          <p noindent="true">Contact: Joachim Niehren</p>
        </li>
        <li id="uid28">
          <p noindent="true">URL: <ref xlink:href="http://smarthal.lille.inria.fr/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>smarthal.<allowbreak/>lille.<allowbreak/>inria.<allowbreak/>fr/</ref></p>
        </li>
      </simplelist>
    </subsection>
    <subsection id="uid29" level="1">
      <bodyTitle>QuiXPath</bodyTitle>
      <p><span class="smallcap" align="left">Keywords:</span> XML - NoSQL - Data stream</p>
      <p noindent="true"><span class="smallcap" align="left">Scientific Description:</span> The QuiXPath tools supports a very large fragment of XPath 3.0. The QuiXPath library provides a compiler from QuiXPath to FXP, which is a library for querying XML streams with a fragment of temporal logic.</p>
      <p noindent="true"><span class="smallcap" align="left">Functional Description:</span> QuiXPath is a streaming implementation of XPath 3.0. It can query large XML files without loading the entire file in main memory, while selecting nodes as early as possible.</p>
      <simplelist>
        <li id="uid30">
          <p noindent="true">Contact: Joachim Niehren</p>
        </li>
        <li id="uid31">
          <p noindent="true">URL: <ref xlink:href="https://project.inria.fr/quix-tool-suite/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>project.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>quix-tool-suite/</ref></p>
        </li>
      </simplelist>
    </subsection>
    <subsection id="uid32" level="1">
      <bodyTitle>X-FUN</bodyTitle>
      <p><span class="smallcap" align="left">Keywords:</span> Programming language - Compilers - Functional programming - Transformation - XML</p>
      <p noindent="true"><span class="smallcap" align="left">Functional Description:</span> X-FUN is a core language for implementing various XML, standards in a uniform manner. X-Fun is a higher-order functional programming language for transforming data trees based on node selection queries.</p>
      <simplelist>
        <li id="uid33">
          <p noindent="true">Participants: Joachim Niehren and Pavel Labath</p>
        </li>
        <li id="uid34">
          <p noindent="true">Contact: Joachim Niehren</p>
        </li>
      </simplelist>
    </subsection>
  </logiciels>
  <resultats id="uid35">
    <bodyTitle>New Results</bodyTitle>
    <subsection id="uid36" level="1">
      <bodyTitle>Querying Heterogeneous Linked Data</bodyTitle>
      <subsection id="uid37" level="2">
        <bodyTitle>Data Integration</bodyTitle>
        <p>The PhD project of Lozano on relational to RDF data
integration is progressing under the direction of Boneva, and
Staworko. At <b>AMW</b> <ref xlink:href="#links-2018-bid3" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>
they studied the <i>relational to RDF data exchange problem</i>. They focus in
particular on a preliminary analysis of the consistency problem for
relational to RDF data exchange with target ShEx schema.</p>
      </subsection>
      <subsection id="uid38" level="2">
        <bodyTitle>Schema Validation</bodyTitle>
        <p>Shape Expression Language 2.0 (ShEx) is a language to
describe the vocabulary and the structure of an RDF graph.
It is base on the
notion of shapes, a typing system supporting algebraic operations,
recursive references to other shapes or Boolean combination.</p>
        <p>In their <b>PODS</b> paper <ref xlink:href="#links-2018-bid0" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>,
Staworko studied the <i>containment problem</i> for ShEx
(in cooperation with Wieczorek from Wrazlaw).
Containement is a classical subject for schema-related issue
in database theory. The authors proved that it is decidable
for ShEx-schema, but with a untractable complexity (<tt>co-NEXP</tt>-hard).
They also carefuly craft restriction of ShEx schema to design
tractable-but-still-signifiant fragments.</p>
      </subsection>
    </subsection>
    <subsection id="uid39" level="1">
      <bodyTitle>Managing Dynamic Linked Data</bodyTitle>
      <subsection id="uid40" level="2">
        <bodyTitle>Complex Event Processing</bodyTitle>
        <p>Complex event processing requires to answer queries on streams of
complex events, i.e., nested words or equivalently linearizations of
data trees, but also to produce dynamically evolving
data structures as output.</p>
        <p>The topic of the PhD project of M. Sakho supervised by Niehren and
Boneva is to generalize algorithms for querying streams to
hyperstreams. These are collections of linked streams as
naturally produced as intermediate results of complex
events processing. Hyperstreams are incomplete descriptions
of relational structures, so they can queried similarly
to incomplete databases, for which the notion of a
certain query answer is most appropriate.</p>
        <p>In a paper published at
<b>RP</b> <ref xlink:href="#links-2018-bid4" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, they studied certain query
answering for hyperstreams with simple events. Such hyperstreams
can be identified with compressed string patterns. They proved that
the certain query answering for regular queries on compressed
string patterns is PSPACE-complete, independently of whether
the finite automata defining the regular queries are assumed
deterministic or not, and independently of whether compression
is permitted or not. They also showed that the problem is in
PTIME when restricted to <i>linear</i> string patterns
(possibly with compression) and to
deterministic finite automata.</p>
        <p>In a paper published at <b>LATA</b> <ref xlink:href="#links-2018-bid5" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, the
studied certain query answering on hyperstreams of complex events.
Such hyperstreams can be modeled by compressed tree pattern with
context variables. They showed that certain query answering for
regular queries on compressed tree pattern with context variables
is <tt>EXP</tt>-complete, independently of whether
the tree automata defining the regular queries are assumed
deterministic or not, and independently of whether compression
is permitted or not. They also showed that the problem is in
PTIME when restricted to <i>linear</i> tree patterns
(possibly with compression) and to
deterministic tree automata.</p>
      </subsection>
      <subsection id="uid41" level="2">
        <bodyTitle>Transformations</bodyTitle>
        <p>In his PhD project – belonging to the ANR Colis– Gallot with his
supervisors Salvati and Lemay presented higher order tree transducers
which extend macro tree transducers. Moreover they obtained
nice properties such as the closure of the transducers under
composition. Algorithms to compute such compositions are proposed.
Those algorithms perform partial evaluation and are guided
by semantic interpretations over finite domains.</p>
        <p>Another virtue of higher-order transducers is that their <i>linear</i>
syntactic restriction make them equivalent to logically
defined MSO transductions.
One of the composition algorithm proposed preserves the linearity.
Furthermore, we have also showed that we can decrease the order of
linear transducer (i.e. the complexity of the functions it handles) when this
one is larger than 4.</p>
        <p>These results are unpublished paper for now.</p>
      </subsection>
    </subsection>
    <subsection id="uid42" level="1">
      <bodyTitle>Foundations of AI</bodyTitle>
      <p>Various problems of databases and knowledge bases are closely related
to foundational problems in artificial intelligence, since they are
rooted in logic or graph theory.</p>
      <subsection id="uid43" level="2">
        <bodyTitle>Knowledge Compilation</bodyTitle>
        <p>Many problems in Artificial Intelligence boil down to the exploration of the
solution set (called the models) of logical formulas. Such an exploration can be
finding one model of the formula, counting the number of models or enumerating
them all. However, even for simple quantifier-free formulas, those explorations
are known be untractable (<tt>NP</tt>-hard).</p>
        <p><i>Knowledge compilation</i> encompasses methods that aim to change the
representation of the set of models in order to get tractable algorithms for
(some of) those tasks. A big computational cost is paid during the compilation
time but then replying to queries become tractable on the new representation.
More generally, the core of Knowledge compilation is the study of the trade-off
between the size of the representation and the easiness of queries. This subject
is of interest for both Artificial Intelligence and Database communities.</p>
        <p>At <b>STACS</b> <ref xlink:href="#links-2018-bid1" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, Capelli, in cooperation with Mengel
from CRIL (Lens), studied knowledge compilation techiques for quantified Boolean
formulas. Deciding the existence of models for such formulas is known to climb
arbitrarly high the polynomial time hierarchy. The authors provide an efficient
compilation procedure for formulas having a <i>bounded tree-width</i>
generalizing results from SAT solving.</p>
      </subsection>
      <subsection id="uid44" level="2">
        <bodyTitle>Aggregation and Enumeration for Graphs</bodyTitle>
        <p>Aggregation and enumeration are not relevant for answer sets of database queries
but equally for any kinds of sets, most typically defined by
combinatoric problems on graphs.</p>
        <p>In a paper published at <b>ICALP</b> <ref xlink:href="#links-2018-bid2" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>,
Paperman proposed (in cooperation with Amarilli from
Telecom Paristech) to study the problem of finding so called <i>topological sort</i>
satisfying constraints provided by regular expressions.
Searching topological sort happens typically in situations
where an order is <i>uncertain</i>. For instance, in relational
database where users provides a partial preference order, or in
concurrent and distributed programming where some tasks
can be executed in an arbitrary order.
A classical task in <i>preferential query answering</i> is to find a
topological sort satisfying some
global constrained. Typically, to find a total order satisfying all (or most) of the customers.
The paper provides and proves sufficient conditions on the <i>shape
of the constraints</i> to
make the problem tractable (P-time) as well as sufficient condition to make the problem <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>𝙽𝙿</mi></math></formula>-hard.
They also prove a complete dichotomy for an adapted and well chosen version of the constrained topological
sort problem.</p>
        <p>In an article in <b>JCSS</b> <ref xlink:href="#links-2018-bid6" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>,
Capelli (with Bergougnoux and Kanté from Bordeaux and Clérmont-Ferrand) propose
an algorithm for counting the number of <i>transversal</i> in some
<i>hypergraphs</i>. Here, a hypergraph is a collection
of sets – called <i>hyperedges</i> over a <i>ground set</i> and a traversal is a subset
intersecting all hyperedges.
In full generality, counting the number of minimal traversals in a hypergraph
is a hard problem: it is known to be <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mo>#</mo><mi>P</mi></mrow></math></formula>-complete.
They proved that under the assumptions of <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>β</mi></math></formula>-acyclicity, it is possible to
count all the minimal traversals can be done in polynomial times.</p>
      </subsection>
    </subsection>
  </resultats>
  <contrats id="uid45">
    <bodyTitle>Bilateral Contracts and Grants with Industry</bodyTitle>
    <subsection id="uid46" level="1">
      <bodyTitle>Bilateral Grants with Industry</bodyTitle>
      <descriptionlist>
        <label><b>Posos</b>.</label>
        <li id="uid47">
          <p noindent="true">A. Lemay is directing an internship of a master student (<i>projet de fin
d'étude</i>) in cooperation with the POSOS company from Amiens. The goal of this
collaboration is to work on efficient schema for a large pharmaceutical Knowledge Base.</p>
        </li>
        <label><b>Strapdata</b>.</label>
        <li id="uid48">
          <p noindent="true">C. Paperman is actively collaborating with the Strapdata
company on efficient distributed graph database using an Apache novel
technology to query distributed graph <i>Gremlin</i> that could benefit
of the main product of Strapdata: Elassandra as a <i>database backend</i>.</p>
        </li>
      </descriptionlist>
    </subsection>
  </contrats>
  <partenariat id="uid49">
    <bodyTitle>Partnerships and Cooperations</bodyTitle>
    <subsection id="uid50" level="1">
      <bodyTitle>Regional Initiatives</bodyTitle>
      <simplelist>
        <li id="uid51">
          <p noindent="true">Links is member of the CPER Data (2016-19).</p>
        </li>
        <li id="uid52">
          <p noindent="true">Lozano's PhD project (2016-19) is co-funded by the Region Nord-Pas de
Calais.</p>
        </li>
        <li id="uid53">
          <p noindent="true">Sakho's PhD project is co-funded by the Region Nord-Pas de
Calais.</p>
        </li>
        <li id="uid54">
          <p noindent="true">Gillot's PhD project (2017-20) is co-funded by the Region Nord-Pas de
Calais.</p>
        </li>
        <li id="uid55">
          <p noindent="true">Crosetti's PhD project (2018-21) is co-funded by the Region
Haut de France. This is joined work with J. Ramon from the Inria project Magnet.</p>
        </li>
      </simplelist>
    </subsection>
    <subsection id="uid56" level="1">
      <bodyTitle>National Initiatives</bodyTitle>
      <sanspuceslist>
        <li id="uid57">
          <p noindent="true"><b>ANR Aggreg</b> (2014-19): Aggregated Queries.</p>
          <descriptionlist>
            <li id="uid58">
              <p noindent="true">Participants: J. Niehren [correspondent], P. Bourhis, A. Lemay, A. Boiret, F. Capelli.</p>
            </li>
            <li id="uid59">
              <p noindent="true">The coordinator is J. Niehren and the partners are the University Paris 7 (A. Durand) including members of the Inria
project DAHU (L. Ségoufin), the University of Marseille (N. Creignou)
and University of Caen (E. Grandjean).</p>
            </li>
            <li id="uid60">
              <p noindent="true">Objective: the main goal of the Aggreg project is to develop efficient
algorithms and to study the complexity of answering aggregate queries
for databases and data streams of various kinds.</p>
            </li>
          </descriptionlist>
        </li>
        <li id="uid61">
          <p noindent="true"><b>ANR Colis</b> (2015-20): Correctness of Linux Scripts.</p>
          <descriptionlist>
            <li id="uid62">
              <p noindent="true">Participants: J. Niehren [correspondent], A. Lemay, S. Tison,
A. Boiret, V. Hugot, N. Bacquey, P. Gallot, S. Salvati.</p>
            </li>
            <li id="uid63">
              <p noindent="true">The coordinator is R. Treinen from the University of Paris 7 and the
other partner is the Tocata project of Inria Saclay (C. Marché).</p>
            </li>
            <li id="uid64">
              <p noindent="true">Objective: This project aims at verifying the correctness of
transformations on data trees defined by shell scripts for
Linux software installation. The data trees here are
the instance of the file system which are changed by
installation scripts.</p>
            </li>
          </descriptionlist>
        </li>
        <li id="uid65">
          <p noindent="true"><b>ANR DataCert</b> (2015-20):</p>
          <descriptionlist>
            <li id="uid66">
              <p noindent="true">Participants: I. Boneva [correspondent], S. Tison, J. Lozano.</p>
            </li>
            <li id="uid67">
              <p noindent="true">Partners: The coordinator is E. Contejean from the University of Paris Sud and
the other partner is the University of Lyon.</p>
            </li>
            <li id="uid68">
              <p noindent="true">Objective: the main goals of the Datacert project are to provide deep specification in Coq of algorithms for data integration and exchange and of algorithms for enforcing security policies, as well as to design data integration methods for data models beyond the relational data model.</p>
            </li>
          </descriptionlist>
        </li>
        <li id="uid69">
          <p noindent="true"><b>ANR Headwork</b> (2016-21):</p>
          <descriptionlist>
            <li id="uid70">
              <p noindent="true">Participants:  J. Niehren,
M. Sakho, N. Crosetti, F. Capelli.</p>
            </li>
            <li id="uid71">
              <p noindent="true">Scientific partners: The coordinateur is D. Gross-Amblard from the Druid
Team (Rennes 1). Other partners include the Dahu team (Inria Saclay)
and Sumo (Inria Bretagne).</p>
            </li>
            <li id="uid72">
              <p noindent="true">Industrial partners: Spipoll, and Foulefactory.</p>
            </li>
            <li id="uid73">
              <p noindent="true">Objective:
The main object is to develop data-centric workflows for programming
crowd sourcing systems in flexible declarative manner. The problem of
crowd sourcing systems is to fill a database with knowledge gathered
by thousands or more human participants. A particular focus is to be
put on the aspects of data uncertainty and for the representation of
user expertise.</p>
            </li>
          </descriptionlist>
        </li>
        <li id="uid74">
          <p noindent="true"><b>ANR Delta</b> (2016-21):</p>
          <descriptionlist>
            <li id="uid75">
              <p noindent="true">Participants: J. Niehren, 
S. Salvati, A. Lemay, N. Bacquey, D. Gallois.</p>
            </li>
            <li id="uid76">
              <p noindent="true">Partners: The coordinator is M. Zeitoun from LaBRI, other partners are LIF (Marseille) and IRIF (Paris-Diderot).</p>
            </li>
            <li id="uid77">
              <p noindent="true">Objective: Delta is focused on the study of logic, transducers
and automata. In particular, it aims at extending classical
framework to handle input/output, quantities and data.</p>
            </li>
          </descriptionlist>
        </li>
        <li id="uid78">
          <p noindent="true"><b>ANR Bravas</b> (2017-22):</p>
          <descriptionlist>
            <li id="uid79">
              <p noindent="true">Participants: S. Salvati [correspondent]</p>
            </li>
            <li id="uid80">
              <p noindent="true">Scientific Partners: The coordinator is Jérôme Leroux from LaBRI, University of Bordeaux. The other partner is LSV, ENS Cachan.</p>
            </li>
            <li id="uid81">
              <p noindent="true">Objective: The goal of the BraVAS project is to develop a new
and powerful approach to decide the reachability problems for Vector
Addition Systems (VAS) extensions and to analyze their
complexity. The ambition here is to crack with a single hammer
(ideals over well-orders) several long-lasting open problems that
have all been identified as a barrier in different areas, but that
are in fact closely related when seen as reachability.</p>
            </li>
          </descriptionlist>
        </li>
      </sanspuceslist>
    </subsection>
    <subsection id="uid82" level="1">
      <bodyTitle>European Initiatives</bodyTitle>
      <descriptionlist>
        <label><b>Oxford</b>:</label>
        <li id="uid83">
          <p noindent="true">A exchange project with the computer science lab of the University of Oxford is funded by the University of
Lille via the Cristal Lab. Links' member produced many common publications over the years with Oxford. Links' contact is Paperman.</p>
        </li>
        <label><b>Wrazlaw</b>:</label>
        <li id="uid84">
          <p noindent="true">Staworko has regular exchange with the University of Wrazlaw.
This has led to a publication at <b>PODS</b> <ref xlink:href="#links-2018-bid0" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> together with
P. Wieczorek.</p>
        </li>
        <label><b>Saint Petersburg</b>:</label>
        <li id="uid85">
          <p noindent="true">Salvati and Niehren started a cooperation with the University of
Saint Petersburg, via a 3 months visit of R. Azimov in 2018.</p>
        </li>
        <label><b>Oviedo</b>:</label>
        <li id="uid86">
          <p noindent="true">Boneva started a cooperation with the University of Oviedo,
via a 3 months visit of H. Garcia Gonzalez in 2018.</p>
        </li>
      </descriptionlist>
    </subsection>
    <subsection id="uid87" level="1">
      <bodyTitle>International Initiatives</bodyTitle>
      <subsection id="uid88" level="2">
        <bodyTitle>Informal International Partners</bodyTitle>
        <descriptionlist>
          <label><b>Santiago de Chile</b>:</label>
          <li id="uid89">
            <p noindent="true">S. Staworko started a collaboration with C. Riveros from the Pontificia Universidad
Catolica de Chile in 2018.</p>
          </li>
        </descriptionlist>
      </subsection>
    </subsection>
    <subsection id="uid90" level="1">
      <bodyTitle>International Research Visitors</bodyTitle>
      <subsection id="uid91" level="2">
        <bodyTitle>Visits of International Scientists</bodyTitle>
        <p>Several researchers has visited us:</p>
        <simplelist>
          <li id="uid92">
            <p noindent="true">Filip Mazowiecki, a researcher from Warsaw University and currently in
post-doctorate in Bordeaux to work with Charles Paperman.</p>
          </li>
          <li id="uid93">
            <p noindent="true">Rustam Azimov, a Russian PhD students from Saint Petersburg State University, to collaborate with
Sylvain Salvati and Joachim Niehren.</p>
          </li>
          <li id="uid94">
            <p noindent="true">Michaël Cadilhac, a researcher from Oxford University to work with Charles
Paperman.</p>
          </li>
          <li id="uid95">
            <p noindent="true">Cristian Riveros, an Assistant Professor at the Department of Computer
Science at the Pontificia Universidad Catolica de Chile.</p>
          </li>
          <li id="uid96">
            <p noindent="true">Henning Fernau, Professor at Universität Trier and Andreas Maletti,
Professor at Universität Leipzig, visited us during the HDR defense of
Aurelien Lemay.</p>
          </li>
        </simplelist>
        <subsection id="uid97" level="3">
          <bodyTitle>Internships</bodyTitle>
          <simplelist>
            <li id="uid98">
              <p noindent="true">Nicolas Crosetti started an internship supervised by Florent Capelli,
Joachim Niehren and Jan Ramon. His internship has evolved into the
preparation of a PhD thesis.</p>
            </li>
            <li id="uid99">
              <p noindent="true">Chen Huan, from Centrale Lille, has done an internship under the
supervision of Sylvain Salvati and Joachim Niehren.</p>
            </li>
          </simplelist>
        </subsection>
      </subsection>
      <subsection id="uid100" level="2">
        <bodyTitle>Visits to International Teams</bodyTitle>
        <simplelist>
          <li id="uid101">
            <p noindent="true">Charles Paperman visited Michaël Cadilhac form the verification team
of the University of Oxford.</p>
          </li>
          <li id="uid102">
            <p noindent="true">Joachim Niehren got invited by Hilal Zaid for a visit at the American University of Palestine in
August 2018.</p>
          </li>
        </simplelist>
      </subsection>
    </subsection>
  </partenariat>
  <diffusion id="uid103">
    <bodyTitle>Dissemination</bodyTitle>
    <subsection id="uid104" level="1">
      <bodyTitle>Promoting Scientific Activities</bodyTitle>
      <subsection id="uid105" level="2">
        <bodyTitle>Scientific Events Organisation</bodyTitle>
        <simplelist>
          <li id="uid106">
            <p noindent="true">F. Capelli: workshop organisation of <i>Graph and Constraints</i> (27/08) within
the conference Constraint Programming (CP) 2018, Lille.</p>
          </li>
          <li id="uid107">
            <p noindent="true">F. Capelli: organisation of annual meeting of GT ALGA (Groupe de Travail Automata, Logic, Games, Algebra of CNRS)
the 15th and 16th of October at Lille.</p>
          </li>
        </simplelist>
      </subsection>
      <subsection id="uid108" level="2">
        <bodyTitle>Scientific Events Selection</bodyTitle>
        <subsection id="uid109" level="3">
          <bodyTitle>Chair of Conference Program Committees</bodyTitle>
          <simplelist>
            <li id="uid110">
              <p noindent="true">J. Niehren was is was chair of the Program Committee of WPTE
2018.</p>
            </li>
            <li id="uid111">
              <p noindent="true">J. Niehren was is was co-chair of the Program Committee of WPTE
2019.</p>
            </li>
          </simplelist>
        </subsection>
        <subsection id="uid112" level="3">
          <bodyTitle>Member of the Conference Program Committees</bodyTitle>
          <simplelist>
            <li id="uid113">
              <p noindent="true">F. Capelli: member of Program Committee of International Joint Conference on Artificial
Intelligence (IJCAI) 2018.</p>
            </li>
            <li id="uid114">
              <p noindent="true">F. Capelli: member of Program Committee of workshop Quantified Boolean Formulas (QBF)
within FLoC conference (Federated Logic Conference).</p>
            </li>
            <li id="uid115">
              <p noindent="true">F. Capelli: member of Program Committee of workshop Graph and
Constraints, 2018.</p>
            </li>
            <li id="uid116">
              <p noindent="true">S. Tison: member of Program Committee of RAIRO ITA, 2018.</p>
            </li>
            <li id="uid117">
              <p noindent="true">J. Niehren: member of the Program Committee of LATA 2019.</p>
            </li>
          </simplelist>
        </subsection>
      </subsection>
      <subsection id="uid118" level="2">
        <bodyTitle>Journal</bodyTitle>
        <subsection id="uid119" level="3">
          <bodyTitle>Member of the Editorial Boards</bodyTitle>
          <sanspuceslist>
            <li id="uid120">
              <p noindent="true">J. Niehren is editor of Fundamenta Informaticæ.</p>
            </li>
            <li id="uid121">
              <p noindent="true">S. Salvati is managing editor of JoLLI (Journal for Logic, Language and Information).</p>
            </li>
            <li id="uid122">
              <p noindent="true">S. Tison is in the editorial committee of RAIRO-ITA (Theoretical Informatics and Applications).</p>
            </li>
          </sanspuceslist>
        </subsection>
      </subsection>
      <subsection id="uid123" level="2">
        <bodyTitle>Invited Talks</bodyTitle>
        <simplelist>
          <li id="uid124">
            <p noindent="true">B. Guillon gave invited talks at Mid-term Meeting of ANR Delta in
Bordeaux in December 2018.</p>
          </li>
          <li id="uid125">
            <p noindent="true">A. Lemay gave invited talks at Mid-term Meeting of ANR Delta in
Bordeaux in December 2018.</p>
          </li>
          <li id="uid126">
            <p noindent="true">Joachim Niehren gave an invited talk at the American University
of Palestine in August 2018.</p>
          </li>
          <li id="uid127">
            <p noindent="true">F. Capelli get invited to talk at seminars of CRIL at Lens, LACL in Créteil and VALDA in Paris.</p>
          </li>
        </simplelist>
      </subsection>
      <subsection id="uid128" level="2">
        <bodyTitle>Scientific Expertise</bodyTitle>
        <simplelist>
          <li id="uid129">
            <p noindent="true">S. Tison: member of coordinator of i-SIte ULNE, about innovation and relationship with social economical world.</p>
          </li>
          <li id="uid130">
            <p noindent="true">S. Tison: Head of CITC-Eurarfid.</p>
          </li>
          <li id="uid131">
            <p noindent="true">J. Niehren is member of the board of the committee of project-teams of
Inria Lille.</p>
          </li>
        </simplelist>
      </subsection>
      <subsection id="uid132" level="2">
        <bodyTitle>Research Administration</bodyTitle>
        <simplelist>
          <li id="uid133">
            <p noindent="true">F. Capelli: Co-organizer of <i>Groupe de Travail</i> of CNRS IMIA (Informatique Mathématique
Intelligence Artificielle)</p>
          </li>
        </simplelist>
      </subsection>
    </subsection>
    <subsection id="uid134" level="1">
      <bodyTitle>Teaching - Supervision - Juries</bodyTitle>
      <subsection id="uid135" level="2">
        <bodyTitle>Teaching</bodyTitle>
        <sanspuceslist>
          <li id="uid136">
            <p noindent="true">I. Boneva gives a Master 1 semester on Algorithms for databases.</p>
          </li>
          <li id="uid137">
            <p noindent="true">C. Paperman is pedagogical responsible for Master MIASHS “parcours” WebAnalyste.</p>
          </li>
          <li id="uid138">
            <p noindent="true">A. Lemay is pedagogical responsible for Computer Science and Numeric correspondent for UFR LEA.</p>
          </li>
          <li id="uid139">
            <p noindent="true">J. Niehren was teaching the course “Foundations of Databases” as part of the masters 2 Mocad on Information Extraction at the University of Lille.</p>
          </li>
          <li id="uid140">
            <p noindent="true">S. Salvati is pedagogical responsible of Master Miage FA, Lille.</p>
          </li>
          <li id="uid141">
            <p noindent="true">S. Salvati organized the research label for Computer Science Bachelor, Lille.</p>
          </li>
          <li id="uid142">
            <p noindent="true">S. Tison is pedagogical responsible of first year ACT Master, Lille.</p>
          </li>
        </sanspuceslist>
      </subsection>
      <subsection id="uid143" level="2">
        <bodyTitle>Supervision</bodyTitle>
        <sanspuceslist>
          <li id="uid144">
            <p noindent="true">HdR : Aurélien Lemay, <i>Machine Learning Techniques for Semistructured Data</i>, Université de Lille, Fri 16th Nov.</p>
          </li>
          <li id="uid145">
            <p noindent="true">PhD in progress: N. Crosetti. Privacy Risks of Aggregates in Data Centric-Workflows. Supervised by Capelli, Niehren, Ramon (Team MAGNET) and Tison.</p>
          </li>
          <li id="uid146">
            <p noindent="true">PhD in progress: D. Gallois. Since 2015. Recursive Queries. Supervised by Bourhis and Tison.</p>
          </li>
          <li id="uid147">
            <p noindent="true">PhD in progress: M. Sakho. Hyperstreaming Query answering on graphs. Since 2016. Supervised by Niehren and Boneva.</p>
          </li>
          <li id="uid148">
            <p noindent="true">PhD in progress: J.M. Lozano. On data integration for mixed database formats. Supervised by Boneva and Staworko.</p>
          </li>
          <li id="uid149">
            <p noindent="true">PhD in progress: P. Gallot. On safety of data transformations. Started on October 2017. Supervised by Lemay and Salvati.</p>
          </li>
        </sanspuceslist>
      </subsection>
      <subsection id="uid150" level="2">
        <bodyTitle>Juries</bodyTitle>
        <sanspuceslist>
          <li id="uid151">
            <p noindent="true">S. Tison: Vice-Présidente du jury Agrégation de Mathématiques (co-pillote option D- Informatique).</p>
          </li>
          <li id="uid152">
            <p noindent="true">S. Tison: Jury de Thèse Lucien Mousin.</p>
          </li>
          <li id="uid153">
            <p noindent="true">S. Tison: PhD Committee of Narjes Jomaa.</p>
          </li>
          <li id="uid154">
            <p noindent="true">F. Capelli: PhD Committee of Mikaël Monet.</p>
          </li>
          <li id="uid155">
            <p noindent="true">J. Niehren: Habilitation Committee of Aurélien Lemay.</p>
          </li>
        </sanspuceslist>
      </subsection>
    </subsection>
    <subsection id="uid156" level="1">
      <bodyTitle>Popularization</bodyTitle>
      <subsection id="uid157" level="2">
        <bodyTitle>Internal action</bodyTitle>
        <descriptionlist>
          <label>
            <b>General Assembly of Inria Lille</b>
          </label>
          <li id="uid158">
            <p noindent="true">Niehren presented Links work on data and knowledge bases on the
Dynamic Semantic Crosswords demonstration during a general
assembly of Inria Lille in July 2018.</p>
          </li>
        </descriptionlist>
      </subsection>
      <subsection id="uid159" level="2">
        <bodyTitle>Creation of media or tools for science outreach</bodyTitle>
        <descriptionlist>
          <label>
            <b>Dynamic Semantic Crosswords</b>
          </label>
          <li id="uid160">
            <p noindent="true">Bacquey's demonstration system on dynamic semantic crosswords is
presented in the new showroom of Inria Lille in the new building Place.
The demo generates dynamically crosswords while streaming Twitter
feeds, depending on a semantic topic specified by the user. The
specification can be given by a list of hashtags, and in the future
by a XPath 3.0 query, that can be executed on streams by using
Links QuiXPath tool. This illustrates the work on complex
event processing by Niehren and his students during the
last years.</p>
          </li>
        </descriptionlist>
      </subsection>
    </subsection>
  </diffusion>
  <biblio id="bibliography" html="bibliography" numero="10" titre="Bibliography">
    
    <biblStruct id="links-2018-bid9" type="hdrthesis" rend="year" n="cite:lemay:tel-01929944">
      <identifiant type="hal" value="tel-01929944"/>
      <monogr>
        <title level="m">Machine Learning Techniques for Semistructured Data</title>
        <author>
          <persName key="links-2018-idp166944">
            <foreName>Aurélien</foreName>
            <surname>Lemay</surname>
            <initial>A.</initial>
          </persName>
        </author>
        <imprint>
          <publisher>
            <orgName type="school">Université de Lille</orgName>
          </publisher>
          <dateStruct>
            <month>November</month>
            <year>2018</year>
          </dateStruct>
          <ref xlink:href="https://tel.archives-ouvertes.fr/tel-01929944" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>tel.<allowbreak/>archives-ouvertes.<allowbreak/>fr/<allowbreak/>tel-01929944</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Habilitation à diriger des recherches</note>
    </biblStruct>
    
    <biblStruct id="links-2018-bid6" type="article" rend="year" n="cite:bergougnoux:hal-01923090">
      <identifiant type="doi" value="10.1016/j.jcss.2018.10.002"/>
      <identifiant type="hal" value="hal-01923090"/>
      <analytic>
        <title level="a">Counting Minimal Transversals of β-Acyclic Hypergraphs</title>
        <author>
          <persName>
            <foreName>Benjamin</foreName>
            <surname>Bergougnoux</surname>
            <initial>B.</initial>
          </persName>
          <persName key="links-2018-idp164416">
            <foreName>Florent</foreName>
            <surname>Capelli</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Mamadou Moustapha</foreName>
            <surname>Kanté</surname>
            <initial>M. M.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-editorial-board="yes" x-international-audience="yes" id="rid01107">
        <idno type="issn">0022-0000</idno>
        <title level="j">Journal of Computer and System Sciences</title>
        <imprint>
          <dateStruct>
            <month>November</month>
            <year>2018</year>
          </dateStruct>
          <ref xlink:href="https://hal.inria.fr/hal-01923090" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-01923090</ref>
        </imprint>
      </monogr>
      <note type="bnote">
        <ref xlink:href="https://arxiv.org/abs/1808.05017" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>arxiv.<allowbreak/>org/<allowbreak/>abs/<allowbreak/>1808.<allowbreak/>05017</ref>
      </note>
    </biblStruct>
    
    <biblStruct id="links-2018-bid14" type="article" rend="year" n="cite:boiret:hal-01176763">
      <identifiant type="hal" value="hal-01176763"/>
      <analytic>
        <title level="a">Logics for Unordered Trees with Data Constraints</title>
        <author>
          <persName>
            <foreName>Adrien</foreName>
            <surname>Boiret</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>Vincent</foreName>
            <surname>Hugot</surname>
            <initial>V.</initial>
          </persName>
          <persName key="links-2018-idp158976">
            <foreName>Joachim</foreName>
            <surname>Niehren</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Ralf</foreName>
            <surname>Treinen</surname>
            <initial>R.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-editorial-board="yes" x-international-audience="yes" id="rid01107">
        <idno type="issn">0022-0000</idno>
        <title level="j">Journal of Computer and System Sciences</title>
        <imprint>
          <dateStruct>
            <month>December</month>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">40</biblScope>
          <ref xlink:href="https://hal.inria.fr/hal-01176763" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-01176763</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="links-2018-bid12" type="article" rend="year" n="cite:capelli:hal-01923091">
      <identifiant type="doi" value="10.1016/j.dam.2018.06.038"/>
      <identifiant type="hal" value="hal-01923091"/>
      <analytic>
        <title level="a">Incremental delay enumeration: Space and time</title>
        <author>
          <persName key="links-2018-idp164416">
            <foreName>Florent</foreName>
            <surname>Capelli</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Yann</foreName>
            <surname>Strozecki</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-editorial-board="yes" x-international-audience="yes" id="rid00466">
        <idno type="issn">0166-218X</idno>
        <title level="j">Discrete Applied Mathematics</title>
        <imprint>
          <dateStruct>
            <month>August</month>
            <year>2018</year>
          </dateStruct>
          <ref xlink:href="https://hal.inria.fr/hal-01923091" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-01923091</ref>
        </imprint>
      </monogr>
      <note type="bnote">
        <ref xlink:href="https://arxiv.org/abs/1703.01928" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>arxiv.<allowbreak/>org/<allowbreak/>abs/<allowbreak/>1703.<allowbreak/>01928</ref>
      </note>
    </biblStruct>
    
    <biblStruct id="links-2018-bid15" type="article" rend="year" n="cite:daviaud:hal-01943493">
      <identifiant type="hal" value="hal-01943493"/>
      <analytic>
        <title level="a">Classes of languages generated by the Kleene star of a word</title>
        <author>
          <persName>
            <foreName>Laure</foreName>
            <surname>Daviaud</surname>
            <initial>L.</initial>
          </persName>
          <persName key="links-2018-idp169856">
            <foreName>Charles</foreName>
            <surname>Paperman</surname>
            <initial>C.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-editorial-board="yes" x-international-audience="yes" id="rid00819">
        <idno type="issn">0890-5401</idno>
        <title level="j">Information and Computation</title>
        <imprint>
          <biblScope type="volume">262</biblScope>
          <biblScope type="number">Part 1</biblScope>
          <dateStruct>
            <month>October</month>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">90-109</biblScope>
          <ref xlink:href="https://hal.archives-ouvertes.fr/hal-01943493" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>archives-ouvertes.<allowbreak/>fr/<allowbreak/>hal-01943493</ref>
        </imprint>
      </monogr>
    </biblStruct>
    
    <biblStruct id="links-2018-bid2" type="inproceedings" rend="year" n="cite:amarilli:hal-01950909">
      <identifiant type="hal" value="hal-01950909"/>
      <analytic>
        <title level="a">Topological Sorting with Regular Constraints</title>
        <author>
          <persName>
            <foreName>Antoine</foreName>
            <surname>Amarilli</surname>
            <initial>A.</initial>
          </persName>
          <persName key="links-2018-idp169856">
            <foreName>Charles</foreName>
            <surname>Paperman</surname>
            <initial>C.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-international-audience="yes" x-proceedings="no" x-invited-conference="no" x-editorial-board="yes">
        <title level="m">ICALP 2018 - 45th International Colloquium on Automata, Languages, and Programming</title>
        <loc>Prague, Czech Republic</loc>
        <imprint>
          <dateStruct>
            <month>July</month>
            <year>2018</year>
          </dateStruct>
          <ref xlink:href="https://hal.archives-ouvertes.fr/hal-01950909" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>archives-ouvertes.<allowbreak/>fr/<allowbreak/>hal-01950909</ref>
        </imprint>
        <meeting id="cid106057">
          <title>International Colloquium on Automata, Languages and Programming</title>
          <num>45</num>
          <abbr type="sigle">ICALP</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="links-2018-bid3" type="inproceedings" rend="year" n="cite:boneva:hal-01775199">
      <identifiant type="hal" value="hal-01775199"/>
      <analytic>
        <title level="a">Relational to RDF Data Exchange in Presence of a Shape Expression Schema</title>
        <author>
          <persName key="links-2018-idp161888">
            <foreName>Iovka</foreName>
            <surname>Boneva</surname>
            <initial>I.</initial>
          </persName>
          <persName key="links-2018-idp193344">
            <foreName>Jose</foreName>
            <surname>Lozano</surname>
            <initial>J.</initial>
          </persName>
          <persName key="links-2018-idp175280">
            <foreName>Sławek</foreName>
            <surname>Staworko</surname>
            <initial>S.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-international-audience="yes" x-proceedings="no" x-invited-conference="no" x-editorial-board="yes">
        <title level="m">AMW 2018 - 12th Alberto Mendelzon International Workshop on Foundations of Data Management</title>
        <loc>Cali, Colombia</loc>
        <imprint>
          <dateStruct>
            <month>May</month>
            <year>2018</year>
          </dateStruct>
          <biblScope type="pages">1-16</biblScope>
          <ref xlink:href="https://hal.archives-ouvertes.fr/hal-01775199" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>archives-ouvertes.<allowbreak/>fr/<allowbreak/>hal-01775199</ref>
        </imprint>
        <meeting id="cid625778">
          <title>Alberto Mendelzon International Workshop on Foundations of Data Management</title>
          <num>12</num>
          <abbr type="sigle">AMW</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="links-2018-bid8" type="inproceedings" rend="year" n="cite:boneva:hal-01609498">
      <identifiant type="hal" value="hal-01609498"/>
      <analytic>
        <title level="a">Certain Query Answering on Compressed String Patterns: From Streams to Hyperstreams</title>
        <author>
          <persName key="links-2018-idp161888">
            <foreName>Iovka</foreName>
            <surname>Boneva</surname>
            <initial>I.</initial>
          </persName>
          <persName key="links-2018-idp158976">
            <foreName>Joachim</foreName>
            <surname>Niehren</surname>
            <initial>J.</initial>
          </persName>
          <persName key="links-2018-idp195808">
            <foreName>Momar</foreName>
            <surname>Sakho</surname>
            <initial>M.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-international-audience="yes" x-proceedings="no" x-invited-conference="no" x-editorial-board="yes">
        <title level="m">RP 2018 - 12th International Conference on Reachability Problems</title>
        <loc>Marseille, France</loc>
        <imprint>
          <dateStruct>
            <month>September</month>
            <year>2018</year>
          </dateStruct>
          <ref xlink:href="https://hal.archives-ouvertes.fr/hal-01609498" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>archives-ouvertes.<allowbreak/>fr/<allowbreak/>hal-01609498</ref>
        </imprint>
        <meeting id="cid383134">
          <title>Workshop on Reachability Problems</title>
          <num>12</num>
          <abbr type="sigle">RP</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="links-2018-bid5" type="inproceedings" rend="year" n="cite:sakho:hal-01926011">
      <identifiant type="hal" value="hal-01926011"/>
      <analytic>
        <title level="a">Regular Matching and Inclusion on Compressed Tree Patterns with Context Variables</title>
        <author>
          <persName key="links-2018-idp195808">
            <foreName>Momar</foreName>
            <surname>Sakho</surname>
            <initial>M.</initial>
          </persName>
          <persName key="links-2018-idp161888">
            <foreName>Iovka</foreName>
            <surname>Boneva</surname>
            <initial>I.</initial>
          </persName>
          <persName key="links-2018-idp158976">
            <foreName>Joachim</foreName>
            <surname>Niehren</surname>
            <initial>J.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-international-audience="yes" x-proceedings="yes" x-invited-conference="no" x-editorial-board="yes">
        <title level="m">13th International Conference on Language and Automata Theory and Applications (LATA)</title>
        <loc>Saint Petersburg, Russia</loc>
        <imprint>
          <publisher>
            <orgName>Springer</orgName>
          </publisher>
          <dateStruct>
            <month>March</month>
            <year>2019</year>
          </dateStruct>
          <ref xlink:href="https://hal.inria.fr/hal-01926011" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-01926011</ref>
        </imprint>
        <meeting id="cid289532">
          <title>International Conference on Language and Automata Theory and Applications</title>
          <num>13</num>
          <abbr type="sigle">LATA</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="links-2018-bid0" type="inproceedings" rend="year" n="cite:staworko:hal-01959143">
      <identifiant type="hal" value="hal-01959143"/>
      <analytic>
        <title level="a">Containment of Shape Expression Schemas for RDF</title>
        <author>
          <persName key="links-2018-idp175280">
            <foreName>Slawomir</foreName>
            <surname>Staworko</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Piotr</foreName>
            <surname>Wieczorek</surname>
            <initial>P.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-scientific-popularization="no" x-international-audience="yes" x-proceedings="yes" x-invited-conference="no" x-editorial-board="yes">
        <title level="m">SIGMOD-SIGACT-SIGAI Symposium on Principles of Database Systems (PODS)</title>
        <loc>Amsterdam, Netherlands</loc>
        <imprint>
          <dateStruct>
            <month>June</month>
            <year>2019</year>
          </dateStruct>
          <ref xlink:href="https://hal.inria.fr/hal-01959143" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-01959143</ref>
        </imprint>
        <meeting id="cid18524">
          <title>ACM Conference on Principle of Database Systems</title>
          <num>2019</num>
          <abbr type="sigle">PODS</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    
    <biblStruct id="links-2018-bid10" type="techreport" rend="year" n="cite:salvati:hal-01771670">
      <identifiant type="hal" value="hal-01771670"/>
      <monogr>
        <title level="m">On is an n-MCFL</title>
        <author>
          <persName key="links-2018-idp172384">
            <foreName>Sylvain</foreName>
            <surname>Salvati</surname>
            <initial>S.</initial>
          </persName>
        </author>
        <imprint>
          <publisher>
            <orgName type="institution">Université de Lille, Inria, CRIStAL CNRS</orgName>
          </publisher>
          <dateStruct>
            <month>April</month>
            <year>2018</year>
          </dateStruct>
          <ref xlink:href="https://hal.archives-ouvertes.fr/hal-01771670" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>archives-ouvertes.<allowbreak/>fr/<allowbreak/>hal-01771670</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    
    <biblStruct id="links-2018-bid11" type="misc" rend="year" n="cite:boneva:hal-01811835">
      <identifiant type="hal" value="hal-01811835"/>
      <monogr x-scientific-popularization="no">
        <title level="m">Approximating Certain Query Answering on Hyperstreams</title>
        <author>
          <persName key="links-2018-idp161888">
            <foreName>Iovka</foreName>
            <surname>Boneva</surname>
            <initial>I.</initial>
          </persName>
          <persName key="links-2018-idp158976">
            <foreName>Joachim</foreName>
            <surname>Niehren</surname>
            <initial>J.</initial>
          </persName>
          <persName key="links-2018-idp195808">
            <foreName>Momar</foreName>
            <surname>Sakho</surname>
            <initial>M.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <month>June</month>
            <year>2018</year>
          </dateStruct>
          <ref xlink:href="https://hal.inria.fr/hal-01811835" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-01811835</ref>
        </imprint>
      </monogr>
      <note type="bnote">Technical report</note>
    </biblStruct>
    
    <biblStruct id="links-2018-bid4" type="unpublished" rend="year" n="cite:boneva:hal-01846016">
      <identifiant type="hal" value="hal-01846016"/>
      <monogr>
        <title level="m">Certain Query Answering on Compressed String Patterns: From Streams to Hyperstreams (long version)</title>
        <author>
          <persName key="links-2018-idp161888">
            <foreName>Iovka</foreName>
            <surname>Boneva</surname>
            <initial>I.</initial>
          </persName>
          <persName key="links-2018-idp158976">
            <foreName>Joachim</foreName>
            <surname>Niehren</surname>
            <initial>J.</initial>
          </persName>
          <persName key="links-2018-idp195808">
            <foreName>Momar</foreName>
            <surname>Sakho</surname>
            <initial>M.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <month>July</month>
            <year>2018</year>
          </dateStruct>
          <ref xlink:href="https://hal.inria.fr/hal-01846016" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-01846016</ref>
        </imprint>
      </monogr>
      <note type="bnote">working paper or preprint</note>
    </biblStruct>
    
    <biblStruct id="links-2018-bid13" type="unpublished" rend="year" n="cite:capelli:hal-01981553">
      <identifiant type="hal" value="hal-01981553"/>
      <monogr>
        <title level="m">Dependency Weighted Aggregation on Factorized Databases</title>
        <author>
          <persName key="links-2018-idp164416">
            <foreName>Florent</foreName>
            <surname>Capelli</surname>
            <initial>F.</initial>
          </persName>
          <persName key="links-2018-idp186016">
            <foreName>Nicolas</foreName>
            <surname>Crosetti</surname>
            <initial>N.</initial>
          </persName>
          <persName key="links-2018-idp158976">
            <foreName>Joachim</foreName>
            <surname>Niehren</surname>
            <initial>J.</initial>
          </persName>
          <persName key="magnet-2018-idp161824">
            <foreName>Jan</foreName>
            <surname>Ramon</surname>
            <initial>J.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <month>January</month>
            <year>2019</year>
          </dateStruct>
          <ref xlink:href="https://hal.archives-ouvertes.fr/hal-01981553" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>archives-ouvertes.<allowbreak/>fr/<allowbreak/>hal-01981553</ref>
        </imprint>
      </monogr>
      <note type="bnote"><ref xlink:href="https://arxiv.org/abs/1901.03633" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>arxiv.<allowbreak/>org/<allowbreak/>abs/<allowbreak/>1901.<allowbreak/>03633</ref> - working paper or preprint</note>
    </biblStruct>
    
    <biblStruct id="links-2018-bid1" type="unpublished" rend="year" n="cite:capelli:hal-01836402">
      <identifiant type="hal" value="hal-01836402"/>
      <monogr>
        <title level="m">Knowledge Compilation, Width and Quantification</title>
        <author>
          <persName key="links-2018-idp164416">
            <foreName>Florent</foreName>
            <surname>Capelli</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Stefan</foreName>
            <surname>Mengel</surname>
            <initial>S.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <month>July</month>
            <year>2018</year>
          </dateStruct>
          <ref xlink:href="https://hal.archives-ouvertes.fr/hal-01836402" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>archives-ouvertes.<allowbreak/>fr/<allowbreak/>hal-01836402</ref>
        </imprint>
      </monogr>
      <note type="bnote"><ref xlink:href="https://arxiv.org/abs/1807.04263" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>arxiv.<allowbreak/>org/<allowbreak/>abs/<allowbreak/>1807.<allowbreak/>04263</ref> - working paper or preprint</note>
    </biblStruct>
    
    <biblStruct id="links-2018-bid7" type="unpublished" rend="year" n="cite:capelli:hal-01891483">
      <identifiant type="hal" value="hal-01891483"/>
      <monogr>
        <title level="m">Enumerating models of DNF faster: breaking the dependency on the formula size</title>
        <author>
          <persName key="links-2018-idp164416">
            <foreName>Florent</foreName>
            <surname>Capelli</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Yann</foreName>
            <surname>Strozecki</surname>
            <initial>Y.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <month>October</month>
            <year>2018</year>
          </dateStruct>
          <ref xlink:href="https://hal.inria.fr/hal-01891483" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-01891483</ref>
        </imprint>
      </monogr>
      <note type="bnote">working paper or preprint</note>
    </biblStruct>
  </biblio>
</raweb>
