<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE raweb PUBLIC "-//INRIA//DTD " "raweb2.dtd">
<raweb xml:lang="en" year="2010">
  <identification id="alpage" isproject="true">
    <shortname>alpage</shortname>
    <projectName>Large-scale deep linguistic
    processing</projectName>
    <domaine-de-recherche>Perception, Cognition,
    Interaction</domaine-de-recherche>
    <theme-de-recherche>Audio, Speech, and Language
    Processing</theme-de-recherche>
    <UR name="Rocquencourt"/>
  </identification>
  <team id="uid1">
    <person key="alpage-2010-idm152476291760">
      <firstname>Marianna</firstname>
      <lastname>Apidianaki</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>PostDoc</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>funded by the System@tic project Scribo (May to
      December 2010)</moreinfo>
    </person>
    <person key="atoll-2006-idm57727932096">
      <firstname>François</firstname>
      <lastname>Barthélemy</lastname>
      <affiliation>AutreEtablissementPublic</affiliation>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>Associate Professor (MC) CNAM</moreinfo>
    </person>
    <person key="alpage-2008-idm542378786864">
      <firstname>André</firstname>
      <lastname>Bittar</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>PhD student Univ. Paris 7 (since 2007), now
      ATER at Université Paris-Est Marne-la-Vallée</moreinfo>
    </person>
    <person key="alpage-2009-idm402038353920">
      <firstname>Luc</firstname>
      <lastname>Boruta</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>PhD student (allocataire) (since October
      2009)</moreinfo>
    </person>
    <person key="atoll-2006-idm57727947600">
      <firstname>Pierre</firstname>
      <lastname>Boullier</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>Chercheur</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>Emeritus Senior Researcher (DR-E) Inria</moreinfo>
      <hdr>oui</hdr>
    </person>
    <person key="alpage-2008-idm542378777200">
      <firstname>Marie</firstname>
      <lastname>Candito</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>Associate Professor (MC) Univ.
      Paris 7</moreinfo>
    </person>
    <person key="alpage-2008-idm542378774048">
      <firstname>François-Régis</firstname>
      <lastname>Chaumartin</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>PhD student Univ. Paris 7</moreinfo>
    </person>
    <person key="alpage-2008-idm542378770960">
      <firstname>Benoît</firstname>
      <lastname>Crabbé</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>Associate Professor (MC) Univ.
      Paris 7</moreinfo>
    </person>
    <person key="alpage-2008-idm542378767840">
      <firstname>Laurence</firstname>
      <lastname>Danlos</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>Full Professor (PR) Univ. Paris 7, Member of
      IUF, Team leader</moreinfo>
      <hdr>oui</hdr>
    </person>
    <person key="alpage-2008-idm542378764240">
      <firstname>Pascal</firstname>
      <lastname>Denis</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>Chercheur</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>Junior Researcher (CR) Inria</moreinfo>
    </person>
    <person key="alpage-2010-idm152476259776">
      <firstname>Kata</firstname>
      <lastname>Gábor</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>PostDoc</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>funded by the System@tic project Scribo (May to
      December 2010)</moreinfo>
    </person>
    <person key="alpage-2008-idm542378755024">
      <firstname>Elżbieta</firstname>
      <lastname>Gryglicka</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>PhD student (CIFRE) Thales &amp; Univ.
      Paris 7</moreinfo>
    </person>
    <person key="alpage-2008-idm542378751904">
      <firstname>Christelle</firstname>
      <lastname>Guiziou</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>Assistant</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>Secretary (SAR) Inria</moreinfo>
    </person>
    <person key="alpage-2009-idm402038316144">
      <firstname>Enrique</firstname>
      <lastname>Henestroza Anguiano</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>PhD funded by the ANR project 
      <span class="smallcap" align="left">Sequoia</span> (since
      November 2009)</moreinfo>
    </person>
    <person key="alpage-2008-idm542378745744">
      <firstname>Sylvain</firstname>
      <lastname>Kahane</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>Full Professor (PR) Univ. Paris X, Associate
      member</moreinfo>
      <hdr>oui</hdr>
    </person>
    <person key="alpage-2009-idm402038308688">
      <firstname>Éric</firstname>
      <lastname>Villemonte de La Clergerie</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>Chercheur</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>Junior Researcher (CR) Inria</moreinfo>
    </person>
    <person key="alpage-2010-idm152476240000">
      <firstname>Emmanuel</firstname>
      <lastname>Lassale</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>PhD student (ENS stipendium) Univ. Paris 7
      (since September 2010)</moreinfo>
    </person>
    <person key="alpage-2010-idm152476236784">
      <firstname>Pierre</firstname>
      <lastname>Magistry</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>PhD student (allocataire) Univ. Paris 7 (since
      September 2010)</moreinfo>
    </person>
    <person key="alpage-2009-idm402038296432">
      <firstname>Philippe</firstname>
      <lastname>Muller</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>delegation from Université Paul Sabatier, Toulouse,
      since September 2009</moreinfo>
    </person>
    <person key="alpage-2010-idm152476230416">
      <firstname>Yayoi</firstname>
      <lastname>Nakamura-Delloye</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>PostDoc</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>funded by the System@tic project Scribo (March to
      November 2010), then by the ANR project EDyLex (from December
      2010)</moreinfo>
    </person>
    <person key="alpage-2009-idm402038293216">
      <firstname>Gaëlle</firstname>
      <lastname>Recourcé</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>AutreCategorie</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>funded by the Scribo project, part-time, until June
      2010</moreinfo>
    </person>
    <person key="alpage-2009-idm402038290176">
      <firstname>Charlotte</firstname>
      <lastname>Roze</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>PhD student (allocataire) Univ. Paris 7 (since
      October 2009)</moreinfo>
    </person>
    <person key="atoll-2006-idm57727917280">
      <firstname>Benoît</firstname>
      <lastname>Sagot</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>Chercheur</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>Junior Researcher (CR) Inria</moreinfo>
    </person>
    <person key="alpage-2008-idm542378729584">
      <firstname>Djamé</firstname>
      <lastname>Seddah</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>Enseignant</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>Associate Professor (MC) Univ. Paris 4</moreinfo>
    </person>
    <person key="alpage-2009-idm402038280912">
      <firstname>Rosa</firstname>
      <lastname>Stern</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>PhD student (CIFRE) AFP &amp; Univ. Paris 7
      (since November 2009)</moreinfo>
    </person>
    <person key="alpage-2009-idm402038277728">
      <firstname>Sattisvar</firstname>
      <lastname>Tandabany</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>PostDoc</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>funded by the ANR project 
      <span class="smallcap" align="left">Sequoia</span> (from
      November 2009)</moreinfo>
    </person>
    <person key="alpage-2009-idm402038273904">
      <firstname>Juliette</firstname>
      <lastname>Thuilier</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>PhD student (allocataire) Univ. Paris 7 (since
      2008)</moreinfo>
    </person>
    <person key="alpage-2010-idm152477262864">
      <firstname>Tim</firstname>
      <lastname>Van de Cruys</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>PostDoc</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>funded by the System@tic project Scribo (May to
      December 2010)</moreinfo>
    </person>
  </team>
  <presentation id="uid2">
    <bodyTitle>Overall Objectives</bodyTitle>
    <subsection id="uid3" level="1">
      <bodyTitle>Overall Objectives</bodyTitle>
      <p>The Alpage team is specialized in 
      <b>Language modeling</b>, 
      <b>Computational linguistics</b> and 
      <b>Natural Language Processing (NLP)</b>. These fields are
      considered central in the new Inria strategic plan, and are
      indeed of crucial importance for the new information society.
      Applications of this domain of research include the numerous
      technologies grouped under the term of “language engineering”
      (information retrieval, information extraction, spelling,
      grammatical and semantic correction, automatic summarizing,
      machine translation, man machine communication, etc).</p>
      <p>NLP, the domain of Alpage, is a subfield of
      artificial intelligence, linguistics, and cognition. It
      studies the problems of automated understanding and
      generation of natural human languages. Natural language
      understanding systems convert samples of human language into
      more formal representations that are easier for computer
      programs to manipulate. Natural language generation systems
      convert information from computer databases into human
      language. Alpage focuses on 
      <i>text</i> understanding and text generation (as opposed
      to speech processing and generation).</p>
      <p>NLP applications are numerous, and include domains such as
      machine translation, question answering, information
      retrieval, information extraction, text simplification,
      automatic or computer-aided translation, automatic
      summarization, foreign language reading and writing aid.
      From a more research-oriented point of view, experimental
      linguistics can be also viewed as an “application” of
      NLP.</p>
      <p>NLP is a multidisciplinary domain. Indeed, it requires an
      expertise in formal and descriptive linguistics (to develop
      linguistic models of human languages), in computer science
      and algorithmics (to design and develop efficient programs
      that can deal with such models), in applied mathematics (to
      acquire automatically linguistic or general knowledge) and in
      other related fields. It is one of the specificities of
      Alpage to put together NLP specialists with a strong
      background in all these fields (in particular, linguistics
      for Paris 7 Alpage members, previously in the Lattice
      UMR, computer science and algorithmics for Inria
      members).</p>
      <p>One specificity of NLP is the diversity of human languages
      it has to deal with. Alpage focuses on French and English,
      but does not ignore other languages, through collaborations,
      in particular with those that are already studied by its
      members or by long-standing collaborators (e.g., Spanish,
      Polish, Slovak, Persian, Galician, and others). This is of
      course of high relevance, among others, for
      language-independent modeling and multi-lingual tools and
      applications.</p>
      <p>Alpage's overall objective is to develop linguistically
      relevant 
      <i>and</i> computationally efficient tools and resources for
      natural language processing and its applications. More
      specifically, Alpage focuses on the following topics:</p>
      <simplelist>
        <li id="uid4">
          <p noindent="true">Research topics:</p>
          <simplelist>
            <li id="uid5">
              <p noindent="true">deep syntactic modeling and
              parsing. This topic includes, but is not limited to,
              development of advanced parsing technologies,
              development of large-coverage and high-quality
              adaptive linguistic resources, and use of hybrid
              architectures coupling shallow parsing,
              (probabilistic and symbolic) deep parsing, and
              (probabilistic and symbolic) disambiguation
              techniques;</p>
            </li>
            <li id="uid6">
              <p noindent="true">modeling and processing of
              language at a supra-sentential level (discourse
              modeling and parsing, anaphora resolution, etc);</p>
            </li>
            <li id="uid7">
              <p noindent="true">NLP-based knowledge acquisition
              techniques</p>
            </li>
          </simplelist>
        </li>
        <li id="uid8">
          <p noindent="true">Application domains:</p>
          <simplelist>
            <li id="uid9">
              <p noindent="true">experimental linguistics;</p>
            </li>
            <li id="uid10">
              <p noindent="true">automatic information extraction
              (both linguistic information, inside a bootstrapping
              scheme for linguistic resources, and document
              content, with a more industry-oriented
              perspective);</p>
            </li>
            <li id="uid11">
              <p noindent="true">text mining;</p>
            </li>
            <li id="uid12">
              <p noindent="true">automatic generation;</p>
            </li>
            <li id="uid13">
              <p noindent="true">with a more long-term perspective,
              automatic or computer-aided translation, which is an
              historical domain of expertise for Talana.</p>
            </li>
          </simplelist>
        </li>
      </simplelist>
    </subsection>
    <subsection id="uid14" level="1">
      <bodyTitle>Highlights</bodyTitle>
      <p>2010 is a very important year for Alpage as the team's
      visibility, dissemination opportunities and involvement in
      projects and project proposals have broadened.</p>
      <p>First, Alpage's international connections and
      collaborations are now numerous and lead to concrete results,
      which shows that the team's work is recognized
      internationally. Alpage members are involved in a European
      (FP7) project proposal, have organized or are organizing several
      workshops (SPMRL at NAACL 2010, WoLeR at ESSLLI 2011, SSSST
      at ACL 2011), and are in charge of special issues in several
      journals (Computational Linguistics, TAL).</p>
      <p>Second, the number and impact of Alpage's industrial
      collaborations have increased significantly. Two members of
      Alpage also work for companies that exploit Alpage's results
      and technologies, including the INRIA spin-off 
      <i>Verbatim Analysis</i>. Two CIFRE PhDs (i.e., PhDs in
      collaboration with a company), one with AFP and one with
      Verbatim Analysis (starting Jan 1st, 2011) also contribute to
      transferring Alpage tools and resources to the industry.
      Thanks to the Iliatech day organized by INRIA and Alpage,
      which took place Oct 20, several other industrial contracts
      have been set up, some of them already accepted (with Lingua
      et Machina and Dated), another still under review by the
      Pôle de Compétitivité System@tic (with Diadeis).</p>
    </subsection>
  </presentation>
  <fondements id="uid15">
    <bodyTitle>Scientific Foundations</bodyTitle>
    <subsection id="uid16" level="1">
      <bodyTitle>From programming languages to linguistic
      grammars</bodyTitle>
      <participants>
        <person key="alpage-2009-idm402038308688">
          <firstname>Éric</firstname>
          <lastname>Villemonte de La Clergerie</lastname>
        </person>
        <person key="atoll-2006-idm57727917280">
          <firstname>Benoît</firstname>
          <lastname>Sagot</lastname>
        </person>
        <person key="atoll-2006-idm57727947600">
          <firstname>Pierre</firstname>
          <lastname>Boullier</lastname>
        </person>
      </participants>
      <p>Historically, several members of Alpage were originally
      specialists in the domain of modeling and parsing for
      programming languages, and have been working for more than 15 years
      on the generalization and extension of the techniques
      involved to the domain of natural language. The shift from
      programming language grammars to NLP grammars seriously
      increases complexity and requires ways to handle the
      ambiguities inherent in every human language. It is well
      known that these ambiguities are the sources of many badly
      handled combinatorial explosions.</p>
      <p>Furthermore, while most programming languages are
      expressed by (subclasses of) well-understood context-free
      grammars (CFGs), no consensual grammatical formalism has yet
      been accepted by the whole linguistic community for the
      description of human languages. On the contrary, new
      formalisms (or variants of older ones) appear constantly.
      Many of them may be classified into the three following large
      families:</p>
      <descriptionlist>
        <label>Mildly Context-Sensitive (MCS) formalisms</label>
        <li id="uid17">
          <p noindent="true">They manipulate possibly complex
          elementary structures with enough restrictions to ensure
          the possibility of parsing with polynomial time
          complexities. They include, for instance, Tree Adjoining
          Grammars (TAGs) and Multi-component TAGs with trees as
          elementary structures, Linear Indexed Grammars (LIGs).
          Although they are strictly more powerful than MCS
          formalisms, Range Concatenation Grammars (RCGs,
          introduced and used by Alpage members, such as Pierre
          Boullier and Benoît Sagot 
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid0" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid1" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid2" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>) are also parsable in
          polynomial time.</p>
        </li>
        <label>Unification-based formalisms</label>
        <li id="uid18">
          <p noindent="true">They combine a context-free backbone
          with logic arguments as decoration on non-terminals. Most
          famous representatives are Definite Clause Grammars
          (DCGs) where PROLOG's powerful unification is used to
          compute and propagate these logic arguments. More recent
          formalisms, like Lexical Functional Grammars (LFGs) and
          Head-Driven Phrase Structure Grammars (HPSGs) rely on
          more expressive Typed Feature Structures (TFS) or
          constraints.</p>
        </li>
        <label>Unification-based formalisms with an MCS
        backbone</label>
        <li id="uid19">
          <p noindent="true">The two above-mentioned
          characteristics may be combined, for instance by adding
          logic arguments or constraints to non-terminals in
          TAGs.</p>
        </li>
      </descriptionlist>
      <p>An efficient way to develop large-coverage hand-crafted
      symbolic grammars is to use adequate tools and adequate
      levels of representation, and in particular Meta-Grammars,
      one of Alpage's areas of expertise 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid3" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid4" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. Meta-Grammars allow the
      linguist to focus on a modular description of the linguistic
      aspects of a grammar, rather than focusing on the specific
      aspects of a given grammatical formalism. Translation from
      MGs to grammatical formalisms such as TAG or LFG may be
      automatically handled. Graphical environments can be used to
      design MGs and their modularity provides a promising way for
      sharing the description of common linguistic phenomena across
      human languages.</p>
    </subsection>
    <subsection id="uid20" level="1">
      <bodyTitle>Statistical Parsing</bodyTitle>
      <p>Contrary to symbolic approaches to parsing, in statistical
      parsing, the grammar is extracted from a corpus of syntactic
      trees: a treebank. The main advantage of the statistical
      approach is to encode within the same framework the parsing
      and disambiguating tasks. The extracted grammar rules are
      associated with probabilities that make it possible to score and rank
      the output parse trees of an input sentence. This obvious
      advantage of probabilistic context-free grammars has long
      been counterbalanced by two main shortcomings that resulted
      in poor performance for plain PCFG parsers: (i) the
      generalization encoded in non-terminal symbols that stand for
      syntagmatic phrases is too coarse (so probabilistic
      independence between rules is too strong an assertion) and
      (ii) lexical items are underused. In the last decade though,
      effective solutions to these shortcomings have been proposed.
      Symbol annotation, either manual 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid5" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> or automatic 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid6" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid7" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> captures inter-dependence between
      CFG rules. Lexical information is integrated in frameworks
      such as head-driven models that allow lexical heads to
      percolate up the syntagmatic tree 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid8" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, or probabilistic models derived
      from lexicalized Tree Adjoining grammars, such as Stochastic
      Tree Insertion Grammars 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid9" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>.</p>
      <p>In the same period, totally different parsing
      architectures have been proposed, to obtain dependency-based
      syntactic representations. The properties of dependency
      structures, in which each word is related to exactly one
      other word, make it possible to define dependency parsing as
      a sequence of simple actions (such as read buffer and store
      word on top of a stack, attach read word as dependent of
      stack top word, attach read word as governor of stack top
      word ...) 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid10" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid11" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. Classifiers can be trained to
      choose the best action to perform given a partial parsing
      configuration. In another approach, dependency parsing is
      cast into the problem of finding the maximum spanning tree
      within the graph of all possible word-to-word dependencies,
      and online classification is used to weight the edges 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid12" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. These two kinds of statistical
      dependency parsing make it possible to benefit from discriminative
      learning, and its ability to easily integrate various kinds
      of features, which is typically needed in a complex task such
      as parsing.</p>
      <p>Statistical parsing is now effective, both for syntagmatic
      representations and dependency-based syntactic
      representations. Alpage has obtained state-of-the-art parsing
      results for French, by adapting various parser learners for
      French, and works on the current challenges in statistical
      parsing, namely (1) robustness and portability across domains
      and (2) the ability to incorporate exogenous data to improve
      parsing attachment decisions. We review below the approaches
      that Alpage has tested and adapted, and the techniques that
      we plan to investigate to answer these challenges.</p>
      <p>In order to investigate statistical parsers for French, we
      first worked on how to use the French Treebank 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid13" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> and derive the best input for
      syntagmatic statistical parsing 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid14" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. Benchmarking several PCFG-based
      learning frameworks 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid15" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> has led to state-of-the-art
      results for French, the best performance being obtained with
      the split-merge Berkeley parser (PCFG with latent
      annotations) 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid7" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>.</p>
      <p noindent="true">In parallel to the work on dependency
      based representation, presented in the next paragraph, we
      also conducted a preliminary set of experiments on richer
      parsing models based on Stochastic Tree Insertion Grammars as
      used in 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid9" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> and which, despite their inferior
      performance compared to PCFG-LA based parsers, yield promising
      results with respect to dependencies that can be extracted
      from derivation trees. One variation we explored, that uses a
      specific TIG grammar instance, a 
      <i>vertical</i> grammar called a 
      <i>spinal</i> grammar, exhibits interesting properties with respect to
      the grammar size typically extracted from treebanks (a few
      hundred unlexicalized trees, compared to 14,000 CFG rules).
      These models are currently being investigated in our team 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid16" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>.</p>
      <p>Pursuing our work on PCFG-LA based parsing, we
      investigated the automatic conversion of the treebank into
      dependency syntax representations 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid17" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, that are easier to use for
      various NLP applications such as question-answering or
      information extraction, and that are a better ground for
      further semantic analysis. This conversion can be applied on
      the treebank, before training a dependency-based parser, or
      on PCFG-LA parsed trees. This gives the possibility to
      evaluate and compare on the same gold data, both syntagmatic-
      and dependency-based statistical parsing. This also paved the
      way for studies on the influence of various types of lexical
      information. Results are described in sections 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid74" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> and 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid72" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>.</p>
    </subsection>
    <subsection id="uid21" level="1">
      <bodyTitle>Dynamic wide coverage lexical
      resources</bodyTitle>
      <participants>
        <person key="atoll-2006-idm57727917280">
          <firstname>Benoît</firstname>
          <lastname>Sagot</lastname>
        </person>
        <person key="alpage-2008-idm542378767840">
          <firstname>Laurence</firstname>
          <lastname>Danlos</lastname>
        </person>
        <person key="alpage-2009-idm402038280912">
          <firstname>Rosa</firstname>
          <lastname>Stern</lastname>
        </person>
        <person key="alpage-2009-idm402038308688">
          <firstname>Éric</firstname>
          <lastname>Villemonte de La Clergerie</lastname>
        </person>
      </participants>
      <p>Grammatical formalisms and associated parsing generators
      are useful only when used together with linguistic resources
      (lexicons, grammars) so as to build operational parsers,
      especially when considering modern lexically oriented
      grammatical formalisms. Hence, linguistic resources are the
      topic of the following section.</p>
      <p>However, wide coverage linguistic resources are scarce and
      expensive, because they are difficult to build, especially
      when hand-crafted. This observation motivates us to
      investigate methods, alongside manual development techniques,
      to automatically or semi-automatically acquire, supplement
      and correct linguistic resources.</p>
      <p>Linguistic expertise remains a very important asset to
      benefit efficiently from such techniques, including those
      described below. Moreover, linguistically oriented
      environments with adequate collaborative interfaces are
      needed to facilitate the edition, comparison, validation and
      maintenance of large scale linguistic resources. Just to give
      some idea of the complexity, a syntactic lexicon, as
      described below, should provide rich information for several
      tens of thousands of lemmas and several hundreds of thousands
      of forms.</p>
      <p>Successful experiments have been conducted by Alpage
      members with different languages for the automatic
      acquisition of morphological knowledge from raw corpora 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid18" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. At the syntactic level, work
      has been achieved on automatic acquisition of atomic
      syntactic information and automatic detection of errors in
      the lexicon 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid19" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid20" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. At the semantic level,
      automatic wordnet development tools have been described 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid21" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid22" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid23" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid24" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. All such techniques need of
      course to be followed by manual validation, so as to ensure
      high-quality results.</p>
      <p>For French, these techniques, and others, have led some
      Alpage members to develop one of the main syntactic resources
      for French, the Le 
      <i>fff</i>
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid25" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid26" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, developed within the Alexina
      framework, as well as a wordnet for French, the WOLF 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid27" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, the first freely available
      resource of the kind.</p>
      <p>In the last 2 years, Alpage members have shown how to
      benefit from other more linguistically-oriented resources,
      such as the Lexique-Grammaire and 
      <span class="smallcap" align="left">Dicovalence</span>, in
      order to improve the coverage and quality of the Le 
      <i>fff</i>and the WOLF. This work is a good example of how
      Inria and Paris 7 members of Alpage fruitfully
      collaborate: this collaboration between NLP computer
      scientists and NLP linguists has resulted in significant
      advances which would not have been possible otherwise.</p>
      <p>Moreover, an increasing effort has been made towards
      multilingual aspects. In particular, Alexina lexicons
      developed in 2009 or before exist for Slovak 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid18" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, Polish 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid28" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, English, Spanish and Persian
      (although very preliminarily before 2010, see 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid85" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>), not including freely-available
      lexicons adapted to the Alexina framework.</p>
    </subsection>
    <subsection id="uid22" level="1">
      <bodyTitle>Shallow processing</bodyTitle>
      <participants>
        <person key="alpage-2009-idm402038308688">
          <firstname>Éric</firstname>
          <lastname>Villemonte de La Clergerie</lastname>
        </person>
        <person key="atoll-2006-idm57727917280">
          <firstname>Benoît</firstname>
          <lastname>Sagot</lastname>
        </person>
        <person key="alpage-2009-idm402038280912">
          <firstname>Rosa</firstname>
          <lastname>Stern</lastname>
        </person>
      </participants>
      <p>The constitution of resources such as lexica or grammars
      raises the issues of the evaluation of these resources to
      assess their quality and coverage. For this reason, Alpage is
      the leader of the PASSAGE ANR project (ended in June 2010),
      which is the follow-up of the EASy parsing evaluation
      campaign held in 2004 and conducted by team LIR at LIMSI.</p>
      <p>However, although developing parsing techniques, grammars
      (symbolic or probabilistic), and lexica constitute obviously
      the key efforts towards deep large-scale linguistic
      processing, these components need to be included inside a
      full and robust processing chain, able to handle any text
      from any source. The development of such linguistic chains,
      such as 
      <span class="smallcap" align="left">Sx</span>Pipe, is not a
      trivial task 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid29" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. Moreover, when used as a
      preliminary step before parsers, the quality of parsers'
      results strongly depends on the quality of such chains. In
      that regard, less-standard pre-processings such as word
      clustering show promising results (see, e.g., section  
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid72" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>).</p>
      <p>In fact, such processing chains are mostly used as such,
      and not only as pre-processing tools before parsing. They aim
      at performing the basic tasks that produce immediately usable
      results for many applications, such as tokenization, sentence
      segmentation, spelling correction, and, most importantly,
      named entity detection, disambiguation and resolution (see
      section  
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid84" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>).</p>
    </subsection>
    <subsection id="uid23" level="1">
      <bodyTitle>Discourse structures</bodyTitle>
      <participants>
        <person key="alpage-2008-idm542378767840">
          <firstname>Laurence</firstname>
          <lastname>Danlos</lastname>
        </person>
        <person key="alpage-2009-idm402038290176">
          <firstname>Charlotte</firstname>
          <lastname>Roze</lastname>
        </person>
        <person key="alpage-2008-idm542378764240">
          <firstname>Pascal</firstname>
          <lastname>Denis</lastname>
        </person>
        <person key="alpage-2009-idm402038296432">
          <firstname>Philippe</firstname>
          <lastname>Muller</lastname>
        </person>
      </participants>
      <p>Until now, the linguistic modeling and automatic
      processing of sentences has been the main focus of the
      community. However, many applications would benefit from more
      large-scale approaches which go beyond the level of
      sentences. This is not only the case for automatic
      translation: information extraction/retrieval, summarizing,
      and other applications do need to resolve anaphoras, which in
      turn can benefit from the availability of hierarchical
      discourse structures induced by discourse relations (in
      particular through the notion of right frontier of discourse
      structures). Moreover, discourse structures are required to
      extract sequential (chronological, logical,...) or
      hierarchical representations of events. They are also useful for
      topic extraction, which in turn can help syntactic and
      semantic disambiguation.</p>
      <p>Although supra-sentential problematics received increasing
      attention in the last years, there is no satisfying solution
      to these problems. Among them, anaphora resolution and
      discourse structures have a far-reaching impact and are
      domains of expertise of Alpage members. But their formal
      modeling has now reached a maturity which allows them to be
      integrated, in the near future, into future Alpage tools, including
      parsing systems inherited from Atoll.</p>
      <p>It is well known that a text is not a random sequence of
      sentences: sentences are linked to one another by
      “discourse relations”, which give to the text a hierarchical
      structure. Traditionally, it is considered that discourse
      relations are lexicalized by connectors (adverbial connectors
      like 
      <i>ensuite</i>, conjunctions like 
      <i>parce que</i>), or are not lexicalized. This vision is
      however too simple:</p>
      <simplelist>
        <li id="uid24">
          <p noindent="true">first, some connectors (in particular
          conjunctions of subordination) introduce pure modifiers
          and must not be considered as bearing discourse
          relations,</p>
        </li>
        <li id="uid25">
          <p noindent="true">second, other elements than connectors
          can lexicalize discourse relations, in particular verbs
          like 
          <i>précéder / to precede</i>or 
          <i>causer / to cause</i>, which have facts or fact
          eventualities as arguments 
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid30" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>.</p>
        </li>
      </simplelist>
      <p>There are three main frameworks used to model discourse
      structures: RST, SDRT, and, more recently, D-LTAG. Inside
      Alpage, Laurence Danlos has introduced 
      <span class="smallcap" align="left">d-stag</span>(Discourse
      Synchronous TAGs, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid31" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid32" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>), which subsumes in an elegant
      way both SDRT and RST, to the extent that SDRT and RST
      structures can be obtained by two different partial
      projections of 
      <span class="smallcap" align="left">d-stag</span>structures.
      As done in D-LTAG, 
      <span class="smallcap" align="left">d-stag</span>extends a
      lexicalized TAG analysis so as to deal with the level of
      discourse. 
      <span class="smallcap" align="left">d-stag</span>has been
      fully formalized, and is hence possible to implement (thanks
      to Synchronous TAG, or even TAG parsers), provided one
      develops linguistic descriptions in this formalism.</p>
    </subsection>
    <subsection id="uid26" level="1">
      <bodyTitle>Coreference resolution</bodyTitle>
      <participants>
        <person key="alpage-2008-idm542378764240">
          <firstname>Pascal</firstname>
          <lastname>Denis</lastname>
        </person>
        <person key="alpage-2009-idm402038296432">
          <firstname>Philippe</firstname>
          <lastname>Muller</lastname>
        </person>
        <person key="alpage-2008-idm542378755024">
          <firstname>Elżbieta</firstname>
          <lastname>Gryglicka</lastname>
        </person>
        <person key="alpage-2008-idm542378767840">
          <firstname>Laurence</firstname>
          <lastname>Danlos</lastname>
        </person>
      </participants>
      <p>An important challenge for the understanding of natural
      language texts is the correct computation of the 
      <i>discourse entities</i>that are mentioned therein —persons,
      locations, abstract objects, and so on. In addition to
      identifying individual referential expressions (e.g., 
      <i>Nicolas Sarkozy</i>, 
      <i>Neuilly</i>, 
      <i>l'UMP</i>) and properly typing them (e.g. 
      <i>Nicolas Sarkozy</i>is a 
      <span class="smallcap" align="left">person</span>, 
      <i>Neuilly</i>is a 
      <span class="smallcap" align="left">lieu</span>), the task is
      also to determine the other mentions with which these
      expressions are coreferential. Part of the difficulty of this
      task is that natural languages provide many ways to refer to
      the same entity (including the use of pronouns such as 
      <i>il</i>, 
      <i>ses</i>and definite descriptions such as 
      <i>le président</i>), making them highly ambiguous. The
      identification of coreferential links and other anaphoric
      links (such as “associative anaphora”) plays a key role for
      various applications, such as extraction and retrieval of
      information, but also summarization or automatic
      question-answering systems. This central role of coreference
      resolution has been recognized by the inclusion of this task
      in different international evaluation campaigns, beginning
      with the campaigns 
      <i>Message Understanding Conference</i>(in particular, 
      <span class="smallcap" align="left">muc-6</span>and 
      <span class="smallcap" align="left">muc-7</span>) 
      <footnote id="uid27" id-text="1">See, respectively: 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://www.cs.nyu.edu/cs/faculty/grishman/muc6.html" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
      <allowbreak/>www. 
      <allowbreak/>cs. 
      <allowbreak/>nyu. 
      <allowbreak/>edu/ 
      <allowbreak/>cs/ 
      <allowbreak/>faculty/ 
      <allowbreak/>grishman/ 
      <allowbreak/>muc6. 
      <allowbreak/>html</ref>and 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://www.itl.nist.gov/iaui/894.02/related_projects/muc/proceedings/muc_7_toc.html" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
      <allowbreak/>www. 
      <allowbreak/>itl. 
      <allowbreak/>nist. 
      <allowbreak/>gov/ 
      <allowbreak/>iaui/ 
      <allowbreak/>894. 
      <allowbreak/>02/ 
      <allowbreak/>related_projects/ 
      <allowbreak/>muc/ 
      <allowbreak/>proceedings/ 
      <allowbreak/>muc_7_toc. 
      <allowbreak/>html</ref>.</footnote>, and more recently 
      <i>Automatic Content Extraction</i>( 
      <span class="smallcap" align="left">ace</span>) 
      <footnote id="uid28" id-text="2"><ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://www.nist.gov/speech/tests/ace/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
        <allowbreak/>www. 
        <allowbreak/>nist. 
        <allowbreak/>gov/ 
        <allowbreak/>speech/ 
        <allowbreak/>tests/ 
        <allowbreak/>ace/ 
        <allowbreak/></ref></footnote>and 
      <i>Anaphora Resolution Evaluation</i>( 
      <span class="smallcap" align="left">are</span>) 
      <footnote id="uid29" id-text="3"><ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://clg.wlv.ac.uk/events/ARE/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
        <allowbreak/>clg. 
        <allowbreak/>wlv. 
        <allowbreak/>ac. 
        <allowbreak/>uk/ 
        <allowbreak/>events/ 
        <allowbreak/>ARE/ 
        <allowbreak/></ref></footnote>. The creation and distribution of corpora
      developed as part of these campaigns have significantly
      boosted research in automatic coreference resolution. In
      particular, they have made possible the application of
      machine learning techniques (mostly supervised ones) to the
      problem of coreference resolution. This in turn has led to
      the development of systems that were both more robust and
      more precise, thus making more realistic their integration
      within these larger systems. Some of the best systems based
      on supervised learning methods are described in 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid33" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid34" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid35" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid36" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid37" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>; 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid38" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. Note that a few attempts were
      also made at using unsupervised techniques (mostly clustering
      methods) for the task 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid39" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid40" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, but these systems are still far
      from reaching the performance of their supervised
      counterparts.</p>
    </subsection>
  </fondements>
  <domaine id="uid30">
    <bodyTitle>Application Domains</bodyTitle>
    <subsection id="uid31" level="1">
      <bodyTitle>Panorama</bodyTitle>
      <p>NLP tools and methods have many possible domains of
      application. Some of them are already mature enough to be
      commercialized. They can be roughly classified into four
      groups:</p>
      <descriptionlist>
        <label>Human-computer interaction</label>
        <li id="uid32">
          <p noindent="true">: mostly speech processing and
          text-to-speech, often in a dialogue context; today,
          commercial offers are limited to restricted domains
          (train tickets reservation...);</p>
        </li>
        <label>Language writing aid</label>
        <li id="uid33">
          <p noindent="true">: spelling, grammatical and stylistic
          correctors for text editors, controlled-language writing
          aids (e.g., for technical documents), memory-based
          translation aid, foreign language learning tools, as well
          as vocal dictation;</p>
        </li>
        <label>Access to information</label>
        <li id="uid34">
          <p noindent="true">: tools to enable a better access to
          information present in huge collections of texts (e.g.,
          the Internet): automatic document classification,
          automatic document structuring, automatic summarizing,
          information acquisition and extraction, text mining,
          question-answering systems, as well as surface machine
          translation. Information access to speech archives
          through transcriptions is also an emerging field.</p>
        </li>
        <label>Experimental linguistics</label>
        <li id="uid35">
          <p noindent="true">: tools to explore language in an
          objective way (this is related, but not limited to corpus
          linguistics).</p>
        </li>
      </descriptionlist>
      <p>Alpage focuses on some applications included in the last
      three points, such as information extraction and (linguistic
      and extra-linguistic) knowledge acquisition ( 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid36" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>), text mining ( 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid37" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>), text generation ( 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid40" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>), spelling correction ( 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid41" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>) and experimental linguistics ( 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid42" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>).</p>
    </subsection>
    <subsection id="uid36" level="1">
      <bodyTitle>Information extraction and knowledge
      acquisition</bodyTitle>
      <participants>
        <person key="alpage-2009-idm402038308688">
          <firstname>Éric</firstname>
          <lastname>Villemonte de La Clergerie</lastname>
        </person>
        <person key="alpage-2008-idm542378774048">
          <firstname>François-Régis</firstname>
          <lastname>Chaumartin</lastname>
        </person>
        <person key="alpage-2009-idm402038280912">
          <firstname>Rosa</firstname>
          <lastname>Stern</lastname>
        </person>
        <person key="alpage-2010-idm152476259776">
          <firstname>Kata</firstname>
          <lastname>Gábor</lastname>
        </person>
        <person key="PASUSERID">
          <firstname>Tim</firstname>
          <lastname>van de Cruys</lastname>
        </person>
        <person key="alpage-2010-idm152476230416">
          <firstname>Yayoi</firstname>
          <lastname>Nakamura-Delloye</lastname>
        </person>
        <person key="alpage-2010-idm152476291760">
          <firstname>Marianna</firstname>
          <lastname>Apidianaki</lastname>
        </person>
        <person key="atoll-2006-idm57727917280">
          <firstname>Benoît</firstname>
          <lastname>Sagot</lastname>
        </person>
      </participants>
      <p>The first domain of application for Alpage parsing systems
      is information extraction, and in particular knowledge
      acquisition, be it linguistic or not, and text mining.</p>
      <p>Knowledge acquisition for a given restricted domain is
      something that has already been studied by some Alpage
      members for several years (ACI Biotim, biographic information
      extraction from the Maitron corpus, Scribo project).
      François-Régis Chaumartin, PhD student at Alpage and CEO of
      Proxem, is working on information extraction from the English
      Wikipedia. Indeed, chunking or, better, syntactic (and
      semantic) parsing gives an access, through learning
      techniques, to useful information present in documents.
      Obviously, the progressive extension of Alpage parsing
      systems to a full syntactic 
      <i>and</i>semantic parsing will increase the quality of the
      extracted information, as well as the scope of information
      that can be extracted. Such knowledge acquisition efforts
      bring solutions to current problems related to information
      access and fit into the emerging notion of 
      <i>Semantic Web</i>. The transition from a web based on data
      (textual documents,...) to a web based on knowledge requires
      linguistic processing tools which are able to provide fine
      grained pieces of information, in particular by relying on
      high-quality deep parsing. For a given domain of knowledge
      (say, tourism), the extraction of a domain ontology that
      represents its key concepts and the relations between them is
      a crucial task, which has a lot in common with the extraction
      of linguistic information.</p>
      <p>All these applications in the domain of information
      extraction raise exciting challenges that require altogether
      ideas and tools coming from the domains of computational
      linguistics, machine learning and knowledge
      representation.</p>
    </subsection>
    <subsection id="uid37" level="1">
      <bodyTitle>Processing answers to open-ended questions in
      surveys: 
      <i>vera</i></bodyTitle>
      <participants>
        <person key="atoll-2006-idm57727917280">
          <firstname>Benoît</firstname>
          <lastname>Sagot</lastname>
        </person>
      </participants>
      <p>Verbatim Analysis is a startup co-created by Benoît Sagot
      from Alpage and Dimitri Tcherniak from Towers Watson, a
      world-wide leader in the domain of employee research (opinion
      mining among the employees of a company or organization). The
      aim of its first product, 
      <i>vera</i>, is to provide an all-in-one environment for
      editing (i.e., normalizing the spelling and typography),
      understanding and classifying answers to open-ended
      questions, and relating them with closed-ended questions, so
      as to extract as much valuable information as possible from
      both types of questions. The editing part relies in part on 
      <span class="smallcap" align="left">Sx</span>Pipe (see
      section  
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid48" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>) and Alexina morphological
      lexicons. Several other parts of 
      <i>vera</i>are co-owned by Verbatim Analysis and by
      INRIA.</p>
    </subsection>
    <subsection id="uid38" level="1">
      <bodyTitle>Shallow processing of e-mails</bodyTitle>
      <participants>
        <person key="atoll-2006-idm57727917280">
          <firstname>Benoît</firstname>
          <lastname>Sagot</lastname>
        </person>
        <person key="alpage-2008-idm542378767840">
          <firstname>Laurence</firstname>
          <lastname>Danlos</lastname>
        </person>
      </participants>
      <p>Shallow processing is one of the most important NLP
      application domains. This includes, in particular, detecting
      named entities in a broad sense (person names, organization
      names, locations, addresses, date and time mentions, and
      others), with many possible purposes, such as text
      normalization and even anonymization, but more importantly
      for extracting events and other kinds of structured
      information from text. This is what the new company Kwaga is
      trying to do on e-mails, challenging difficulties related to
      the high level of noise that characterizes e-mail corpora
      (spelling mistakes, shortenings, inter-e-mail structure...).
      In 2009-2010, an ARITT contract has been set up to try and
      study the usability of Alpage's 
      <span class="smallcap" align="left">Sx</span>Pipe shallow
      processing chain for part of this purpose.</p>
    </subsection>
    <subsection id="uid39" level="1">
      <bodyTitle>Multilingual terminologies and lexical resources
      for companies</bodyTitle>
      <participants>
        <person key="alpage-2009-idm402038308688">
          <firstname>Éric</firstname>
          <lastname>Villemonte de La Clergerie</lastname>
        </person>
        <person key="atoll-2006-idm57727917280">
          <firstname>Benoît</firstname>
          <lastname>Sagot</lastname>
        </person>
      </participants>
      <p>Lingua et Machina is a small company now headed by François
      Brown de Colstoun, a former INRIA researcher, that provides
      services for developing specialized multilingual
      terminologies for its clients. It develops the framework
      Libellex for validating such terminologies. A formal
      collaboration with ALPAGE is under preparation, centered
      around the joint extension and improvement of Lingua et
      Machina’s and ALPAGE’s lexical resources and associated
      tools.</p>
    </subsection>
    <subsection id="uid40" level="1">
      <bodyTitle>Generation of textual reports about statistical
      data: EASYTEXT</bodyTitle>
      <participants>
        <person key="alpage-2008-idm542378767840">
          <firstname>Laurence</firstname>
          <lastname>Danlos</lastname>
        </person>
      </participants>
      <p>In 2010, the generation system EASYTEXT has been polished
      up so that it is operational at Kantar Media, which sold it
      to a number of customers. As Kantar Media was pleasantly
      surprised by the quality of the automatically generated
      texts, they asked for further extensions of EASYTEXT which
      are currently worked on, especially an extension to generate
      English texts.</p>
      <p>A paper describing roughly this system and the economic
      stakes of Natural Language Generation has been published in 
      <i>La Recherche</i>
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid41" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. See also a column in 
      <i>La Tribune</i>(9/11/2010).</p>
      <p>Another application of NLG we foresee is the automatic
      production of captions for photos. There are ongoing
      discussions with AFP ( 
      <i>Agence France-Presse</i>) on the topic.</p>
    </subsection>
    <subsection id="uid41" level="1">
      <bodyTitle>Automatic and semi-automatic spelling correction
      in an industrial setting</bodyTitle>
      <participants>
        <person key="atoll-2006-idm57727917280">
          <firstname>Benoît</firstname>
          <lastname>Sagot</lastname>
        </person>
        <person key="alpage-2009-idm402038308688">
          <firstname>Éric</firstname>
          <lastname>Villemonte de La Clergerie</lastname>
        </person>
        <person key="alpage-2008-idm542378767840">
          <firstname>Laurence</firstname>
          <lastname>Danlos</lastname>
        </person>
      </participants>
      <p>NLP tools and resources used for spelling correction, such
      as large n-gram collections, POS taggers and finite-state
      machinery are now mature and precise. In industrial settings
      such as post-processing after large-scale OCR, these tools
      and resources should enable spelling correction tools to work
      on a much larger scale and with a much better precision than
      what can be found in different contexts with different
      constraints (e.g., in text editors). Moreover, such
      industrial contexts allow for a non-costly manual
      intervention, in case one is able to identify the most
      uncertain corrections. An FUI project on this topic has been
      proposed in collaboration with Diadeis, a company specialized
      in text digitalization, and two other partners. It is
      currently under review.</p>
    </subsection>
    <subsection id="uid42" level="1">
      <bodyTitle>Experimental linguistics</bodyTitle>
      <participants>
        <person key="alpage-2008-idm542378770960">
          <firstname>Benoît</firstname>
          <lastname>Crabbé</lastname>
        </person>
        <person key="alpage-2009-idm402038273904">
          <firstname>Juliette</firstname>
          <lastname>Thuilier</lastname>
        </person>
        <person key="alpage-2009-idm402038353920">
          <firstname>Luc</firstname>
          <lastname>Boruta</lastname>
        </person>
      </participants>
      <p>Alpage is a team that dedicates efforts to producing
      resources and algorithms for processing large amounts of
      textual materials. These resources can be applied not only
      for purely NLP purposes but also for linguistic purposes.
      Indeed, the specific needs of NLP applications led to the
      development of electronic linguistic resources (in particular
      lexica, annotated corpora, and treebanks) that are
      sufficiently large for carrying out statistical analyses on
      linguistic issues. In the last 10 years, pioneering work has
      started to apply these new data sources to the study of English
      grammar, leading to important new results in such areas as
      the study of syntactic preferences 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid42" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid43" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, the existence of graded
      grammaticality judgments 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid44" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>.</p>
      <p>The reasons for the growing interest in statistical
      modelling of language can be traced back by looking at the
      recent history of grammatical works in linguistics. In the
      1980s and 1990s, theoretical grammarians have been mostly
      concerned with improving the conceptual underpinnings of
      their respective subfields, in particular through the
      construction and refinement of formal models. In syntax, the
      relative consensus on a generative-transformational approach 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid45" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>gave way on the one hand to more
      abstract characterizations of the language faculty 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid45" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, and on the other hand to the
      construction of detailed, formally explicit, and often
      implemented, alternative formulations of the generative
      approach 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid46" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid47" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. For French several grammars
      have been implemented in this trend, among which the tree
      adjoining grammars of 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid48" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid49" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>among others. This general
      movement led to much improved descriptions and understanding
      of the conceptual underpinnings of both linguistic competence
      and language use. It was in large part catalyzed by a
      convergence of interests of logical, linguistic and
      computational approaches to grammatical phenomena.</p>
      <p>However, starting in the 1990s, a growing portion of the
      community started being frustrated by the paucity and
      unreliability of the empirical evidence underlying their
      research. In syntax, data was generally collected
      impressionistically, either as ad-hoc small samples of
      language use, or as ill-understood and little-controlled
      grammaticality judgements (Schütze 1995). The resulting shift towards
      quantitative methods is also a shift towards new scientific
      questions and new scientific fields. Using richly annotated
      data and statistical modelling, we address questions that
      could not be addressed by previous methodology in
      linguistics. In this line, at Alpage we have started
      investigating the question of choice in French syntax with a
      statistical modelling methodology. Currently two studies are
      being led on the position of attributive adjectives
      w.r.t. the noun and the relative position of postverbal
      complements. This research has contributed to establishing new
      links with the Laboratoire de Linguistique Formelle (LLF,
      Paris 7) and the Laboratoire de Psychologie et
      Neuropsychologie Cognitives (LPNCog, Paris 5) with which we
      intend to submit joint research projects next year.</p>
      <p>On the other hand we have also started a collaboration
      with the Laboratoire de Sciences Cognitives de Paris
      (LSCP/ENS) where we explore the design of algorithms towards
      the statistical modelling of language acquisition
      (phonological acquisition). This is currently supported by
      one PhD project.</p>
    </subsection>
  </domaine>
  <logiciels id="uid43">
    <bodyTitle>Software</bodyTitle>
    <subsection id="uid44" level="1">
      <bodyTitle>
        <span class="smallcap" align="left">Syntax</span>
      </bodyTitle>
      <participants>
        <person key="atoll-2006-idm57727947600">
          <firstname>Pierre</firstname>
          <lastname>Boullier</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
        <person key="alpage-2009-idm402038277728">
          <firstname>Sattisvar</firstname>
          <lastname>Tandabany</lastname>
        </person>
        <person key="atoll-2006-idm57727917280">
          <firstname>Benoît</firstname>
          <lastname>Sagot</lastname>
        </person>
      </participants>
      <moreinfo>
        <p>See also the web page 
        <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://syntax.gforge.inria.fr/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
        <allowbreak/>syntax. 
        <allowbreak/>gforge. 
        <allowbreak/>inria. 
        <allowbreak/>fr/ 
        <allowbreak/></ref>.</p>
      </moreinfo>
      <p>The (currently beta) version 6.0 of the 
      <span class="smallcap" align="left">Syntax</span>system
      (freely available on INRIA GForge) includes various
      deterministic and non-deterministic CFG parser generators. It
      includes in particular an efficient implementation of the
      Earley algorithm, with many original optimizations, that is
      used in several of Alpage's NLP tools, including the
      pre-processing chain 
      <span class="smallcap" align="left">Sx</span>Pipe and the LFG
      deep parser 
      <span class="smallcap" align="left">SxLfg</span>. This
      implementation of the Earley algorithm has been recently
      extended to handle probabilistic CFG (PCFG), by taking into
      account probabilities both during parsing (beam) and after
      parsing ( 
      <span class="math"><hi rend="it">n</hi></span>-best computation). 
      <span class="smallcap" align="left">Syntax</span>6.0 also
      includes parsers for various contextual formalisms, including
      a parser for Range Concatenation Grammars (RCG) that can be
      used among others for TAG and MC-TAG parsing.</p>
      <p>Direct users of 
      <span class="smallcap" align="left">Syntax</span>for NLP,
      outside Alpage, include Alexis Nasr (Marseilles) and other
      members of the 
      <span class="smallcap" align="left">Sequoia</span>ANR project
      (see section  
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid94" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>), Owen Rambow and co-workers at
      Columbia University (New York), as well as (indirectly) all 
      <span class="smallcap" align="left">Sx</span>Pipe and/or 
      <span class="smallcap" align="left">SxLfg</span>users. The
      project-team VASY (INRIA Rhône-Alpes) is one of 
      <span class="smallcap" align="left">Syntax</span>' users for
      non-NLP applications.</p>
    </subsection>
    <subsection id="uid45" level="1">
      <bodyTitle>System 
      <span class="smallcap" align="left">DyALog</span></bodyTitle>
      <participants>
        <person key="alpage-2009-idm402038308688">
          <firstname>Éric</firstname>
          <lastname>Villemonte de La Clergerie</lastname>
          <moreinfo>maintainer</moreinfo>
        </person>
      </participants>
      <moreinfo>
        <p><span class="smallcap" align="left">DyALog</span>on INRIA
        GForge: 
        <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://dyalog.gforge.inria.fr/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
        <allowbreak/>dyalog. 
        <allowbreak/>gforge. 
        <allowbreak/>inria. 
        <allowbreak/>fr/ 
        <allowbreak/></ref></p>
      </moreinfo>
      <p><span class="smallcap" align="left">DyALog</span>provides an
      environment to compile and execute grammars and logic
      programs. It is essentially based on the notion of
      tabulation, i.e. of sharing computations by tabulating traces
      of them. 
      <span class="smallcap" align="left">DyALog</span>is mainly
      used to build parsers for Natural Language Processing (NLP).
      It may nevertheless be used as a replacement for traditional
      PROLOG systems in the context of highly ambiguous
      applications where sub-computations can be shared.</p>
      <p>The current release 
      <b>1.13.0</b>of 
      <span class="smallcap" align="left">DyALog</span>is freely
      available by FTP under an open source license and runs on
      Linux platforms for x86 and x86_64 architectures and on Mac OS Intel
      (both 32- and 64-bit architectures). A partial port for Windows
      Cygwin has been successful but has not yet been integrated
      and finalized.</p>
      <p>The current release handles logic programs, DCGs ( 
      <i>Definite Clause Grammars</i>), FTAGs ( 
      <i>Feature Tree Adjoining Grammars</i>), FTIGs ( 
      <i>Feature Tree Insertion Grammars</i>) and XRCGs ( 
      <i>Range Concatenation Grammars</i>with logic arguments).
      Several extensions have been added to most of these
      formalisms such as intersection, Kleene star, and interleave
      operators. Typed Feature Structures (TFS) as well as finite
      domains may be used for writing more compact and declarative
      grammars 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid50" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>.</p>
      <p>C libraries can be used from within 
      <span class="smallcap" align="left">DyALog</span>to import
      APIs ( 
      <tt>mysql</tt>, 
      <tt>libxml</tt>, 
      <tt>sqlite</tt>, ...).</p>
      <p><span class="smallcap" align="left">DyALog</span>is largely
      used within ALPAGE to build parsers but also derivative
      softwares, such as a compiler of Meta-Grammars (cf.  
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid46" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>). It has also been used for
      building a parser from a large coverage French TIG/TAG
      grammar derived from a Meta-Grammar. This parser has been
      used for the Parsing Evaluation campaign EASy, the two
      Passage campaigns (Dec. 2007 and Nov. 2009), cf.  
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid97" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>and 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid4" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid51" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, and on a very large amount of data
      (700 millions of words) for the SCRIBO action, cf.  
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid92" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>.</p>
      <p><span class="smallcap" align="left">DyALog</span>is used at
      LORIA (Nancy), University of Coruña (Spain), Institut Gaspard
      Monge (Univ. Marne La Vallée), University of Nice, and a few
      other users.</p>
      <p><span class="smallcap" align="left">DyALog</span>and other
      companion modules are available on INRIA GForge.</p>
    </subsection>
    <subsection id="uid46" level="1">
      <bodyTitle>Tools and resources for Meta-Grammars</bodyTitle>
      <participants>
        <person key="alpage-2009-idm402038308688">
          <firstname>Éric</firstname>
          <lastname>Villemonte de La Clergerie</lastname>
          <moreinfo>maintainer</moreinfo>
        </person>
      </participants>
      <moreinfo>
        <p><tt>mgcomp</tt>, 
        <span class="smallcap" align="left">MgTools</span>, and
        FRMG on INRIA GForge: 
        <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://mgkit.gforge.inria.fr/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
        <allowbreak/>mgkit. 
        <allowbreak/>gforge. 
        <allowbreak/>inria. 
        <allowbreak/>fr/ 
        <allowbreak/></ref></p>
      </moreinfo>
      <p><span class="smallcap" align="left">DyALog</span>(cf.  
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid45" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>) has been used to implement 
      <tt>mgcomp</tt>, a compiler of Meta-Grammar (cf.  
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid55" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>). Starting from an XML
      representation of a MG, 
      <tt>mgcomp</tt>produces an XML representation of its TAG
      expansion.</p>
      <p>The current version 
      <b>1.5.0</b>is freely available by FTP under an open source
      license. It is used within ALPAGE and (occasionally) at LORIA
      (Nancy) and at University of Pennsylvania.</p>
      <p>The current version adds the notion of namespace, to get
      more compact and less error-prone meta-grammars. It also
      provides other extensions of the standard notion of
      Meta-Grammar in order to generate very compact TAG grammars.
      These extensions include the notion of 
      <i>Guarded nodes</i>, i.e. nodes whose existence and
      non-existence depend on the truth value of a guard, and the
      use of the regular operators provided by 
      <span class="smallcap" align="left">DyALog</span>on nodes,
      namely disjunction, interleaving and Kleene star. The current
      release provides a dump/restore mechanism for faster
      compilations on incremental changes of a meta-grammar.</p>
      <p>The current version of 
      <tt>mgcomp</tt>has been used to compile a wide coverage
      Meta-Grammar FRMG (version 2.0.1) to get a grammar of around
      200 TAG trees 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid52" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. Without the use of guarded
      nodes and regular operators, this grammar would have more
      than several thousand trees and would be almost intractable.
      FRMG has been packaged and is freely available.</p>
      <p>To ease the design of meta-grammars, a set of tools has
      been implemented, mostly by Éric de La Clergerie, and
      collected in 
      <span class="smallcap" align="left">MgTools</span>(version 
      <b>2.2.2</b>). This package includes a converter from a
      compact format to an XML pivot format, an Emacs mode for the
      compact and XML formats, a graphical viewer interacting with
      Emacs and XSLT stylesheets to derive HTML views. A new
      version is under development to provide an even more compact
      syntax and some checking mechanisms to avoid frequent typo
      errors.</p>
      <p>The various tools on Metagrammars are available on INRIA
      GForge.</p>
    </subsection>
    <subsection id="uid47" level="1">
      <bodyTitle>The Bonzai PCFG-LA parser</bodyTitle>
      <participants>
        <person key="alpage-2008-idm542378770960">
          <firstname>Benoît</firstname>
          <lastname>Crabbé</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
        <person key="alpage-2008-idm542378777200">
          <firstname>Marie</firstname>
          <lastname>Candito</lastname>
        </person>
        <person key="alpage-2008-idm542378764240">
          <firstname>Pascal</firstname>
          <lastname>Denis</lastname>
        </person>
        <person key="alpage-2008-idm542378729584">
          <firstname>Djamé</firstname>
          <lastname>Seddah</lastname>
        </person>
      </participants>
      <moreinfo>
        <p>Web page:</p>
        <p noindent="true">
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://alpage.inria.fr/statgram/frdep/fr_stat_dep_parsing.html" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>alpage. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>statgram/ 
          <allowbreak/>frdep/ 
          <allowbreak/>fr_stat_dep_parsing. 
          <allowbreak/>html</ref>
        </p>
      </moreinfo>
      <p>Alpage has developed as support of the research papers 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid14" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid17" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid53" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid15" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>a statistical parser for French,
      named Bonzai, trained on the French Treebank. This parser
      provides both a phrase structure and a projective dependency
      structure specified in 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid54" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>as output. This parser operates
      sequentially: (1) it first outputs a phrase structure
      analysis of sentences reusing the Berkeley implementation of
      a PCFG-LA trained on French by Alpage; (2) it applies to the
      resulting phrase structure trees a process of conversion to
      dependency parses using a combination of heuristics and
      classifiers trained on the French treebank. The parser
      currently outputs several well known formats such as Penn
      treebank phrase structure trees, Xerox like triples and
      CONLL-like format for dependencies. The parser also comes
      with basic preprocessing facilities allowing to perform
      elementary sentence segmentation and word tokenisation,
      allowing in theory to process unrestricted text. However it
      is believed to perform better on newspaper-like text. The
      parser is available under a GPL license.</p>
    </subsection>
    <subsection id="uid48" level="1">
      <bodyTitle>Alpage's linguistic workbench, including 
      <span class="smallcap" align="left">Sx</span>Pipe</bodyTitle>
      <participants>
        <person key="atoll-2006-idm57727917280">
          <firstname>Benoît</firstname>
          <lastname>Sagot</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
        <person key="alpage-2009-idm402038280912">
          <firstname>Rosa</firstname>
          <lastname>Stern</lastname>
        </person>
        <person key="atoll-2006-idm57727947600">
          <firstname>Pierre</firstname>
          <lastname>Boullier</lastname>
        </person>
        <person key="alpage-2009-idm402038308688">
          <firstname>Éric</firstname>
          <lastname>Villemonte de La Clergerie</lastname>
        </person>
      </participants>
      <moreinfo>
        <p>See also the web page 
        <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://lingwb.gforge.inria.fr/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
        <allowbreak/>lingwb. 
        <allowbreak/>gforge. 
        <allowbreak/>inria. 
        <allowbreak/>fr/ 
        <allowbreak/></ref>.</p>
      </moreinfo>
      <p>Alpage's linguistic workbench is a set of packages for
      corpus processing and parsing. Among these packages, the 
      <span class="smallcap" align="left">Sx</span>Pipe package is
      of particular importance.</p>
      <p><span class="smallcap" align="left">Sx</span>Pipe, now in
      version 2 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid55" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>is a modular and customizable
      chain aimed to apply to raw corpora a cascade of surface
      processing steps. It is used</p>
      <simplelist>
        <li id="uid49">
          <p noindent="true">as a preliminary step before Alpage's
          parsers (FRMG, 
          <span class="smallcap" align="left">SxLfg</span>);</p>
        </li>
        <li id="uid50">
          <p noindent="true">for surface processing (named entities
          recognition, text normalization...).</p>
        </li>
      </simplelist>
      <p>Developed for French and for other languages, 
      <span class="smallcap" align="left">Sx</span>Pipe 2 includes,
      among others, various named entities recognition modules in
      raw text, a sentence segmenter and tokenizer, a spelling
      corrector and compound words recognizer, and an original
      context-free patterns recognizer, used by several specialized
      grammars (numbers, impersonal constructions,
      quotations...).</p>
    </subsection>
    <subsection id="uid51" level="1">
      <bodyTitle>MElt</bodyTitle>
      <participants>
        <person key="alpage-2008-idm542378764240">
          <firstname>Pascal</firstname>
          <lastname>Denis</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
        <person key="atoll-2006-idm57727917280">
          <firstname>Benoît</firstname>
          <lastname>Sagot</lastname>
        </person>
      </participants>
      <p>MElt is a part-of-speech tagger, trained for French (on
      the French TreeBank and coupled with the Le 
      <i>fff</i>) and English 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid56" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. It is state-of-the-art for
      French. It is distributed freely as a part of the Alpage
      linguistic workbench.</p>
    </subsection>
    <subsection id="uid52" level="1">
      <bodyTitle>The syntactic lexicon Le 
      <i>fff</i>and the Alexina framework</bodyTitle>
      <participants>
        <person key="atoll-2006-idm57727917280">
          <firstname>Benoît</firstname>
          <lastname>Sagot</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
        <person key="alpage-2008-idm542378767840">
          <firstname>Laurence</firstname>
          <lastname>Danlos</lastname>
        </person>
      </participants>
      <moreinfo>
        <p>See also the web page 
        <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://gforge.inria.fr/projects/alexina/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
        <allowbreak/>gforge. 
        <allowbreak/>inria. 
        <allowbreak/>fr/ 
        <allowbreak/>projects/ 
        <allowbreak/>alexina/ 
        <allowbreak/></ref>.</p>
      </moreinfo>
      <p>Alexina is Alpage's framework for the acquisition
      and modeling of morphological and syntactic lexical
      information. The first and most advanced lexical resource
      developed in this framework is the Le 
      <i>fff</i>, a morphological and syntactic lexicon for
      French.</p>
      <p>Historically, the Le 
      <i>fff</i> 1 was a freely available French morphological
      lexicon for verbs that has been automatically extracted from
      a very large corpus. Since version 2, the Le 
      <i>fff</i>covers all grammatical categories (not just verbs)
      and includes syntactic information (such as subcategorization
      frames); Alpage's tools, including Alpage's parsers, rely on
      the Le 
      <i>fff</i>. The version 3 of the Le 
      <i>fff</i>, which has been released in 2008, improves the
      linguistic relevance and the interoperability with other
      lexical models.</p>
      <p>Other Alexina lexicons are under development, in
      particular for Spanish (the Le 
      <i>ff</i>e), Polish, Slovak, English, Galician, Persian
      (PerLex, see 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid85" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>), Kurdish.</p>
    </subsection>
    <subsection id="uid53" level="1">
      <bodyTitle>System 
      <span class="smallcap" align="left">
      EasyRef</span></bodyTitle>
      <participants>
        <person key="alpage-2009-idm402038308688">
          <firstname>Éric</firstname>
          <lastname>Villemonte de La Clergerie</lastname>
          <moreinfo>maintainer</moreinfo>
        </person>
      </participants>
      <moreinfo>
        <p>PASSAGE action</p>
      </moreinfo>
      <p>A collaborative WEB service 
      <span class="smallcap" align="left">EasyRef</span>has been
      developed, in the context of ANR action Passage, to handle
      syntactically annotated corpora. 
      <span class="smallcap" align="left">EasyRef</span>may be used
      to view annotated corpora, in both EASY and PASSAGE formats.
      The annotations may be created and modified. Bug reports may
      be emitted. The annotations may be imported and exported. The
      system provides standard user right management. The interface
      has been designed with the objectives to be intuitive and to
      speed up editing.</p>
      <p><span class="smallcap" align="left">EasyRef</span>relies on
      a Model View Controller design, implemented with the Perl
      Catalyst framework. It exploits WEB 2.0 technologies (i.e.
      AJAX and JavaScript).</p>
      <p>Version 2 has been used by ELDA and LIMSI to annotate a
      new corpus of several thousand words for PASSAGE.</p>
      <p>A preliminary version 3 has been developed by
      François Guérin and revised by Éric de La Clergerie, relying
      on Berkeley DB XML to handle very large annotated corpora and
      to provide a complete query language expanded as XQuery
      expressions. 
      <span class="smallcap" align="left">EasyRef</span>is
      maintained under INRIA GForge.</p>
    </subsection>
  </logiciels>
  <resultats id="uid54">
    <bodyTitle>New Results</bodyTitle>
    <subsection id="uid55" level="1">
      <bodyTitle>Designing efficient parsers using Meta-Grammars
      and DyALog</bodyTitle>
      <participants>
        <person key="alpage-2009-idm402038308688">
          <firstname>Éric</firstname>
          <lastname>Villemonte de La Clergerie</lastname>
        </person>
      </participants>
      <glosslist>Glossary 
      <label>MG</label>
      <li><p><i>Meta-Grammars</i></p></li></glosslist>
      <p>Éric de La Clergerie has continued to improve the
      coverage, quality and efficiency of the French meta-grammar
      FRMG. This work is made progressively easier, using the
      various testing scripts developed in 2009 (confusion matrices
      for instance). A small but very practical shell ( 
      <span class="smallcap" align="left">frmg_shell</span>) has
      been written to ease the use of FRMG, in particular for
      testing sentences.</p>
      <p>Preliminary experiments have been tried to integrate, in
      the post-parsing disambiguation phase, some quantitative
      information provided by the knowledge acquisition experiments
      (cf.  
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid57" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>) about for instance the strength
      of a dependency through some preposition between a governor
      noun and a governee noun. Weights for several kinds of
      dependencies have been used, exploiting their frequency in a
      large corpus but also the semantic proximity between the
      governors or between the governees, as computed by the
      knowledge acquisition experiments. However, while real, the
      benefits of these weights for a better disambiguation remain
      very small. Further experiments have to be tried to
      investigate the situation, with maybe a better calibration of
      the imported weights wrt the various weights manually
      attached to the disambiguation rules.</p>
    </subsection>
    <subsection id="uid56" level="1">
      <bodyTitle>Large scale corpus processing</bodyTitle>
      <participants>
        <person key="alpage-2009-idm402038308688">
          <firstname>Éric</firstname>
          <lastname>Villemonte de La Clergerie</lastname>
        </person>
      </participants>
      <p>In the context of the PASSAGE and SCRIBO actions, we have
      continued to explore the use of distributed computing for
      processing of very large corpora, largely using
      GRID 5000 and a local cluster at INRIA Rocquencourt. For
      the SCRIBO action (cf.  
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid92" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>), GRID 5000 was in
      particular used to parse with FRMG a 700 million words corpus
      (including Wikipedia, Wikisource, and 30 months of AFP news).
      Several problems were again identified and corrected to get
      more and more robust treatments.</p>
      <p>Distributed computing is also used on local clusters to
      collect and count patterns in the output of FRMG, using an
      adapted version of the 
      <i>map-reduce</i> algorithm. These patterns with counts are
      then used as input for knowledge acquisition (cf.  
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid57" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>).</p>
    </subsection>
    <subsection id="uid57" level="1">
      <bodyTitle>Knowledge acquisition and ontologies</bodyTitle>
      <participants>
        <person key="alpage-2009-idm402038308688">
          <firstname>Éric</firstname>
          <lastname>Villemonte de La Clergerie</lastname>
        </person>
        <person key="atoll-2006-idm57727917280">
          <firstname>Benoît</firstname>
          <lastname>Sagot</lastname>
        </person>
        <person key="alpage-2009-idm402038280912">
          <firstname>Rosa</firstname>
          <lastname>Stern</lastname>
        </person>
        <person key="alpage-2010-idm152476259776">
          <firstname>Kata</firstname>
          <lastname>Gábor</lastname>
        </person>
        <person key="PASUSERID">
          <firstname>Tim</firstname>
          <lastname>van de Cruys</lastname>
        </person>
        <person key="alpage-2010-idm152476230416">
          <firstname>Yayoi</firstname>
          <lastname>Nakamura-Delloye</lastname>
        </person>
        <person key="alpage-2010-idm152476291760">
          <firstname>Marianna</firstname>
          <lastname>Apidianaki</lastname>
        </person>
      </participants>
      <p>The parsing results provided by FRMG over a very large
      corpus covering various styles and domains (30 months of AFP
      news [2007, 2009, and 2010], Wikipedia, Wikisource, Est
      Républicain, EuroParlement, JRC) have been used as input for
      the acquisition of semantic knowledge. This work was part of
      the SCRIBO action (cf.  
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid92" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>), in order to explore the
      techniques and methodologies that may be used to enrich a
      lexicalized seed ontology in a supervised way, i.e. using
      some human validation at some point.</p>
      <p>The guiding principle for most of the experiments that
      were tried is the Harris distributional hypothesis, stating
      that semantically close words occur in similar contexts,
      syntactic contexts in our case.</p>
      <p>The experiments may be classified around 2 main
      directions, those trying to identify and organize concepts,
      and those trying to identify and organize classes of
      “events”, an event class being (often) used to establish some
      relationship between named entities (for instance, to denote
      that “someone” becomes president of “something”). These event
      classes may properly denote events, but more generally, may
      denote the attachment of a property to an entity.</p>
      <subsection id="uid58" level="2">
        <bodyTitle>Terminology extraction</bodyTitle>
        <p>A first experiment about concepts, done by Éric de La
        Clergerie, dealt with terminology extraction, using
        frequency information to select sequences of Passage chunks
        that follow some patterns (essentially, nominal phrases
        possibly with adjectives, completed by prepositional
        phrases). The selection of the candidate terms was refined
        using mutual information and a notion of autonomy (a
        candidate term should not always occur within prepositional
        phrases or be modified by prepositional phrases). A
        preliminary detection of variants was used to group close
        terms (at the form level) and to discard some artifacts
        that have many variants (such as some date or interval
        constructions). Two ranked lists of terms were extracted on
        the AFP corpus and on the whole corpus. The AFP list was
        communicated to 
        <i>Lingua et Machina</i>, an INRIA startup, to be loaded in
        their 
        <span class="smallcap" align="left">
        LIBELLEX</span> platform, in order to start some human
        validation. This experiment was the starting point for a
        collaboration with this company about the managing of
        lexical resources.</p>
        <p>At this stage, this terminology extraction process is
        not as sophisticated as some existing software such as
        Acabit and should only be seen as a starting point. More
        elements of information could be used, such as derivational
        morphology (to group variants) and coordinations (which
        were discarded). The exploitation of semantic similarity
        between words (as provided by the other experiments
        conducted below) could also be used to group variants.</p>
      </subsection>
      <subsection id="uid59" level="2">
        <bodyTitle>Building word network</bodyTitle>
        <p>Another experiment led by Éric de La Clergerie was to
        regroup words by semantic similarity, exploiting as much as
        possible the Harris distributional hypothesis. Having
        collected the frequencies of dependency triples
        (governor, relation, governee) on lemmas, such as ( 
        <i>assoir_v</i>, 
        <i>sur_prep</i>, 
        <i>chaise_nc</i>), a graph was built connecting the words
        (say 
        <i>assoir</i>) with their syntactic context (say 
        <i>sur_chaise</i>), the weight of an edge being derived
        from the frequency of the underlying dependency triple.
        Using ideas from the Markov Clustering (MCL) algorithm, an
        iterative algorithm was designed and implemented in Perl to
        identify pairs of words (and dually pairs of contexts) that
        are related by a dense set of relatively short paths. One
        of the interests of the algorithm is to provide a set of
        weighted contexts explaining the (semantic) proximity of
        two words. Another particularity of the algorithm is the
        strong duality between words and contexts, the algorithm
        being able to group words but also contexts. It also takes
        into account the fact that the syntactic contexts have an
        internal structure, including in particular a word (if we
        assume that 
        <span class="math"><hi rend="it">X</hi></span> and
        <span class="math"><hi rend="it">Y</hi></span> are close, then given some relation
        <span class="math"><hi rend="it">r</hi></span>, the contexts
        <span class="math"><hi rend="it">r</hi>_<hi rend="it">X</hi></span> and
        <span class="math"><hi rend="it">r</hi>_<hi rend="it">Y</hi></span> are also close, and
        conversely).</p>
        <p>Several extensions of the algorithm have been
        implemented. Random Indexing (RI) was for instance used to
        complement MCL, with the intuition that RI provides a way
        to quickly compare the similarity of large context sets,
        whereas MCL focuses on the specific contexts that tend to group
        two words (and may miss some global differences). The
        presence of coordinations between two words was concretized
        by a bonus used to strengthen their proximity. Similarly,
        proximity was also strengthened by morphological or
        spelling closeness. Finally, a bonus may also be added for
        pairs of similar words found in an external wordnet-like
        seed resource (we tried with the French WordNet and with
        Wolf, an acquired French wordnet, but the usefulness of
        such resources was finally not obvious).</p>
        <p>Running 10 to 20 iterations on the dependencies
        extracted from the whole 700 million word parsed corpus (around
        2 days, using around Go RAM), we get information about
        around 22000 words for around 44000 pairs of words. For
        each pair of words, the output specifies how close they are (in a
        non-symmetrical way) and which syntactic contexts are the
        most specific to explain their proximity.</p>
        <p>The amount of data makes it difficult to evaluate the
        quality of these pairs. Several evaluation experiments were
        tried by comparing with wordnet-like resources (French
        wordnet and WOLF) but the results remain difficult to
        interpret. Another option was to visualize and browse the
        pairs as a connecting graph, using 
        <span class="smallcap" align="left">Tulip</span>, a
        software for large graphs. Browsing the graph, while hiding
        many important pieces of information (the degree of
        similarity, the explaining contexts) was nevertheless very
        useful to assess the interest of such a word network (and
        of the underlying clustering algorithm). Browsing the graph
        was also useful to point out some characteristic
        topological structures, for instance bush-like structures
        generally characterize strong clusters (such as all month
        names).</p>
        <p>These topological properties should guide further
        developments to get a better detection of the strongest
        word clusters, but also to get a better detection of
        polysemous words. An important evolution would also be to
        shift from words to terms (resulting from the previous
        extraction).</p>
      </subsection>
      <subsection id="uid60" level="2">
        <bodyTitle>Tensor based clustering</bodyTitle>
        <p>Starting from the same material (namely the dependencies
        with their frequencies), Tim van de Cruys has tried other
        techniques for word clustering. More precisely, he used a
        matrix-based approach using tensors and their non-negative
        factorization to identify the dimensions that cluster
        words. The base clusters were then used to build a
        hierarchical clustering. An advantage of the tensors over
        matrices is also the possibility to add more axes, for
        instance to cluster words along the syntactic axis given by
        the dependencies but also along a thematic axis given by the
        word occurring in a document or in the keyword field of a
        document (such as an AFP news).</p>
      </subsection>
      <subsection id="uid61" level="2">
        <bodyTitle>Cluster labeling</bodyTitle>
        <p>A second step in Tim van de Cruys' work was to establish
        ontological relationships between concepts, for instance to
        establish the hyperonymy (IS-A) relation between two
        concepts. This work was partially achieved by being able to
        assign labels to word clusters. A word cluster of
        synonymous words may be seen as denoting a concept and the
        label may be seen as the hyperonym concept. Cluster
        labeling was conducted by extracting and analyzing the
        syntactic content of the first meaningful sentence of
        Wikipedia pages. The first sentence of the page with title
        X usually mentions the 
        <i>genus</i> of X. This genus, found (with variations) for
        several elements of a cluster, may be used as a label. It is
        even often possible to assign a term (rather than a single
        word). In practice, the labels are not always assigned to
        clusters of synonymous words but rather to clusters of related
        words, such as
        <i>navire de guerre</i> (<i>warship</i>),
        <i>élément chimique</i> (<i>chemical element</i>) or related named entities such as
        <i>chanteur français</i> (<i>French singer</i>).</p>
      </subsection>
      <subsection id="uid62" level="2">
        <bodyTitle>Acquisition of event structures</bodyTitle>
        <p>Kata Gábor worked on the acquisition of event classes
        (or event structures) characterized by verb classes or verb
        nominalizations. Semantic verb classes (Gross 1975, Levin
        1993, Kipper-Schuler 2005) generalise over a set of
        syntactic and semantic properties: they participate in the
        same syntactic alternations and share one or more meaning
        components. Such classifications can be useful in a variety
        of NLP tasks, including semantic role labeling (Swier &amp;
        Stevenson 2004) and information extraction. Semantic
        classes can be obtained automatically from corpora (Schulte
        im Walde 2006, O Seaghdha &amp; Copestake 2008, Sun &amp;
        Korhonen 2009, Messiant et al. 2010), in compliance with
        the distributional hypothesis which states that
        semantically related words tend to occur in similar
        contexts.</p>
        <p>Kata Gábor applied an unsupervised learning method to
        obtain verb clusters from corpora, using a set of syntactic
        and semantic features (complement structure and the
        semantic profile of the arguments which fill the complement
        positions).</p>
        <p>To overcome the sparse data problem, she expanded the
        verbal data by distributional information about
        corresponding deverbal nouns. In order to do so, she
        developed another algorithm to detect event nominalisations
        and to map nominal complement structure to that of finite
        verbs. The detection of event nominalisations is based on
        three measures:</p>
        <orderedlist>
          <li id="uid63">
            <p noindent="true">distributional similarity;</p>
          </li>
          <li id="uid64">
            <p noindent="true">morphological similarity;</p>
          </li>
          <li id="uid65">
            <p noindent="true">the so-called 'event indicator'
            score which shows how likely it is that the noun refers
            to an event.</p>
          </li>
        </orderedlist>
        <p>The intuition behind the notion of event indicator is
        that event nominalisations are characterized by a high
        proportion of occurrences in verb-like dependent positions
        (where a clause could also occur). The event indicator is
        obtained from corpus data by quantifying the proportion of
        syntactic heads having the noun as a dependent in a
        position where infinitives are also accepted (e.g.
        "<i>accepter de restreindre</i>" -
        "<i>accepter la restriction</i>").</p>
      </subsection>
      <subsection id="uid66" level="2">
        <bodyTitle>Dependency paths between named
        entities</bodyTitle>
        <p>Yayoi Nakamura-Delloye worked on the identification of
        dependency-based extraction patterns denoting relations
        between named entities, for instance the membership
        relation between a person and an organization. The idea was
        to explore the regularities in the SCRIBO corpus, parsed
        with FRMG. Two extraction methods have been tried, a
        semi-supervised one and a fully non-supervised one. The
        recurring syntactic dependency paths are then abstracted
        into patterns for a given relation, the motivation being to
        use the patterns to extract new occurrences of the relation
        in other corpora during information extraction tasks.</p>
      </subsection>
      <subsection id="uid67" level="2">
        <bodyTitle>Word-sense disambiguation and
        integration</bodyTitle>
        <p>Marianna Apidianaki recently joined the Alpage team, in
        September 2010. Since then, she has been working on the
        automatic acquisition of lexical semantic knowledge from
        text corpora for the development of resources in the SCRIBO
        project. More precisely, she has pursued her previous
        research on exploiting parallel corpora for unsupervised
        word sense induction and disambiguation for enriching the
        ontology used in the SCRIBO project.</p>
        <p>Furthermore, she worked on the integration into existing
        lexical semantic resources of the results of monolingual
        semantic analysis methods (based on clustering techniques)
        carried out by the other members of ALPAGE involved in
        SCRIBO.</p>
      </subsection>
      <subsection id="uid68" level="2">
        <bodyTitle>Validation methodologies</bodyTitle>
        <p>The above mentioned experiments return ranked lists of
        candidates (terms, word pairs, clusters, verb classes,
        verb/noun pairs, ...) that need to be validated at some
        point before being used to enrich some reference lexical
        resource. More precisely, in the context of SCRIBO, the
        idea is that a candidate should be phrased as an enrichment
        of the seed ontology (for instance the addition of a new
        concept through an IS-A ontological relation with an
        existing concept). To ease the validation, a ticket should
        be attached to each candidate, describing the scope of the
        candidate, providing explaining features (such as the
        syntactic contexts used to regroup a pair of words) and
        illustrative sentences (from the SCRIBO corpus). This
        notion of tickets has been formalized and the acquisition
        algorithms are or will be modified to return such tickets.
        Already, the notion of tickets has guided the development
        of prototype Web validation interfaces (for terms, cluster
        labels, and noun/verb pairs).</p>
      </subsection>
    </subsection>
    <subsection id="uid69" level="1">
      <bodyTitle>Automatic construction of distributional thesauri
      for French</bodyTitle>
      <participants>
        <person key="alpage-2009-idm402038316144">
          <firstname>Enrique</firstname>
          <lastname>Henestroza Anguiano</lastname>
        </person>
        <person key="alpage-2008-idm542378764240">
          <firstname>Pascal</firstname>
          <lastname>Denis</lastname>
        </person>
        <person key="alpage-2008-idm542378777200">
          <firstname>Marie</firstname>
          <lastname>Candito</lastname>
        </person>
      </participants>
      <p>This work involves the automatic construction of
      distributional thesauri for French, with an eye toward use in
      statistical parsing. The distributional hypothesis states
      that words occurring in the same contexts tend to have
      similar meanings, as posited by Harris (1954). Additionally,
      distributional similarity based on syntactic contexts
      naturally indicates shared selectional preference, which may
      be useful for statistical parsing. Finally, distributional
      lexical resources are appealing because they can be
      constructed automatically from raw text corpora using
      unsupervised approaches, avoiding the problem of limited
      lexical coverage found in hand-built resources.</p>
      <subsection id="uid70" level="2">
        <bodyTitle>Thesaurus creation and evaluation</bodyTitle>
        <p>Following primarily from the distributional similarity
        work of Lin (1998) and Curran (2004), we use a raw corpus
        of text to extract context relations consisting of a
        primary word, a relation, and a secondary word. We chose to
        use the L'Est Républicain corpus, a 125 million word
        journalistic corpus, freely available at CNRTL ( 
        <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://www.cnrtl.fr/corpus/estrepublicain" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
        <allowbreak/>www. 
        <allowbreak/>cnrtl. 
        <allowbreak/>fr/ 
        <allowbreak/>corpus/ 
        <allowbreak/>estrepublicain</ref>). Extracted context
        relation frequency counts are weighted using a function
        such as relative frequency or t-test, then similarities
        between pairs of primary words are calculated using a
        measure function such as Jaccard or cosine. Testing
        different combinations of weight and measure functions, we
        evaluated each resulting thesaurus using average cosine
        similarity against synsets from the WOLF and the French
        EuroWordNet, two existing wordnet resources for French. Our
        results indicate that the best approach for constructing
        distributional thesauri uses both linear bigram and
        syntactic dependency context relations, the t-test weight
        function, and the Jaccard similarity function.</p>
      </subsection>
      <subsection id="uid71" level="2">
        <bodyTitle>Thesaurus and software availability</bodyTitle>
        <p>A major motivation behind our work is to make freely
        available a wide-coverage distributional thesaurus for
        French, as well as software for the construction of
        distributional thesauri using different corpora, settings,
        or languages. This effort has been named FreDist, with an
        associated project webpage ( 
        <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://alpage.inria.fr/~henestro/fredist.html" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
        <allowbreak/>alpage. 
        <allowbreak/>inria. 
        <allowbreak/>fr/ 
        <allowbreak/>~henestro/ 
        <allowbreak/>fredist. 
        <allowbreak/>html</ref>). The initial release includes a
        distributional thesaurus for French, and software is
        currently being consolidated and packaged for inclusion in
        the next release. The project webpage also includes a
        technical report detailing this work.</p>
      </subsection>
    </subsection>
    <subsection id="uid72" level="1">
      <bodyTitle>Improving the lexical coverage of statistical
      parsers</bodyTitle>
      <participants>
        <person key="alpage-2008-idm542378777200">
          <firstname>Marie</firstname>
          <lastname>Candito</lastname>
        </person>
        <person key="alpage-2009-idm402038316144">
          <firstname>Enrique</firstname>
          <lastname>Henestroza Anguiano</lastname>
        </person>
        <person key="alpage-2008-idm542378729584">
          <firstname>Djamé</firstname>
          <lastname>Seddah</lastname>
        </person>
      </participants>
      <p>Probabilistic parsers are trained on treebanks, namely
      syntactically annotated sentences, and this training allows
      them to capture syntactic regularities. Yet, though lexical
      information is known to play a crucial role in determining
      the syntactic structure of a sentence, many lexical phenomena
      cannot be learned simply by training on a treebank of a few
      thousands of sentences (the French treebank we use contains
      about 12000 sentences). First, because treebanks cover only a
      small part of the French vocabulary. Second, because lexical
      data is very sparse: a corpus contains a few very frequent
      words, and a lot of rare words. Compared to English, this is
      even truer for French, or more generally inflected languages:
      morphological marks for gender, number, tense, etc.
      drastically augment the vocabulary size.</p>
      <p>To cope with this inherent limitation of statistical
      parsing techniques, we have investigated the use of word
      clusters instead of words as input to the parser. Our work
      was inspired by [Koo et al. 08], who have shown that word
      clusters obtained with unsupervised techniques could improve
      statistical dependency parsing, when used as features for
      classifiers determining the weights of dependency arcs. We
      tried in 2009 to use word clusters within the framework of
      generative statistical parsing [Candito and Crabbé, 09]. We
      continued this investigation in 2010: we tested the impact on
      parsing performance of two morphological clustering
      techniques on both lexicalized models 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid57" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> and PCFG-LA models
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid58" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>: the "desinflection" process
      proposed in 2009 (a lexicon-based morphological clustering),
      and "lemmatisation" 
      <footnote id="uid73" id-text="4">Conducted by a data driven
      lemmatizer 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid59" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> which we adapted for French
      during a visit to Saarbrücken in 2009.</footnote>, which is
      the more classic technique that groups inflected word forms
      into part-of-speech+lemma pairs. Though with this second
      technique the oracle obtained with gold part-of-speech and
      gold lemmas is higher, the results obtained in a realistic
      setting (predicted part-of-speech and lemmas) are comparable
      to the rougher desinflection method. We have also analyzed
      the improvement in performance for both techniques with
      respect to word frequency. We found that replacing word forms
      with clusters improves attachment performance for words that
      are originally either unknown or low-frequency, since these
      words are replaced by cluster symbols that tend to have
      higher frequencies. Furthermore, clustering also helps
      significantly for medium to high frequency words, suggesting
      that training on word clusters leads to better probability
      estimates for these words.</p>
      <p noindent="true">It should be noted that this work serves as
      the basis for a grant proposal to the FP7 ICT-Call, named
      <i>parse4real</i>, jointly made by Dublin City University,
      Alpage, Uppsala University and other European leaders in
      parsing morphologically-rich languages, for which augmenting
      the lexical coverage of statistical parsers is of crucial
      importance. Djamé Seddah is Alpage's leader for that
      proposal, in which Marie Candito, Éric de La Clergerie and
      Benoît Sagot also participate.</p>
    </subsection>
    <subsection id="uid74" level="1">
      <bodyTitle>Dependency parsing</bodyTitle>
      <participants>
        <person key="alpage-2008-idm542378777200">
          <firstname>Marie</firstname>
          <lastname>Candito</lastname>
        </person>
        <person key="alpage-2008-idm542378770960">
          <firstname>Benoît</firstname>
          <lastname>Crabbé</lastname>
        </person>
        <person key="alpage-2008-idm542378764240">
          <firstname>Pascal</firstname>
          <lastname>Denis</lastname>
        </person>
        <person key="alpage-2009-idm402038316144">
          <firstname>Enrique</firstname>
          <lastname>Henestroza Anguiano</lastname>
        </person>
      </participants>
      <p>Dependency trees are often preferred to syntagmatic trees
      for many NLP tasks, such as information extraction, question
      answering, lexical acquisition. We started in 2008, and
      continued in 2009, to work on the conversion of the
      syntagmatic trees of the French treebank into surface
      dependency trees. We have now a stabilized version of a
      dependency treebank : the French treebank converted to
      dependencies 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid54" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>.</p>
      <p>The constituent-to-dependency conversion procedure can
      also be applied to syntagmatic trees as output by a parser
      trained on the syntagmatic treebank. Hence, we have various
      ways to obtain a parser outputting dependency trees: (i)
      training a parser on syntagmatic trees, and converting the
      output of this parser into dependencies; and (ii) directly
      using existing algorithms to train a dependency parser on the
      treebank converted to dependencies. We have performed a
      comparison of the two approaches (i) and (ii). Approach (i)
      is tested with an architecture where a parser is trained on
      the French treebank (using Petrov's algorithm), and output
      trees from this parser are converted to dependencies.
      Approach (ii) is tested with two dependency parser training
      algorithms : MST [McDonald and Pereira, 06] and MaltParser
      [Nivre et al., 06]. First bare results 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid54" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> showed that directly training a
      dependency parser with the MST algorithm [McDonald and
      Pereira, 06] outperforms the architecture based on Petrov's
      algorithm. We then performed a more sophisticated benchmark
      between the three architectures (Petrov, MSTparser,
      MaltParser), with the integration of morphological features
      (lemmas, gender, number...) and unsupervised word clustering
      features (cf. results "Improving the lexical coverage of
      statistical parsers"). We found 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid60" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> that with this additional
      information, the differences between parsing architectures
      are generally small, and there is no consistent trend
      favoring either constituency-based or dependency-based
      methods. The best performance is achieved using MSTParser,
      enhanced with predicted part-of-speech tags, lemmas,
      morphological features, and unsupervised clusters of word
      forms. MaltParser achieves slightly lower labeled accuracy,
      but is probably the best option if speed is crucial.</p>
    </subsection>
    <subsection id="uid75" level="1">
      <bodyTitle>New results on Mildly-Context Sensitive
      formalisms</bodyTitle>
      <participants>
        <person key="atoll-2006-idm57727917280">
          <firstname>Benoît</firstname>
          <lastname>Sagot</lastname>
        </person>
        <person key="alpage-2008-idm542378729584">
          <firstname>Djamé</firstname>
          <lastname>Seddah</lastname>
        </person>
      </participants>
      <p>Understanding the properties of formal languages more
      sophisticated than Context-Free Grammars has been a research
      topic for several Alpage members for a long time. Indeed,
      although probabilistic models based on simple CFG backbones or
      TAG-based systems are quite successful for parsing tasks,
      they fail to model correctly some linguistic constructions
      that are complex but not necessarily rare. So-called Mildly
      Context-Sensitive formalisms are a particular class of
      grammars that have reasonable expressive power (strictly
      higher than TAGs, for example, but strictly less than Range
      Concatenation Grammars that cover PTIME) while still having a
      reasonable parsing complexity (polynomial). Studying these
      formalisms is therefore a very important research track.</p>
      <p>Following up on work started back in 2006 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid61" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, Djamé Seddah and Benoît Sagot
      have introduced a new extension of the so-called
      Multi-Component TAGs, and more precisely an extension of the
      MCTAGs with Local Shared Derivation introduced in
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid62" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> which can handle non local
      elliptic coordinations. Based on a model for control verbs
      that makes use of so-called ghost trees, one can show that
      this extension leads to an analysis of argument cluster
      coordinations that provides an adequate derivation graph.
      This is made possible by an original interpretation of the
      MCTAG derivation tree mixing the views of 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid63" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> and 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid64" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>.</p>
      <p>MCTAGs and some of their variants are equivalent to a
      well-studied MCS formalism, that of Linear Context-Free
      Rewriting Systems or LCFRSs 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid65" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. Having NLP applications and
      language modeling in mind, studying the formal properties of
      LCFRSs is relevant. In collaboration with Giorgio Satta, from
      the University of Padova (Italy), Benoît Sagot has finalized
      and presented at ACL 2010 an optimal algorithm for reducing
      the rank of a sub-class of LCFRSs (namely those with fan-out
      2) 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid66" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>.</p>
    </subsection>
    <subsection id="uid76" level="1">
      <bodyTitle>Temporal information processing</bodyTitle>
      <participants>
        <person key="alpage-2008-idm542378786864">
          <firstname>André</firstname>
          <lastname>Bittar</lastname>
        </person>
        <person key="alpage-2008-idm542378764240">
          <firstname>Pascal</firstname>
          <lastname>Denis</lastname>
        </person>
        <person key="alpage-2009-idm402038296432">
          <firstname>Philippe</firstname>
          <lastname>Muller</lastname>
        </person>
      </participants>
      <p>An important task in temporal processing is to recover the
      chronology of the events that are described in a text. Most
      recent work has focused on learning temporal relations (e.g.,
      precedence, inclusion) between given events in a text, while
      rarely ensuring that these separate pieces of information
      remain consistent. The target representations also differ,
      according to the distinctions they make or the inferences
      they allow.</p>
      <p>In 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid67" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we investigate the impact of
      using different temporal algebras for learning temporal
      relations between events. Specifically, we compare three
      interval-based algebras: Allen (1983) algebra, Bruce (1972)
      algebra, and the algebra derived from the TempEval-07
      campaign. These algebras encode different granularities of
      relations and have different inferential properties. They in
      turn behave differently when used to enforce global
      consistency constraints on the building of a temporal
      representation. Through various experiments conducted on the
      English TimeBank/AQUAINT corpus, we show that although
      TempEval's smaller relation set leads to the best
      classification accuracy performance, it is too vague to be
      used for enforcing consistency. By contrast, the other two
      relation sets are similarly harder to learn, but more useful
      when global consistency is important. Overall, the Bruce
      algebra is shown to give the best compromise between
      learnability and expressive power. In forthcoming work, we
      consider the use of yet another temporal algebra, namely
      point algebra, in the context of a global inference problem
      to address the problem of predicting temporal structure for
      texts.</p>
      <p>This first work has been performed on English, for until
      recently there was no available TimeBank for French. One of
      the contributions of André Bittar's PhD dissertation
      (supervised by Laurence Danlos and co-supervised by Pascal
      Denis), which was successfully defended this year, was to
      develop such a resource and to make it publicly available to
      the community. The current version of the French TimeBank
      consists of 109 journalistic texts (16,208 tokens) from 7
      different sub-genres which have been annotated according to
      the ISO-TimeML standard. Bittar's dissertation also suggests
      a number of improvements to the ISO-TimeML schema in order to
      account for linguistic phenomena which apply across
      languages, as well as adaptations necessary for the
      processing of French texts. The French TimeBank is soon to be
      made available (via the INRIA Forge) to the wider scientific
      community and will provide a useful basis for studying the
      linguistic expression of temporal phenomena in French, as
      well as providing data for evaluating automatic temporal
      annotation systems.</p>
    </subsection>
    <subsection id="uid77" level="1">
      <bodyTitle>Discourse processing</bodyTitle>
      <participants>
        <person key="alpage-2008-idm542378767840">
          <firstname>Laurence</firstname>
          <lastname>Danlos</lastname>
        </person>
        <person key="alpage-2008-idm542378764240">
          <firstname>Pascal</firstname>
          <lastname>Denis</lastname>
        </person>
        <person key="alpage-2009-idm402038296432">
          <firstname>Philippe</firstname>
          <lastname>Muller</lastname>
        </person>
        <person key="alpage-2009-idm402038290176">
          <firstname>Charlotte</firstname>
          <lastname>Roze</lastname>
        </person>
      </participants>
      <p>Discourse interpretation is often automated in two steps:
      a 
      <i>segmentation</i> step where discourse units (DU) are
      extracted, and a 
      <i>parsing</i> step where these DUs are related to derive a
      discourse structure. The relations are labelled with
      functions reflecting the underlying intention of the producer
      of the discourse.</p>
      <p>Within that perspective, one can proceed bottom-up, and
      isolate the elementary discourse units (EDU) before building
      a structure made of groupings of such EDUs. Alternatively, a
      text can be segmented in a top-down fashion, separating
      topically coherent parts (this is called 
      <i>text segmentation</i> or 
      <i>text tiling</i>) before applying the more fine-grained
      approach mentioned before. Ideally the two methods complement
      each other, although this is rarely done in practice.</p>
      <subsection id="uid78" level="2">
        <bodyTitle>Discourse Unit Segmentation</bodyTitle>
        <p>A contribution to the bottom-up approach was made in 
        <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid68" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, with an additional constraint
        on the EDUs. Previous research on discourse segmentation
        has relied on the assumption that elementary discourse
        units (EDUs) in a document always form a linear sequence.
        Unfortunately, this assumption turns out to be too strong,
        for some theories of discourse allow for nested discourse
        units. To address this problem, we developed a system using
        standard multi-class classification techniques making use
        of a regularized maximum entropy model, combined with a
        simple repairing heuristic that enforces global coherence.
        Our system was developed and evaluated on the first round
        of annotations provided by the French Annodis project (an
        ongoing effort to create a discourse bank for French) with
        an encouraging performance (an F-score of 73% for finding
        EDUs) on a small set of about 50 documents.</p>
        <p>Another approach which is currently explored consists in
        examining whether discourse unit segmentation can be
        automatically obtained from the output of a deep syntactic
        analyzer, i.e. a parser which produces analyses close to
        semantic dependency trees, like the parser FRMG developed
        by E. de La Clergerie in the formalism of Tree Adjoining
        Grammar 
        <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid51" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. This approach requires
        linguistic insights before being tested on real
        corpora.</p>
      </subsection>
      <subsection id="uid79" level="2">
        <bodyTitle>Text Segmentation</bodyTitle>
        <p>From the other end of the scale, we have tried to
        contribute to a better definition of the requirements of
        the text segmentation (TS) task 
        <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid69" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, by stressing the need for
        taking into account the types of texts that can be
        appropriately considered. Our hypothesis is that while TS
        is indeed relevant to analyze texts with a thematic
        organization, this task is ill-fitted to deal with other
        modes of text organization (temporal, rhetorical, etc.). By
        comparing the performance of a TS system on two corpora,
        with either a "strong" or a "weak" thematic organization,
        we show that TS is sensitive to text types.</p>
      </subsection>
      <subsection id="uid80" level="2">
        <bodyTitle>Lexical Resource for Discourse
        Processing</bodyTitle>
        <p>The intentions of the producer of a discourse are often
        expressed by discourse connectives (or discourse markers):
        they explicitly signal that a relation is holding between
        two discourse units. We have focused on these linguistic
        cues, and have manually built a lexicon of discourse
        connectives for French, named 
        <span class="smallcap" align="left">LEXCONN</span> and
        described in 
        <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid70" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. The lexicon contains 330
        connectives, collected with their syntactic category
        (conjunction, adverbial, preposition) and the discourse
        relation(s) they express. We are now improving 
        <span class="smallcap" align="left">LEXCONN</span> by adding
        some information about the position(s) that can be occupied
        by the markers in a syntactic clause. Indeed, some
        discourse markers (especially adverbial ones) are
        ambiguous: they do not have a discourse function in all the
        positions in which they can occur.</p>
        <p>This lexicon is used in various tasks: it provides
        automatically annotated data for discourse parsing, and
        makes it possible to extract specific discourse structures for
        linguistic empirical studies.</p>
      </subsection>
      <subsection id="uid81" level="2">
        <bodyTitle>Determining Equivalent Discourse
        Structures</bodyTitle>
        <p>Two tasks are crucial for the development of discourse
        parsing systems: the creation of gold-standard annotations,
        and the evaluation of annotations produced by discourse
        parsers. These two tasks require the development of metrics
        for accurately comparing distinct annotations of the same
        text(s); this involves in particular determining the
        conditions under which discourse structures are equivalent.
        While discourse theories provide some indication as to how
        to compare different discourse structures for the same
        text, they haven't studied this issue to its full extent.
        We try to investigate this question by studying discourse
        structures extracted using 
        <span class="smallcap" align="left">LEXCONN</span>. In our
        study, we examine the possibility of deducing an annotation
        from another, assuming that an annotation can contain
        implicit information.</p>
        <p>Given distinct discourse annotations of the same text,
        composed of relations between text segments, our goal is to
        calculate, using deduction rules about relations, the 
        <i>discourse closure</i> of these annotations. In effect,
        this allows us to compare these annotations by considering
        all the implicit information (relations) they contain. Our
        overall goal is to build a discourse relations algebra, as
        has been done by Allen (1983) for temporal relations. At
        least two types of rules seem necessary. Considering a
        discourse containing three adjacent segments 
        <span class="math"><img width="12" height="12" align="bottom" border="0" src="../../images/img_alpha.png" alt="$ \alpha$"/></span>, 
        <span class="math"><img width="12" height="26" align="middle" border="0" src="../../images/img_beta.png" alt="$ \beta$"/></span>, and 
        <span class="math"><img width="11" height="24" align="middle" border="0" src="../../images/img_gamma.png" alt="$ \gamma$"/></span>, either we know the relations 
        <span class="math"><hi rend="it">R</hi><sub><hi rend="it">x</hi></sub>( 
        <img width="12" height="12" align="bottom" border="0" src="../../images/img_alpha.png" alt="$ \alpha$"/>, 
        <img width="12" height="26" align="middle" border="0" src="../../images/img_beta.png" alt="$ \beta$"/>)</span>and 
        <span class="math"><hi rend="it">R</hi><sub><hi rend="it">y</hi></sub>( 
        <img width="12" height="26" align="middle" border="0" src="../../images/img_beta.png" alt="$ \beta$"/>, 
        <img width="11" height="24" align="middle" border="0" src="../../images/img_gamma.png" alt="$ \gamma$"/>)</span>, and try to deduce the discourse
        relation 
        <span class="math"><hi rend="it">R</hi><sub><hi rend="it">z</hi></sub></span>holding between 
        <span class="math"><img width="12" height="12" align="bottom" border="0" src="../../images/img_alpha.png" alt="$ \alpha$"/></span>and 
        <span class="math"><img width="11" height="24" align="middle" border="0" src="../../images/img_gamma.png" alt="$ \gamma$"/></span>; or we know the relations 
        <span class="math"><hi rend="it">R</hi><sub><hi rend="it">x</hi></sub>( 
        <img width="12" height="12" align="bottom" border="0" src="../../images/img_alpha.png" alt="$ \alpha$"/>, 
        <img width="12" height="26" align="middle" border="0" src="../../images/img_beta.png" alt="$ \beta$"/>)</span>and 
        <span class="math"><hi rend="it">R</hi><sub><hi rend="it">z</hi></sub>( 
        <img width="12" height="12" align="bottom" border="0" src="../../images/img_alpha.png" alt="$ \alpha$"/>, 
        <img width="11" height="24" align="middle" border="0" src="../../images/img_gamma.png" alt="$ \gamma$"/>)</span>, and we try to deduce the
        discourse relation 
        <span class="math"><hi rend="it">R</hi><sub><hi rend="it">y</hi></sub></span>holding between 
        <span class="math"><img width="12" height="26" align="middle" border="0" src="../../images/img_beta.png" alt="$ \beta$"/></span>and 
        <span class="math"><img width="11" height="24" align="middle" border="0" src="../../images/img_gamma.png" alt="$ \gamma$"/></span>. These rules rely on theoretical relation's
        description and empirical data, gathered with our lexicon
        of connectives.</p>
      </subsection>
    </subsection>
    <subsection id="uid82" level="1">
      <bodyTitle>“Wrong” strong punctuation signs</bodyTitle>
      <participants>
        <person key="alpage-2008-idm542378767840">
          <firstname>Laurence</firstname>
          <lastname>Danlos</lastname>
        </person>
        <person key="atoll-2006-idm57727917280">
          <firstname>Benoît</firstname>
          <lastname>Sagot</lastname>
        </person>
      </participants>
      <p>Some strong punctuation signs are “wrongly” used instead
      of weak punctuation signs, leading to graphic sentences which
      are not grammatical sentences, see the following discourse
      which includes five graphic sentences only made up of
      adverbial phrases.</p>
      <p rend="center">On avait donné dans le Nord un grand coup de
      pied dans la fourmilière, et les fourmis s'en allaient.
      Laborieusement. Sans panique. Sans espoir. Sans désespoir.
      Comme par devoir. [Saint Exupéry, Pilote de guerre]</p>
      <p>In 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid71" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we present a corpus study of
      this phenomenon — sometimes called “épexégèse” — and a tool
      in the early stages to automatically detect wrong strong
      punctuation signs. The goal of this tool is to automatically
      categorize these punctuation signs as weak, so that a parser
      can make a standard syntactic and semantic analysis.</p>
    </subsection>
    <subsection id="uid83" level="1">
      <bodyTitle>Lexical incompleteness: typology and exploration
      of unknown words</bodyTitle>
      <participants>
        <person key="atoll-2006-idm57727917280">
          <firstname>Benoît</firstname>
          <lastname>Sagot</lastname>
        </person>
        <person key="alpage-2009-idm402038280912">
          <firstname>Rosa</firstname>
          <lastname>Stern</lastname>
        </person>
        <person key="alpage-2009-idm402038293216">
          <firstname>Gaëlle</firstname>
          <lastname>Recourcé</lastname>
        </person>
      </participants>
      <p>In an attempt to cope with lexical incompleteness within
      the EDyLex project ( 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid95" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>), a typology of unknown words
      (i.e. words, forms, tokens) has been proposed. This typology
      reflects both linguistic structures and operational issues
      regarding unknown words. It is indeed intended to guide
      automatic processing modules in the handling of
      out-of-lexicon words. Unknown words are defined relative
      to the kind of unknown tokens which compose them. Those can
      be either productive sequences (such as dates, recognizable
      for example by a local grammar), productive lexical creations
      ( 
      <i>red-hair</i>), lexicalized forms ( 
      <i>cupboard</i>), proper names, borrowings, dependent
      components ( 
      <i>priori</i>) or errors (spelling, misprint).</p>
      <p>In order to verify and improve this typology, a corpus
      annotation of unknown words based on it has been carried out
      in two phases. First the corpus, consisting of xxx news items
      from Agence France Presse in French, English and Spanish,
      has been automatically annotated with the Alpage surface
      processing chain SxPipe, able to recognize a series of
      out-of-lexicon sequences and forms (dates, URLs, numerical
      values, proper names, some prefixed compositions...); this
      automatic annotation then marked remaining out-of-lexicon
      forms, based on the lexicons available in the three languages
      within the Alexina framework (Lefff, Enlex and Leffe). In the
      second phase the latter forms have been reviewed by human
      annotators who assigned to each of them the appropriate
      category from the typology. A high inter-annotator agreement
      showed the relevance of this typology, which can therefore help
      the building of a complete and modular processing chain for
      lexical resource enrichment.</p>
    </subsection>
    <subsection id="uid84" level="1">
      <bodyTitle>Named entities recognition and resolution: a
      modular system and its resources</bodyTitle>
      <participants>
        <person key="atoll-2006-idm57727917280">
          <firstname>Benoît</firstname>
          <lastname>Sagot</lastname>
        </person>
        <person key="alpage-2009-idm402038280912">
          <firstname>Rosa</firstname>
          <lastname>Stern</lastname>
        </person>
      </participants>
      <p>Within the Alpage surface processing chain SxPipe, a
      series of modules based on local grammars enable the analysis
      of sequences at the token- and form-level such as dates,
      URLs, addresses... A new version of NP, the named entity
      recognition tool, has been integrated to SxPipe in order to
      cope with named entities of different types (person,
      location, organization and company names). NP's local grammar
      consists of 130 rules, including contextual patterns and
      triggers, for detection and typing of named entities. In
      order for those rules to operate efficiently, a lexicon of
      proper nouns can be associated with it. The lexicon consists of
      a list of forms accepted by the grammar as named entity
      variants and can be obtained by several means.</p>
      <p>In this prospect, a database called Aleda has been built,
      based on two main external and freely available resources:
      Wikipedia and Geonames. Aleda intends to gather information
      and knowledge on entities and not only a list of entity
      names. This knowledge (precise type of the entity (for
      example capital, country, museum are subtypes of location),
      decomposition and variation of its name (title, last name,
      pseudonym, short form...), main sector of organizations and
      companies...) is reflected in its structure by dedicated
      typed fields. The base can then be converted into a lexicon,
      linking each entity to its variants with a unique identifier.
      This structure allows for the subsequent use of information
      contained in Aleda by the client application.</p>
      <p>In order to make named entities recognition more complete
      and usable as an information extraction module, the
      denotational aspect of named entities must be handled, i.e.
      the entity to which a recognized name refers must be
      identified. This process of 
      <i>entity resolution</i> can be based on an entity base such
      as Aleda. After the recognition phase, the result of which
      is a set of entity mentions in text, the resolution phase
      intends to link each mention to the adequate entity in the
      reference base. This operation must deal with possible
      ambiguities among homonyms or names referring to entities
      absent from the base. Disambiguation can benefit from the
      knowledge gathered in Aleda, for example by comparing
      information associated to entities and named entities
      contexts in the text.</p>
    </subsection>
    <subsection id="uid85" level="1">
      <bodyTitle>Developing language resources for Persian and
      Kurdish languages</bodyTitle>
      <participants>
        <person key="atoll-2006-idm57727917280">
          <firstname>Benoît</firstname>
          <lastname>Sagot</lastname>
        </person>
      </participants>
      <p>In 2010, Alpage has taken part actively in the PerGram
      French-German project (co-funded by ANR and DFG, see 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid100" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>). In particular, the development
      of an Alexina description of the morphology of Persian and
      the development of an associated Persian Alexina lexicon,
      named PerLex, has been pursued following a first preliminary
      version in end-2009 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid72" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. This work, in collaboration
      with Géraldine Walther (from LLF, Université Paris 7) and
      Pollet Samvelian, Pegah Fagiri and Ariel Gutman (MII, CNRS
      and Université Paris 3), has also led to adapting the
      shallow processing chain 
      <span class="smallcap" align="left">Sx</span>Pipe to Persian 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid73" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. Ongoing work has started for
      the manual validation of PerLex and for its extension to the
      syntactic level (sub-categorization frames, entries for
      “complex predicates”...).</p>
      <p>Benoît Sagot and Géraldine Walther have then pursued their
      efforts for resourcing Western Iranian languages. First, they
      formalized a methodology for developing a morphological
      lexicon for a language lacking any resource, and applied its
      first steps to Sorani Kurdish, hence creating a preliminary
      small-scale Alexina lexicon for this language 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid72" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. Second, they performed
      experiments on later stages of this methodology, but in
      Kurmanji Kurdish 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid74" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, which is another Kurdish
      variant for which lexical resources do exist, although not
      formalized. Their work includes preliminary experiments on
      developing a POS tagger using a lexicon but no annotated
      training corpus. These experiments will be pursued in 2011,
      and both Kurdish lexicons should reach a significant
      size.</p>
    </subsection>
    <subsection id="uid86" level="1">
      <bodyTitle>Word ordering</bodyTitle>
      <participants>
        <person key="alpage-2009-idm402038273904">
          <firstname>Juliette</firstname>
          <lastname>Thuilier</lastname>
        </person>
        <person key="alpage-2008-idm542378770960">
          <firstname>Benoît</firstname>
          <lastname>Crabbé</lastname>
        </person>
      </participants>
      <p>We study the problem of choice in the ordering of French
      words building upon two case studies. Both studies try to
      identify the factors that come into play when one has to
      choose among several possible orderings: the first inquiry
      is dedicated to the position of attributive adjectives with
      respect to the noun. The second is dedicated to the relative order of
      postverbal dependents. Both questions have almost never been
      addressed for French.</p>
      <p>In collaboration with Gwen Fox (Université Paris 3), the
      first investigation in this direction has been led towards
      identifying the importance of constraints that drive the
      placement of attributive adjectives wrt the noun in the noun
      phrase in French. This study brings an additional element to
      Bresnan’s thesis, according to which the syntactic competence
      of human beings is indeed probabilistic. This year we
      enhanced our previous statistical models with a qualitative
      study trying to shed light (1) on semantic effects and (2) on
      word-independent versus word-specific constraints.</p>
      <p>Another study on preferences in verbal complementation has
      started this year. We are planning to study the preferences
      between postverbal dependents (direct objects and indirect
      objects). This year we started by extracting data suitable
      for statistical modeling mainly from the French Treebank and
      started to annotate the treebank with missing information (of
      semantic nature). The expected outcome of this work is
      first to identify factors that are relevant in French;
      beyond that, in a crosslinguistic perspective, we plan to compare
      them with the constraints observed in other languages such as German.
      This is intended to be carried out in collaboration with
      psycholinguistic teams both in Paris 5 (LPNCog) and in
      Germany (Frias, Freiburg); the Laboratoire de Linguistique
      Formelle (LLF) in Paris 7 also intends to set up experimental
      work in connection with our modeling results in this
      framework for French.</p>
      <p>As can be seen from the outline above, this line of
      research brings us closer to cognitive sciences and more
      specifically to frameworks inspired by construction grammar.
      We hope in the very long run that these investigations will
      bring – among others – further insights on the design of
      probabilistic parsers. In NLP the framework that is closest
      to implementing construction grammar is Data Oriented
      Parsing.</p>
    </subsection>
    <subsection id="uid87" level="1">
      <bodyTitle>Unsupervised acquisition of allophonic
      rules</bodyTitle>
      <participants>
        <person key="alpage-2009-idm402038353920">
          <firstname>Luc</firstname>
          <lastname>Boruta</lastname>
        </person>
        <person key="alpage-2008-idm542378770960">
          <firstname>Benoît</firstname>
          <lastname>Crabbé</lastname>
        </person>
      </participants>
      <p>This is an exploratory work on modelling the acquisition
      of allophonic rules. It is carried out in collaboration with the
      Laboratoire de Sciences Cognitives de Paris (LSCP). It
      explores the acquisition of the phonological system made by
      children relying upon the assumption that word segmentation
      and phonological learning are dependent processes feeding
      each other. Hence this work splits into two subproblems, that
      of segmentation and that of phonological clustering.</p>
      <p>State-of-the-art models of the acquisition of word
      segmentation have been evaluated using phonemically
      transcribed corpora. As such, they implicitly assume that
      children know how to undo phonetic variation when they learn
      to extract words from fluent speech. Moreover, whereas models
      of language acquisition should perform similarly across
      languages, evaluation is often limited to English samples. We
      first argue that online learning is a sound desideratum for
      any model of language acquisition and use this criterion to
      select candidate segmentation models. Then, using
      child-directed corpora of English, French and Japanese, we
      evaluate the models' performance given inputs where phonetic
      variation has not been reduced. To do so, we propose a
      parametric benchmark where segmentation robustness can be
      measured across different levels of noise, simulating uniform
      errors in phoneme recognition or systematic allophonic
      variation. We show that statistical models do not resist
      noisy inputs and do not generalize to typologically different
      languages. From the perspective of early language
      acquisition, the results strengthen the hypothesis according
      to which phonological knowledge is acquired in large part
      before the construction of a lexicon.</p>
      <p>It is recognized that infants learn phonemes through some
      kind of unsupervised clustering of the speech signal.
      Previous work has shown the feasibility of unsupervised
      clustering, using as input manually segmented phonetic
      parameters 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid75" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid76" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> showed that an HMM
      state-splitting algorithm run on conversational speech coded
      using standard MFCC coefficients automatically grows a network
      of HMM states which successfully encoded speech sounds with
      no loss of information compared to supervised HMM training.
      However the obtained states did not map one-to-one to
      phonemes: phoneme-size strings of states did not yield
      abstract phonemes, but rather, context-dependent allophones.
      This problem is serious enough to impede subsequent
      unsupervised learning of words 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid77" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>. To address this issue, we will
      recluster allophonic variants using higher order information
      in addition to acoustic distance in order to improve the
      metric used in the clustering algorithm. Two such kinds of
      information have been shown to be helpful: distributional information
      about adjacent segments 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid78" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/> and (pseudo)-lexical information
      obtained through approximating a lexicon using frequent 
      <span class="math"><hi rend="it">n</hi></span>-grams 
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#alpage-2010-bid79" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>.</p>
    </subsection>
  </resultats>
  <contrats id="uid88">
    <bodyTitle>Contracts and Grants with Industry</bodyTitle>
    <subsection id="uid89" level="1">
      <bodyTitle>Contracts with Industry</bodyTitle>
      <p>Alpage has developed several collaborations with
      industrial partners. Apart from grants described in the next
      section, specific collaboration agreements have been set up
      with Verbatim Analysis (license agreement, see section  
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid37" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>), Kwaga (ARITT contract, see
      section  
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid38" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>), TNS-Sofres (see section  
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid40" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>) and possibly soon Lingua et
      Machina (see section  
      <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="#uid39" location="intern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>).</p>
    </subsection>
  </contrats>
  <international id="uid90">
    <bodyTitle>Other Grants and Activities</bodyTitle>
    <subsection id="uid91" level="1">
      <bodyTitle>Regional Initiatives</bodyTitle>
      <subsection id="uid92" level="2">
        <bodyTitle>Action Scribo (2007 – 2009, extended until
        2010)</bodyTitle>
        <participants>
          <person key="alpage-2009-idm402038308688">
            <firstname>Éric</firstname>
            <lastname>Villemonte de La Clergerie</lastname>
          </person>
          <person key="alpage-2010-idm152476259776">
            <firstname>Kata</firstname>
            <lastname>Gábor</lastname>
          </person>
          <person key="alpage-2010-idm152476291760">
            <firstname>Marianna</firstname>
            <lastname>Apidianaki</lastname>
          </person>
          <person key="PASUSERID">
            <firstname>Tim</firstname>
            <lastname>van de Cruys</lastname>
          </person>
          <person key="alpage-2010-idm152476230416">
            <firstname>Yayoi</firstname>
            <lastname>Nakamura-Delloye</lastname>
          </person>
          <person key="alpage-2009-idm402038280912">
            <firstname>Rosa</firstname>
            <lastname>Stern</lastname>
          </person>
          <person key="atoll-2006-idm57727917280">
            <firstname>Benoît</firstname>
            <lastname>Sagot</lastname>
          </person>
        </participants>
        <moreinfo>
          <p>Scribo Homepage: 
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://www.scribo.ws/xwiki/bin/view/Main/WebHome" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>www. 
          <allowbreak/>scribo. 
          <allowbreak/>ws/ 
          <allowbreak/>xwiki/ 
          <allowbreak/>bin/ 
          <allowbreak/>view/ 
          <allowbreak/>Main/ 
          <allowbreak/>WebHome</ref></p>
        </moreinfo>
        <p>Scribo aims at algorithms and collaborative free
        software for the automatic extraction of knowledge from
        texts and images, and for the semi-automatic annotation of
        digital documents. Scribo has a total budget of 4.3M Euros
        and is funded by the French “Pôle de compétitivité”
        System@tic from mid-2008 until the end of 2010. It brings 9
        participants together: AFP, CEA LIST, INRIA, LRDE (Epita),
        Mandriva, Nuxeo, Proxem, Tagmatica and XWiki.</p>
      </subsection>
    </subsection>
    <subsection id="uid93" level="1">
      <bodyTitle>National Initiatives</bodyTitle>
      <subsection id="uid94" level="2">
        <bodyTitle>ANR project 
        <span class="smallcap" align="left">Sequoia</span> (2009 –
        2011)</bodyTitle>
        <participants>
          <person key="atoll-2006-idm57727917280">
            <firstname>Benoît</firstname>
            <lastname>Sagot</lastname>
          </person>
          <person key="atoll-2006-idm57727947600">
            <firstname>Pierre</firstname>
            <lastname>Boullier</lastname>
          </person>
          <person key="alpage-2008-idm542378777200">
            <firstname>Marie</firstname>
            <lastname>Candito</lastname>
          </person>
          <person key="alpage-2008-idm542378770960">
            <firstname>Benoît</firstname>
            <lastname>Crabbé</lastname>
          </person>
          <person key="alpage-2008-idm542378764240">
            <firstname>Pascal</firstname>
            <lastname>Denis</lastname>
          </person>
          <person key="alpage-2009-idm402038308688">
            <firstname>Éric</firstname>
            <lastname>Villemonte de La Clergerie</lastname>
          </person>
          <person key="alpage-2008-idm542378729584">
            <firstname>Djamé</firstname>
            <lastname>Seddah</lastname>
          </person>
          <person key="alpage-2009-idm402038277728">
            <firstname>Sattisvar</firstname>
            <lastname>Tandabany</lastname>
          </person>
        </participants>
        <p>Alpage plays a major role in the ANR-funded project 
        <span class="smallcap" align="left">Sequoia</span>, led by
        Alexis Nasr (LIF, University of Marseille-Provence, former
        member of the Talana team at University Paris 7). This
        project aims at developing or adapting probabilistic
        parsing techniques in order to release a high-performance
        parser for French based on 
        <span class="smallcap" align="left">Syntax</span>. It
        brings together specialists of NLP and specialists of
        Machine Learning, in a very fruitful way.</p>
      </subsection>
      <subsection id="uid95" level="2">
        <bodyTitle>ANR project EDyLex (2010 – 2012)</bodyTitle>
        <participants>
          <person key="atoll-2006-idm57727917280">
            <firstname>Benoît</firstname>
            <lastname>Sagot</lastname>
            <moreinfo>principal investigator</moreinfo>
          </person>
          <person key="alpage-2009-idm402038280912">
            <firstname>Rosa</firstname>
            <lastname>Stern</lastname>
          </person>
          <person key="alpage-2008-idm542378767840">
            <firstname>Laurence</firstname>
            <lastname>Danlos</lastname>
          </person>
          <person key="alpage-2008-idm542378764240">
            <firstname>Pascal</firstname>
            <lastname>Denis</lastname>
          </person>
        </participants>
        <p>EDyLex is an ANR project (STIC/CONTINT) headed by Benoît
        Sagot. The focus of the project is the dynamic acquisition
        of new entries in existing lexical resources that are used
        in syntactic and semantic parsing systems: how to detect
        and qualify an unknown word or a new named entity in a
        text? How to associate it with phonetic, morphosyntactic,
        syntactic, semantic properties and information? Various
        complementary techniques will be explored and crossed
        (probabilistic and symbolic, corpus-based and
        rule-based...). Their application to the contents produced
        by the AFP news agency (Agence France-Presse) constitutes a
        context that is representative of the problems of
        incompleteness and lexical creativity: indexing, creation
        and maintenance of ontologies (location and person names,
        topics), both necessary for handling and organizing a
        massive information flow (over 4,000 news wires per
        day).</p>
        <p>The participants of the project, besides Alpage, are the
        LIF (Université de la Méditerranée), the LIMSI (CNRS team),
        two small companies, Syllabs and Vecsys Research, and the
        AFP.</p>
      </subsection>
      <subsection id="uid96" level="2">
        <bodyTitle>ANR project Rhapsodie (2008 – 2010)</bodyTitle>
        <participants>
          <person key="alpage-2008-idm542378745744">
            <firstname>Sylvain</firstname>
            <lastname>Kahane</lastname>
          </person>
          <person key="alpage-2009-idm402038308688">
            <firstname>Éric</firstname>
            <lastname>Villemonte de La Clergerie</lastname>
          </person>
          <person key="alpage-2008-idm542378777200">
            <firstname>Marie</firstname>
            <lastname>Candito</lastname>
          </person>
          <person key="alpage-2008-idm542378770960">
            <firstname>Benoît</firstname>
            <lastname>Crabbé</lastname>
          </person>
          <person key="atoll-2006-idm57727917280">
            <firstname>Benoît</firstname>
            <lastname>Sagot</lastname>
          </person>
        </participants>
        <p>Rhapsodie is an ANR project headed by Anne Lacheret
        (University Paris X). The aim of the project is to study
        the matching of prosody and syntax on a 30-hour corpus of
        spoken French by providing prosodic and syntactic
        annotations. Alpage participates in the project at two
        different levels: the specification of the transcription and
        syntactic annotation framework and the use of parsers for
        preparing the manually validated syntactic corpus
        annotation.</p>
      </subsection>
      <subsection id="uid97" level="2">
        <bodyTitle>ANR project PASSAGE (2007 – mid
        2010)</bodyTitle>
        <participants>
          <person key="alpage-2009-idm402038308688">
            <firstname>Éric</firstname>
            <lastname>Villemonte de La Clergerie</lastname>
          </person>
        </participants>
        <moreinfo>
          <p>PASSAGE Homepage: 
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://atoll.inria.fr/passage" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>atoll. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>passage</ref></p>
          <p noindent="true">EASy homepage: 
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://www.elda.org/easy" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>www. 
          <allowbreak/>elda. 
          <allowbreak/>org/ 
          <allowbreak/>easy</ref></p>
        </moreinfo>
        <p>PASSAGE is an action in ANR MDCA program ( 
        <i>Masse de Données Connaissance Ambiantes</i>) started in
        2007 and extended till mid 2010. The participants are
        Alpage (coordinator), LIR (LIMSI, Orsay), “Langue &amp;
        Dialogue” (LORIA, Nancy), LI2CM (CEA-LIST), plus several
        contractors (ELDA, TAGMATICA and several providers of
        parsing systems).</p>
        <p>PASSAGE stands for “ 
        <i>Large Scale Production of Syntactic Annotations to move
        forward</i>”. Its main objectives are to parse a large
        corpus (100 to 200 million words) with several parsers
        (around 10 systems), combine the results provided by these
        parsers and use the resulting annotations to acquire new
        linguistic knowledge (semantic classes, subcategorization
        frames, disambiguation probabilities, ...). A small part of
        the corpus (around 400,000 words) will be manually validated
        to be used as a reference treebank. Two evaluation
        campaigns based on the work done during the Technolangue
        action EASy will be conducted during PASSAGE to assess the
        performances of the parsing systems. The annotations and
        derived linguistic resources will be made available.</p>
      </subsection>
    </subsection>
    <subsection id="uid98" level="1">
      <bodyTitle>European Initiatives</bodyTitle>
      <subsection id="uid99" level="2">
        <bodyTitle>Galician government research project Victoria
        (2008 – 2010)</bodyTitle>
        <participants>
          <person key="alpage-2009-idm402038308688">
            <firstname>Éric</firstname>
            <lastname>Villemonte de La Clergerie</lastname>
          </person>
          <person key="atoll-2006-idm57727917280">
            <firstname>Benoît</firstname>
            <lastname>Sagot</lastname>
          </person>
        </participants>
        <p>As a follow-up of a long lasting collaboration with
        Galician universities, ALPAGE, Éric de La Clergerie and
        Benoît Sagot are strongly involved as associate researchers
        in the Galician government research project Victoria on the
        development of Spanish and Galician linguistic resources by
        adapting tools, methods and resources developed by
        ALPAGE.</p>
      </subsection>
      <subsection id="uid100" level="2">
        <bodyTitle>French-German ANR project Pergram (2009 –
        2011)</bodyTitle>
        <participants>
          <person key="atoll-2006-idm57727917280">
            <firstname>Benoît</firstname>
            <lastname>Sagot</lastname>
          </person>
        </participants>
        <p>The Pergram project (French-German ANR/DFG project) is
        led by Pollet Samvelian (University Paris 3). Its
        goal is the description of central phenomena in Persian and
        the development of a non-trivial grammar fragment in the
        framework of HPSG. The development of this grammar will
        benefit from the expertise of the German side on phenomena
        that are not found in French or English, such as
        scrambling, but will also deal with Persian-specific
        phenomena such as complex noun-verb predicates. In
        parallel, the project includes the development of various
        lexical resources, thanks in part to techniques and tools
        developed by Alpage members within the Alexina framework:
        (i) a full form lexicon of verbs and common nouns, for
        which a first version is now available, (ii) valency frames
        for verbs, and (iii) the most common Light Verb Constructions
        (LVCs), including idiomatic preverb light verb
        combinations.</p>
      </subsection>
      <subsection id="uid101" level="2">
        <bodyTitle>French-Slovene bilateral project “Building
        Slovene-French Linguistic Resources” (2010 –
        2011)</bodyTitle>
        <participants>
          <person key="atoll-2006-idm57727917280">
            <firstname>Benoît</firstname>
            <lastname>Sagot</lastname>
          </person>
          <person key="alpage-2010-idm152476291760">
            <firstname>Marianna</firstname>
            <lastname>Apidianaki</lastname>
          </person>
        </participants>
        <p>The objective of this project, jointly led by Benoît
        Sagot (Alpage) and Mojca Schlamberger-Brezar (University of
        Ljubljana) is the development of multilingual linguistic
        resources for Slovene and French. The French funding is
        provided by EGIDE. The project is organized around two main
        goals: the development of a French-Slovene aligned and
        morphosyntactically annotated corpus, and the extension
        using semi-automatic techniques (automatic construction and
        manual validation) of the WOLF and of SloWNet, the
        wordnets for both languages. All these resources will be
        made available to the community by a distribution under a
        free license (e.g., LGPL-LR).</p>
      </subsection>
    </subsection>
    <subsection id="uid102" level="1">
      <bodyTitle>International Initiatives</bodyTitle>
      <subsection id="uid103" level="2">
        <bodyTitle>ISO subcommittee TC37 SC4 on “Language Resources
        Management”</bodyTitle>
        <participants>
          <person key="alpage-2009-idm402038308688">
            <firstname>Éric</firstname>
            <lastname>Villemonte de La Clergerie</lastname>
          </person>
        </participants>
        <p>The participation of ALPAGE in the French Technolangue
        action Normalangue has resulted in a strong involvement in
        ISO subcommittee TC37 SC4 on “Language Resources
        Management” ( 
        <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://www.tc37sc4.org/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
        <allowbreak/>www. 
        <allowbreak/>tc37sc4. 
        <allowbreak/>org/ 
        <allowbreak/></ref>). Éric de La Clergerie has
        participated in ISO events and has acted as an expert
        (in particular on morpho-syntactic annotations [MAF],
        feature structures [FSR &amp; new FSD], and syntactic
        annotations [SynAF]).</p>
      </subsection>
    </subsection>
  </international>
  <diffusion id="uid104">
    <bodyTitle>Dissemination</bodyTitle>
    <subsection id="uid105" level="1">
      <bodyTitle>Animation of the scientific community</bodyTitle>
      <simplelist>
        <li id="uid106">
          <p noindent="true">Éric de La Clergerie is an elected
          substitute member of INRIA's “Conseil scientifique”.</p>
        </li>
        <li id="uid107">
          <p noindent="true">Alpage is involved in the French
          journal T.A.L. (AERES linguistic rank: A). Éric de La
          Clergerie is “Rédacteur en chef” and was the editor of
          the regular issue 52/1 (2011). Laurence Danlos and
          Philippe Muller are members of the editorial board.
          Benoît Sagot was “Secrétaire de rédaction” of the journal
          until September 2010. He has been invited to be the guest
          editor, with Nuria Bel, for a special issue on Language
          Resources.</p>
        </li>
        <li id="uid108">
          <p noindent="true">Alpage is deeply involved in a
          forthcoming special issue of the major journal in our
          field of research, Computational Linguistics. Djamé
          Seddah is one of the guest editors of this issue devoted
          to “Parsing of morphologically-rich languages” while
          Marie Candito is a reviewer for this issue.</p>
        </li>
        <li id="uid109">
          <p noindent="true">Alpage members were involved in many
          Program, Scientific or Reviewing Committees for other
          journals and conferences, such as TALN 2010 (Laurence
          Danlos, Benoît Sagot, Éric de La Clergerie, Sylvain
          Kahane, Benoît Crabbé, Djamé Seddah, Philippe Muller),
          the 2nd CMLF (Laurence Danlos), ACL 2010 (parsing area,
          Éric de La Clergerie), ECAI 2010 (Éric de La Clergerie),
          TAG+10 (Éric de La Clergerie), STAIRS 2010 (Éric de La
          Clergerie), Computational Linguistics (Éric de La
          Clergerie), LRE (Éric de La Clergerie), CoLing 2010
          (Pascal Denis, Éric de La Clergerie), NAACL-HLT 2010
          (syntax and parsing area, Éric de La Clergerie) and EMNLP
          2010 (Pascal Denis).</p>
        </li>
        <li id="uid110">
          <p noindent="true">Djamé Seddah and Benoît Sagot are
          elected board members of the French NLP society
          (ATALA);</p>
          <p noindent="true">Djamé Seddah is Program Chair of the
          “Journées ATALA” (one day long workshops in NLP, 4 or 5
          per year); Benoît Sagot is Deputy Secretary since
          September 2010.</p>
        </li>
        <li id="uid111">
          <p noindent="true">Laurence Danlos is a member of the
          Permanent Committee of the TALN conference organized by
          ATALA</p>
        </li>
        <li id="uid112">
          <p noindent="true">Éric de La Clergerie has reviewed a
          proposal for the French program ANR CONTINT.</p>
        </li>
        <li id="uid113">
          <p noindent="true">Djamé Seddah is one of the founders of
          the statistical parsing of morphologically rich languages
          initiative that started during IWPT'09. He was the
          program co-chair of the successful SPMRL 2010 NAACL-HLT
          Workshop (2nd most successful workshop of this conference
          in terms of attendees) and will be again for its next
          edition (that will take place during IWPT'11). Alpage
          is deeply involved in this initiative (with Marie Candito
          part of its core members and Benoît Sagot member of its
          review committee).</p>
        </li>
        <li id="uid114">
          <p noindent="true">Marianna Apidianaki has undertaken the
          organization of an ACL Workshop on “Syntax, Semantics and
          Structure in Statistical Translation” together with
          Marine Carpuat (National Research Council, Canada), Lucia
          Specia (University of Wolverhampton, UK) and Prof. Dekai
          Wu (Hong Kong University).</p>
        </li>
        <li id="uid115">
          <p noindent="true">Benoît Sagot has started the
          organization of WoLer 2011, an ESSLLI 2011 workshop on
          Lexical Resources ( 
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://alpage.inria.fr/~sagot/woler2011/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>alpage. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>~sagot/ 
          <allowbreak/>woler2011/ 
          <allowbreak/></ref>), to be held in Ljubljana, Slovenia
          in August 2011.</p>
        </li>
        <li id="uid116">
          <p noindent="true">Marianna Apidianaki and Benoît Sagot
          are organizing a one-day ATALA workshop on the
          “Extraction of lexical, semantic and syntactic
          information from multilingual corpora” that will take
          place in May 2011.</p>
        </li>
        <li id="uid117">
          <p noindent="true">Laurence Danlos, Benoît Sagot and Éric
          de La Clergerie co-organized with Laure Aït-Ali the
          Journée Iliatech on "Apport des technologies de la langue
          pour l'accès à l'information". Laurence Danlos presented
          Alpage's work in a talk entitled "Au-delà de l'analyse
          syntaxique, analyse sémantique et discursive". Éric de La
          Clergerie has presented demonstrations of Alpage tools,
          and Benoît Sagot presented his work on 
          <i>vera</i>.</p>
        </li>
        <li id="uid118">
          <p noindent="true">Laurence Danlos attended the
          Journée Club Ina SUP (Cap-Digital), Paris, on "Moteur de
          recherche ; de l'accès à la maîtrise des contenus"</p>
        </li>
        <li id="uid119">
          <p noindent="true">Alpage is an active member in the
          LabEx proposal on Experimental Linguistics, headed by
          Jacqueline Vaissière (Univ. Paris 3) and supported by the
          PRES Paris-Cité. Benoît Sagot is in charge of one of the
          6 scientific “strands”, the strand on Language
          Resources.</p>
        </li>
      </simplelist>
    </subsection>
    <subsection id="uid120" level="1">
      <bodyTitle>Participation to workshops, conferences, and
      invitations</bodyTitle>
      <li id="uid121">
        <p noindent="true">Laurence Danlos, Charlotte Roze and
        Philippe Muller co-presented a paper at the Conference on
        Multidisciplinary Approaches to Discourse (MAD 2010) in
        Moissac, France, on "LEXCONN: a French Lexicon of Discourse
        Connectives"</p>
      </li>
      <li id="uid122">
        <p noindent="true">Several Alpage members attended LREC
        2010 at Valletta, Malta. Laurence Danlos presented a paper
        on "Learning recursive segments for discourse parsing" on
        behalf of herself, Pascal Denis and Philippe Muller and a
        fourth co-author. Marie Candito presented a poster on
        "Statistical French dependency parsing: treebank conversion
        and first results" on behalf of herself, Benoît Crabbé and
        Pascal Denis. Benoît Sagot presented a paper on "The Le 
        <i>fff</i>, a freely available, accurate and large-coverage
        lexicon for French". Laurence Danlos, Benoît Sagot and Rosa
        Stern co-presented a poster on "A Lexicon of French
        Quotation Verbs for Automatic Quotation Extraction". Benoît
        Sagot co-presented a poster on "A morphological lexicon for
        the Persian language". Other communications were presented
        during LREC workshops, and in particular a poster on
        "Resources for Named Entity Recognition and Resolution in
        News Wires" (Rosa Stern and Benoît Sagot), a poster on
        "Developing a large-scale lexicon for a less-resourced
        language: general methodology and preliminary experiments
        on Sorani Kurdish" (Benoît Sagot and a co-author),
        "Creating and maintaining language resources: the main
        guidelines of the Victoria project" (Benoît Sagot and
        co-authors).</p>
      </li>
      <li id="uid123">
        <p noindent="true">Several Alpage members attended the
        NAACL workshop on statistical parsing of morphologically
        rich languages (SPMRL), co-organised by Djamé Seddah. Marie
        Candito presented a paper on "Parsing word clusters" on
        behalf of herself and Djamé Seddah. Djamé Seddah presented
        a paper on "Lemmatization and Statistical Lexicalized
        Parsing of Morphologically-Rich Languages" on behalf of
        himself, Grzegorz Chrupała, Özlem Çetinoğlu, Josef van
        Genabith and Marie Candito.</p>
      </li>
      <li id="uid124">
        <p noindent="true">Laurence Danlos attended the 2ème
        Congrès Mondial de Linguistique Française, New Orleans,
        United States, where she presented a paper on "Analyse
        discursive des incises de citation" on behalf of herself,
        Benoît Sagot and Rosa Stern.</p>
      </li>
      <li id="uid125">
        <p noindent="true">Several Alpage members attended the TALN
        conference in Montréal, Canada. Pascal Denis, on behalf of
        himself and Benoît Sagot, presented a paper on
        "Exploitation d'une ressource lexicale pour la construction
        d'un étiqueteur morphosyntaxique état-de-l'art du
        français". Benoît Sagot and his co-author presented a paper
        on "Développement de ressources pour le persan: lexique
        morphologique et chaîne de traitements de surface".
        Laurence Danlos and Benoît Sagot co-presented a poster
        on "Ponctuations fortes abusives". Benoît Sagot and Rosa
        Stern co-presented a poster on "Traitement des inconnus :
        une approche systématique de l’incomplétude lexicale" with
        other co-authors. Rosa Stern and Benoît Sagot co-presented
        a poster on "Détection et résolution d'entités nommées dans
        des dépêches d'agence". Éric de La Clergerie presented on
        behalf of himself and Yayoi Nakamura-Delloye a poster on
        "Exploitation de résultats d'analyse syntaxique pour
        extraction semi-supervisée des chemins de relations".
        Juliette Thuilier presented on behalf of herself, Benoît
        Crabbé and one co-author a paper on "Approche quantitative
        en syntaxe : l'exemple de l'alternance de position de
        l'adjectif épithète en français". Philippe Muller presented
        two communications with co-authors.</p>
      </li>
      <li id="uid126">
        <p noindent="true">Pascal Denis presented two papers at the
        23rd International Conference on Computational Linguistics
        (COLING 2010), held in Beijing, China. The first, full
        paper "Comparison of different algebras for inducing the
        temporal structure of texts" was presented on his and
        Philippe Muller's behalf. The second, poster paper
        "Benchmarking of statistical dependency parsers for French"
        was presented on behalf of Marie Candito, himself, Enrique
        Henestroza Anguiano and a fourth co-author.</p>
      </li>
      <li id="uid127">
        <p noindent="true">Laurence Danlos and Benoît Sagot
        attended the 28th Conference on Lexis and Grammar,
        Belgrade, Serbia. Laurence Danlos and Benoît Sagot
        co-presented a paper on "Les verbes de citation dans le
        Lexique-Grammaire", and Benoît Sagot and his co-authors
        presented a paper on "Fast Development of Basic NLP Tools:
        Towards a Lexicon and a POS Tagger for Kurmanji
        Kurdish".</p>
      </li>
      <li id="uid128">
        <p noindent="true">Éric de La Clergerie and Djamé Seddah
        have participated (with presentations) in TAG+10.</p>
      </li>
      <li id="uid129">
        <p noindent="true">Djamé Seddah and Marie Candito have
        presented their respective and joint work at the NAACL-HLT
        SPMRL'2010 workshop and at LREC'2010.</p>
      </li>
      <li id="uid130">
        <p noindent="true">Éric de La Clergerie has presented
        results and demonstrations relative to the SCRIBO action at
        the SCRIBO-CoLab Barcamp (November 2010).</p>
      </li>
      <li id="uid131">
        <p noindent="true">Éric de La Clergerie has presented
        results on the PASSAGE action at the Grand Colloque STIC
        (January 2010).</p>
      </li>
      <li id="uid132">
        <p noindent="true">Participation of Éric de La Clergerie in
        ISO TC37SC4 meetings (Hong Kong, January 2010; Berlin,
        October 2010), to the related FlareNet meeting (Barcelona,
        February 2010) and during LREC 2010 (May 2010).</p>
      </li>
      <li id="uid133">
        <p noindent="true">Laurence Danlos made a 5-day visit to
        the Université de Montréal, Canada, where she gave an
        invited talk on "Présentation du formalisme D-STAG".</p>
      </li>
      <li id="uid134">
        <p noindent="true">Éric de La Clergerie has presented a
        tutorial on MAF (Morpho-syntactic Annotation Framework) at
        LREC 2010 (day on “Standards for Language Resources.
        Overview and Use”).</p>
      </li>
      <li id="uid135">
        <p noindent="true">Éric de La Clergerie has presented his
        work on “Comment améliorer une chaîne de traitement
        syntaxique ?” at Institut Gaspard Monge (University Marne
        la Vallée, January 2010) and on “Concevoir, améliorer et
        exploiter une méta-grammaire factorisée du français” at
        Geneva University (November 2010).</p>
      </li>
      <li id="uid136">
        <p noindent="true">Laurence Danlos gave an invited talk at
        the Université de Genève on "La traduction (automatique)
        des connecteurs de discours"</p>
      </li>
      <li id="uid137">
        <p noindent="true">Benoît Sagot made a 2-day visit at the
        University of Vigo, Spain, where he gave an invited
        talk</p>
      </li>
      <li id="uid138">
        <p noindent="true">Philippe Muller was invited to give a
        class, titled "Sémantique du discours et interprétation
        temporelle", at the "Atelier Jeunes Chercheurs des Journées
        Sémantique et Modélisation" in Nancy in March 2010.</p>
      </li>
      <li id="uid139">
        <p noindent="true">Pascal Denis was invited to give an
        opening class (tutorial), titled "Résolution automatique
        des anaphores", at the "Atelier Jeunes Chercheurs des
        Journées Sémantique et Modélisation" in Nancy in March
        2010.</p>
      </li>
      <li id="uid140">
        <p noindent="true">Djamé Seddah made a 3-day visit to
        Dublin City University and presented his work on
        lemmatization of lexicalized parsing models for MRLs.
        During his stay, he prepared the writing of the parse4real
        FP7 project proposal.</p>
      </li>
    </subsection>
    <subsection id="uid141" level="1">
      <bodyTitle>Teaching</bodyTitle>
      <p>Alpage is in charge of the prestigious cursus of
      Computational Linguistics of Paris 7, historically the
      first cursus in France in this domain. This cursus, which
      starts in License 3 and includes a Master 2 (research) and a
      professional Master 2, is directed by Laurence Danlos. Marie
      Candito is in charge of the License 3, and Laurence Danlos is
      in charge of both Master 2. All faculty members of Alpage are
      strongly involved in this cursus, but some Inria members also
      participate in teaching and supervising internships. Unless
      otherwise specified, all teaching done by Alpage members
      belongs to this cursus. Teaching by associate members in other
      universities is not indicated.</p>
      <p>Laurence Danlos (INRIA partial delegation): Introduction
      to NLP (3rd year of License, 28h); Discourse, NLU and NLG
      (2nd year of Master, 28h).</p>
      <p>Marie Candito: Information retrieval (2nd year of
      professional Master, 12h); Clustering and Classification (2nd
      year of professional Master, 12h); Probabilistic methods for
      Natural language processing (1st year of Master, 48h);
      Machine translation (1st year of Master, 48h); Probabilities
      and statistics for Natural language processing (3rd year of
      Licence, 24h).</p>
      <p>Benoît Sagot: Parsing systems (2nd year of Master, 24h).
      Introduction to NLP (3rd year of License in Computer Science,
      24h).</p>
      <p>Benoît Crabbé (INRIA delegation): Probabilistic methods
      for NLP (1st year of Master, 48h); Introduction to
      programming II (3rd year of Licence, 24h).</p>
      <p>Pascal Denis: Computational Semantics (2nd year of Master,
      24h).</p>
      <p>Charlotte Roze: Introduction to Programming (3rd year of
      License, 24h); Algorithmics (3rd year of License, 24h).</p>
      <p>Juliette Thuilier: Introduction to Linguistics (1st year
      of License in “Lettres modernes”, TD, 24h).</p>
      <p>François-Régis Chaumartin: Modélisation (UML) et bases de
      données (SQL) (2nd year of professional Master, 24h).</p>
      <p>Djamé Seddah, as an Assistant Professor in CS in the
      University Paris 4 Sorbonne, member of the UFR ISHA, mainly
      teaches “Generic Programming and groupware”, “Distributed
      Application and Object Programming”, “Syntactic tools and text
      Processing for NLP”, “Machine Translation Seminars” in both
      years of the Master “Ingénierie de la Langue pour la Gestion
      Intelligente de l'Information”. Djamé Seddah is also the
      “Directeur des études” of a CS transversal module for the
      Sorbonne's undergraduate students (i.e. “Certificat
      Informatique et Internet”).</p>
      <p>André Bittar is an ATER at Université Paris-Est
      Marne-la-Vallée, where he taught “Introduction to Operating
      Systems” (1st year of DUT, 52h), “Unix/HTML” (1st year of
      License, 48h) and “Programming with Python” (1st year of
      Master, 12h) during the first semester of the university year
      2009-2010.</p>
    </subsection>
    <subsection id="uid142" level="1">
      <bodyTitle>PhD committees</bodyTitle>
      <simplelist>
        <li id="uid143">
          <p noindent="true">Laurence Danlos was a reviewer for
          Eric Charton's dissertation on "Génération de phrases
          multilingues par apprentissage automatique de modèles de
          phrases", (Université d'Avignon, LIA, Computer Science
          Department)</p>
        </li>
        <li id="uid144">
          <p noindent="true">Laurence Danlos was President of Mario
          Barcala's PhD Committee (Computer Science Department,
          University of Vigo, Spain); the title of his dissertation
          is "Création de corpus et fouille de textes en
          Galicien"</p>
        </li>
        <li id="uid145">
          <p noindent="true">Laurence Danlos was a member of
          Anne-Laure Jousse's PhD Committee (Université de
          Montréal, Department of Linguistics, and Université Paris
          Diderot, UFR of Linguistics); the title of her
          dissertation is "Modèle de structuration des relations
          lexicales fondé sur le formalisme des fonctions
          lexicales"</p>
        </li>
        <li id="uid146">
          <p noindent="true">Laurence Danlos was in the PhD defense
          committees as PhD supervisor for André Bittar ("Building
          a TimeBank for French: A Reference Corpus Annotated
          According to the ISO-TimeML Standard", UFR de
          Linguistique de l'Université Paris Diderot) and SinWon
          Yoo ("Une grammaire TAG du Coréen", UFR de Linguistique
          de l'Université Paris Diderot). Philippe Muller was
          member and Pascal Denis invited member of the committee
          for the former. Benoît Crabbé was member of the committee
          for the latter.</p>
        </li>
        <li id="uid147">
          <p noindent="true">Benoît Sagot was a member of Lionel
          Nicolas's PhD Committee (Université de Nice, Computer
          Science Department); the title of his dissertation is
          "Efficient production of linguistic resources: the
          Victoria Project"</p>
        </li>
        <li id="uid148">
          <p noindent="true">Benoît Sagot was a member of Claire
          Mouton's PhD Committee (Université Paris-Sud Orsay,
          LIMSI); the title of her dissertation is "Ressources et
          méthodes semi-supervisées pour l'analyse sémantique de
          texte en français"</p>
        </li>
      </simplelist>
    </subsection>
    <subsection id="uid149" level="1">
      <bodyTitle>Commissions</bodyTitle>
      <simplelist>
        <li id="uid150">
          <p noindent="true">Laurence Danlos was a member of the
          Comité de Sélection for a Full Professor position at
          INALCO (team Ertim) specialized on “Sémantique textuelle
          outillée multilingue” (CNU section 07), for an Assistant
          Professor position at Université de Montpellier 2 (team
          LIRMM-CNRS) specialized on "Traitement Automatique des
          Langues (syntaxe)" (CNU section 27) and for a Full
          Professor position at Université de Marne la Vallée (team
          Informatique Linguistique) specialized on "Informatique
          Linguistique" (CNU sections 07 and 27).</p>
        </li>
        <li id="uid151">
          <p noindent="true">Benoît Sagot was a member of the
          Comité de Sélection for an Assistant Professor position
          at University of Marseilles (team LIF), for an Assistant
          Professor position in Computer Science at University of
          Marne-la-Vallée (Institut Gaspard Monge) and for an
          Engineer position at University of Marne-la-Vallée (team
          Informatique Linguistique).</p>
        </li>
        <li id="uid152">
          <p noindent="true">Marie Candito was a member of the
          Comité de Sélection for an Assistant Professor position
          at University of Marseilles (team LIF).</p>
        </li>
        <li id="uid153">
          <p noindent="true">Laurence Danlos is a member of the
          Scientific Committee of the Linguistics UFR of University
          Paris Diderot</p>
        </li>
        <li id="uid154">
          <p noindent="true">Laurence Danlos is a member of the
          Scientific Committee of the LIF (Laboratoire
          d'Informatique Fondamentale de Aix-Marseille) and
          participated in this team's scientific days (17-18 June
          in Agay, France)</p>
        </li>
        <li id="uid155">
          <p noindent="true">Laurence Danlos is a member of the
          Conseil de l'Ecole Doctorale "Sciences du Langage" from
          University Paris Diderot</p>
        </li>
      </simplelist>
    </subsection>
  </diffusion>
  <biblio id="bibliography" html="bibliography" numero="10" titre="Bibliography">
    <biblStruct id="alpage-2010-bid109" type="incollection" rend="refer" n="refercite:Boullier:TSLT04">
      <analytic>
        <title level="a">Range Concatenation Grammars</title>
        <author>
          <persName key="atoll-2006-idm57727947600">
            <foreName>Pierre</foreName>
            <surname>Boullier</surname>
            <initial>P.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" x-proceedings="yes">
        <editor role="editor">
          <persName>
            <foreName>Harry</foreName>
            <surname>Bunt</surname>
            <initial>H.</initial>
          </persName>
          <persName>
            <foreName>John</foreName>
            <surname>Carroll</surname>
            <initial>J.</initial>
          </persName>
          <persName key="alpage-2008-idm542378733072">
            <foreName>Giorgio</foreName>
            <surname>Satta</surname>
            <initial>G.</initial>
          </persName>
        </editor>
        <title level="m">New Developments in Parsing
        Technology</title>
        <title level="s">Text, Speech and Language
        Technology</title>
        <imprint>
          <biblScope type="volume">23</biblScope>
          <publisher>
            <orgName>Kluwer Academic Publishers</orgName>
          </publisher>
          <dateStruct>
            <year>2004</year>
          </dateStruct>
          <biblScope type="pages">269–289</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid111" type="inproceedings" rend="refer" n="refercite:boullier07iwpt">
      <analytic>
        <title level="a">Are very large grammars computationally
        tractable?</title>
        <author>
          <persName key="atoll-2006-idm57727947600">
            <foreName>Pierre</foreName>
            <surname>Boullier</surname>
            <initial>P.</initial>
          </persName>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" x-proceedings="yes">
        <title level="m">Proceedings of IWPT'07</title>
        <loc>Prague, Czech Republic</loc>
        <imprint>
          <dateStruct>
            <year>2007</year>
          </dateStruct>
        </imprint>
      </monogr>
      <note type="bnote">(selected for publication as a book
      chapter)</note>
    </biblStruct>
    <biblStruct id="alpage-2010-bid53" type="inproceedings" rend="refer" n="refercite:ccs:09">
      <analytic>
        <title level="a">On statistical parsing of French with
        supervised and semi-supervised strategies</title>
        <author>
          <persName key="alpage-2008-idm542378777200">
            <foreName>Marie</foreName>
            <surname>Candito</surname>
            <initial>M.</initial>
          </persName>
          <persName key="alpage-2008-idm542378770960">
            <foreName>Benoît</foreName>
            <surname>Crabbé</surname>
            <initial>B.</initial>
          </persName>
          <persName key="alpage-2008-idm542378729584">
            <foreName>Djamé</foreName>
            <surname>Seddah</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">EACL 2009 Workshop Grammatical
        inference for Computational Linguistics</title>
        <loc>Athens, Greece</loc>
        <imprint>
          <dateStruct>
            <year>2009</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid32" type="article" rend="refer" n="refercite:danlos09tal">
      <analytic>
        <title level="a">D-STAG : un formalisme d'analyse
        automatique de discours fondé sur les TAG
        synchrones</title>
        <author>
          <persName key="alpage-2008-idm542378767840">
            <foreName>Laurence</foreName>
            <surname>Danlos</surname>
            <initial>L.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes">
        <title level="j">Traitement Automatique des Langues</title>
        <imprint>
          <biblScope type="volume">50</biblScope>
          <biblScope type="number">1</biblScope>
          <dateStruct>
            <year>2009</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid112" type="article" rend="refer" n="refercite:danlossagot09">
      <analytic>
        <title level="a">Constructions pronominales dans
        Dicovalence et le lexique-grammaire – Intégration dans le
        Le<i>fff</i></title>
        <author>
          <persName key="alpage-2008-idm542378767840">
            <foreName>Laurence</foreName>
            <surname>Danlos</surname>
            <initial>L.</initial>
          </persName>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" x-proceedings="yes">
        <title level="j">Linguisticæ Investigationes</title>
        <imprint>
          <biblScope type="volume">32</biblScope>
          <biblScope type="number">2</biblScope>
          <dateStruct>
            <year>2009</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid38" type="inproceedings" rend="refer" n="refercite:naaclDenisB07">
      <analytic>
        <title level="a">Joint Determination of Anaphoricity and
        Coreference Resolution using Integer Programming</title>
        <author>
          <persName key="alpage-2008-idm542378764240">
            <foreName>Pascal</foreName>
            <surname>Denis</surname>
            <initial>P.</initial>
          </persName>
          <persName>
            <foreName>Jason</foreName>
            <surname>Baldridge</surname>
            <initial>J.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes">
        <title level="m">HLT-NAACL</title>
        <imprint>
          <dateStruct>
            <year>2007</year>
          </dateStruct>
          <biblScope type="pages">236-243</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid29" type="article" rend="refer" n="refercite:TAL08:sxpipe">
      <analytic>
        <title level="a">SxPipe 2: architecture pour le traitement
        présyntaxique de corpus bruts</title>
        <author>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
          <persName key="atoll-2006-idm57727947600">
            <foreName>Pierre</foreName>
            <surname>Boullier</surname>
            <initial>P.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" x-proceedings="yes">
        <title level="j">Traitement Automatique des Langues
        (T.A.L.)</title>
        <imprint>
          <biblScope type="volume">49</biblScope>
          <biblScope type="number">2</biblScope>
          <dateStruct>
            <year>2008</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid20" type="inproceedings" rend="refer" n="refercite:ACL06:em">
      <analytic>
        <title level="a">Error Mining in Parsing Results</title>
        <author>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
          <persName key="alpage-2009-idm402038308688">
            <foreName>Éric</foreName>
            <surname>Villemonte de La Clergerie</surname>
            <initial>É.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" x-proceedings="yes">
        <title level="m">Proceedings of the 21st International
        Conference on Computational Linguistics and 44th Annual
        Meeting of the Association for Computational
        Linguistics</title>
        <loc>Sydney, Australia</loc>
        <imprint>
          <publisher>
            <orgName>Association for Computational
            Linguistics</orgName>
          </publisher>
          <dateStruct>
            <month>July</month>
            <year>2006</year>
          </dateStruct>
          <biblScope type="pages">329–336</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid15" type="inproceedings" rend="refer" n="refercite:seddah:09c">
      <analytic>
        <title level="a">Cross Parser Evaluation and Tagset
        Variation: a French Treebank Study</title>
        <author>
          <persName key="alpage-2008-idm542378729584">
            <foreName>Djamé</foreName>
            <surname>Seddah</surname>
            <initial>D.</initial>
          </persName>
          <persName key="alpage-2008-idm542378777200">
            <foreName>Marie</foreName>
            <surname>Candito</surname>
            <initial>M.</initial>
          </persName>
          <persName key="alpage-2008-idm542378770960">
            <foreName>Benoît</foreName>
            <surname>Crabbé</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Proceedings of the 11th International
        Conference on Parsing Technologies (IWPT'09)</title>
        <loc>Paris, France</loc>
        <imprint>
          <dateStruct>
            <year>2009</year>
          </dateStruct>
          <biblScope type="pages">150-161</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid110" type="inproceedings" rend="refer" n="refercite:MG:IWPT05">
      <analytic>
        <title level="a">From Metagrammars to Factorized TAG/TIG
        Parsers</title>
        <author>
          <persName key="alpage-2009-idm402038308688">
            <foreName>Éric</foreName>
            <surname>Villemonte de La Clergerie</surname>
            <initial>É.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" x-proceedings="yes">
        <title level="m">Proceedings of IWPT'05</title>
        <loc>Vancouver, Canada</loc>
        <imprint>
          <dateStruct>
            <month>October</month>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">190–191</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="5874" id="alpage-2010-bid106" type="proceedings" rend="year" n="cite:seddah:2010:inria-00525752:1">
      <identifiant type="hal" value="inria-00525752"/>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Proceedings of the NAACL HLT 2010 First
        Workshop on Statistical Parsing of Morphologically-Rich
        Languages</title>
        <imprint>
          <publisher>
            <orgName>Association for Computational
            Linguistics</orgName>
          </publisher>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <biblScope type="pages">113</biblScope>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00525752/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00525752/ 
          <allowbreak/>en</ref>
        </imprint>
      </monogr>
      <affiliation>
        <country>SE</country>
        <country>IN</country>
      </affiliation>
    </biblStruct>
    <biblStruct dedoublkey="2115" id="alpage-2010-bid104" type="incollection" rend="year" n="cite:boullier:2010:inria-00516341:1">
      <identifiant type="hal" value="inria-00516341"/>
      <analytic>
        <title level="a">Are Very Large Context-Free Grammars
        Tractable?</title>
        <author>
          <persName key="atoll-2006-idm57727947600">
            <foreName>Pierre</foreName>
            <surname>Boullier</surname>
            <initial>P.</initial>
          </persName>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes/no">
        <editor role="editor">
          <persName>
            <foreName>Harry</foreName>
            <surname>Bunt</surname>
            <initial>H.</initial>
          </persName>
          <persName>
            <foreName>Paola</foreName>
            <surname>Merlo</surname>
            <initial>P.</initial>
          </persName>
          <persName>
            <foreName>Joakim</foreName>
            <surname>Nivre</surname>
            <initial>J.</initial>
          </persName>
        </editor>
        <title level="m">Trends in Parsing Technology</title>
        <title level="s">Text, Speech and Language
        Technology</title>
        <imprint>
          <biblScope type="volume">43</biblScope>
          <publisher>
            <orgName>Springer</orgName>
          </publisher>
          <dateStruct>
            <month>Oct</month>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00516341/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00516341/ 
          <allowbreak/>en</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="2163" id="alpage-2010-bid105" type="incollection" rend="year" n="cite:danlos:2010:inria-00524746:1">
      <identifiant type="hal" value="inria-00524746"/>
      <analytic>
        <title level="a">Extension de la notion de verbe
        support</title>
        <author>
          <persName key="alpage-2008-idm542378767840">
            <foreName>Laurence</foreName>
            <surname>Danlos</surname>
            <initial>L.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes/no">
        <editor role="editor">
          <persName>
            <foreName>Takuya</foreName>
            <surname>Nakamura</surname>
            <initial>T.</initial>
          </persName>
          <persName>
            <foreName>Éric</foreName>
            <surname>Laporte</surname>
            <initial>É.</initial>
          </persName>
          <persName>
            <foreName>Anne</foreName>
            <surname>Dister</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>Cédric</foreName>
            <surname>Fairon</surname>
            <initial>C.</initial>
          </persName>
        </editor>
        <title level="m">Les Tables, La grammaire par le menu,
        Volume d'hommage à Christian Leclère</title>
        <imprint>
          <publisher>
            <orgName>Presses Universitaires de Louvain</orgName>
          </publisher>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <biblScope type="pages">81–90</biblScope>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00524746/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00524746/ 
          <allowbreak/>en</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="0614" id="alpage-2010-bid41" type="article" rend="year" n="cite:danlos:2010:inria-00511267:1">
      <identifiant type="hal" value="inria-00511267"/>
      <analytic>
        <title level="a">Écriture automatique</title>
        <author>
          <persName key="alpage-2008-idm542378767840">
            <foreName>Laurence</foreName>
            <surname>Danlos</surname>
            <initial>L.</initial>
          </persName>
        </author>
      </analytic>
      <monogr id="rid01414" x-scientific-popularization="yes" x-editorial-board="yes" x-international-audience="no">
        <title level="j">La Recherche. Les Cahiers de
        l'Inria</title>
        <imprint>
          <biblScope type="number">443 Juillet-Août
          2010</biblScope>
          <dateStruct>
            <month>Jul</month>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00511267/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00511267/ 
          <allowbreak/>en</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="0032" id="alpage-2010-bid107" type="article" rend="year" n="cite:messiant:2010:hal-00538752:1">
      <identifiant type="hal" value="hal-00538752"/>
      <analytic>
        <title level="a">Acquisition de connaissances lexicales à
        partir de corpus : la sous-catégorisation verbale en
        français</title>
        <author>
          <persName>
            <foreName>Cédric</foreName>
            <surname>Messiant</surname>
            <initial>C.</initial>
          </persName>
          <persName key="alpage-2010-idm152476259776">
            <foreName>Kata</foreName>
            <surname>Gábor</surname>
            <initial>K.</initial>
          </persName>
          <persName>
            <foreName>Thierry</foreName>
            <surname>Poibeau</surname>
            <initial>T.</initial>
          </persName>
        </author>
      </analytic>
      <monogr id="rid01924" x-editorial-board="yes" x-international-audience="yes">
        <title level="j">Traitement Automatique des Langues
        (T.A.L.)</title>
        <imprint>
          <biblScope type="volume">51</biblScope>
          <biblScope type="number">1</biblScope>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <biblScope type="pages">65–96</biblScope>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/hal-00538752/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>hal-00538752/ 
          <allowbreak/>en</ref>
        </imprint>
      </monogr>
      <affiliation>
        <country>HU</country>
      </affiliation>
    </biblStruct>
    <biblStruct dedoublkey="5154" subtype="nonparu" id="alpage-2010-bid69" type="inproceedings" rend="year" n="cite:adam:2010:inria-00511605:1">
      <analytic>
        <title level="a">Une évaluation de l'impact des types de
        textes sur la tâche de segmentation thématique</title>
        <author>
          <persName>
            <foreName>Clémentine</foreName>
            <surname>Adam</surname>
            <initial>C.</initial>
          </persName>
          <persName key="alpage-2009-idm402038296432">
            <foreName>Philippe</foreName>
            <surname>Muller</surname>
            <initial>P.</initial>
          </persName>
          <persName>
            <foreName>Cécile</foreName>
            <surname>Fabre</surname>
            <initial>C.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Traitement Automatique des Langues
        Naturelles - TALN 2010</title>
        <loc>Montréal, Canada</loc>
        <imprint>
          <publisher>
            <orgName type="organisation">Association pour le
            Traitement Automatique des Langues</orgName>
          </publisher>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://www.iro.umontreal.ca/~felipe/TALN2010/Xml/Papers/all/taln2010_submission_60.pdf" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>www. 
          <allowbreak/>iro. 
          <allowbreak/>umontreal. 
          <allowbreak/>ca/ 
          <allowbreak/>~felipe/ 
          <allowbreak/>TALN2010/ 
          <allowbreak/>Xml/ 
          <allowbreak/>Papers/ 
          <allowbreak/>all/ 
          <allowbreak/>taln2010_submission_60. 
          <allowbreak/>pdf</ref>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00511605/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00511605/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid50084">
          <title>Conférence Annuelle sur le Traitement Automatique des Langues Naturelles</title>
          <num>17</num>
          <abbr type="sigle">TALN</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="3902" id="alpage-2010-bid68" type="inproceedings" rend="year" n="cite:afantenos:2010:hal-00468210:1">
      <identifiant type="hal" value="hal-00468210"/>
      <analytic>
        <title level="a">Learning Recursive Segments for Discourse
        Parsing</title>
        <author>
          <persName>
            <foreName>Stergos</foreName>
            <surname>Afantenos</surname>
            <initial>S.</initial>
          </persName>
          <persName key="alpage-2008-idm542378764240">
            <foreName>Pascal</foreName>
            <surname>Denis</surname>
            <initial>P.</initial>
          </persName>
          <persName key="alpage-2009-idm402038296432">
            <foreName>Philippe</foreName>
            <surname>Muller</surname>
            <initial>P.</initial>
          </persName>
          <persName key="alpage-2008-idm542378767840">
            <foreName>Laurence</foreName>
            <surname>Danlos</surname>
            <initial>L.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <editor role="editor">
          <persName>
            <foreName>Nicoletta</foreName>
            <surname>Calzolari</surname>
            <initial>N.</initial>
          </persName>
          <persName>
            <foreName>Khalid</foreName>
            <surname>Choukri</surname>
            <initial>K.</initial>
          </persName>
          <persName>
            <foreName>Bente</foreName>
            <surname>Maegaard</surname>
            <initial>B.</initial>
          </persName>
          <persName>
            <foreName>Joseph</foreName>
            <surname>Mariani</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Jan</foreName>
            <surname>Odijk</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Stelios</foreName>
            <surname>Piperidis</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Mike</foreName>
            <surname>Rosner</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>Daniel</foreName>
            <surname>Tapias</surname>
            <initial>D.</initial>
          </persName>
        </editor>
        <title level="m">Language Resources and Evaluation</title>
        <loc>Malte La Valette</loc>
        <imprint>
          <publisher>
            <orgName>European Language Resources Association
            (ELRA)</orgName>
          </publisher>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/hal-00468210/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>hal-00468210/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid289398">
          <title>International Conference on Language Resources and Evaluation</title>
          <num>7</num>
          <abbr type="sigle">LREC</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="2604" id="alpage-2010-bid98" type="inproceedings" rend="year" n="cite:bittar:2010:inria-00522315:1">
      <identifiant type="hal" value="inria-00522315"/>
      <analytic>
        <title level="a">Annotation of Events and Temporal
        Expressions in French Texts</title>
        <author>
          <persName key="alpage-2008-idm542378786864">
            <foreName>André</foreName>
            <surname>Bittar</surname>
            <initial>A.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Computational Linguistics in the
        Netherlands 19</title>
        <loc>Pays-Bas Groningen</loc>
        <imprint>
          <dateStruct>
            <month>Feb</month>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00522315/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00522315/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid353687">
          <title>Meeting of Computational Linguistics in The Netherlands</title>
          <num>20</num>
          <abbr type="sigle">CLIN</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="5106" id="alpage-2010-bid94" type="inproceedings" rend="year" n="cite:blancafortsanjose:2010:inria-00521237:1">
      <identifiant type="hal" value="inria-00521237"/>
      <analytic>
        <title level="a">Traitement des inconnus : une approche
        systématique de l'incomplétude lexicale</title>
        <author>
          <persName>
            <foreName>Helena</foreName>
            <surname>Blancafort San José</surname>
            <initial>H.</initial>
          </persName>
          <persName key="alpage-2009-idm402038293216">
            <foreName>Gaëlle</foreName>
            <surname>Recourcé</surname>
            <initial>G.</initial>
          </persName>
          <persName>
            <foreName>Javier</foreName>
            <surname>Couto</surname>
            <initial>J.</initial>
          </persName>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
          <persName key="alpage-2009-idm402038280912">
            <foreName>Rosa</foreName>
            <surname>Stern</surname>
            <initial>R.</initial>
          </persName>
          <persName>
            <foreName>Denis</foreName>
            <surname>Teyssou</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Traitement Automatique des Langues
        Naturelles : TALN 2010</title>
        <loc>Canada Montréal</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00521237/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00521237/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid50084">
          <title>Conférence Annuelle sur le Traitement Automatique des Langues Naturelles</title>
          <num>17</num>
          <abbr type="sigle">TALN</abbr>
        </meeting>
      </monogr>
      <affiliation>
        <country>ES</country>
      </affiliation>
    </biblStruct>
    <biblStruct dedoublkey="4964" subtype="nonparu" id="alpage-2010-bid77" type="inproceedings" rend="year" n="cite:boruta:11">
      <analytic>
        <title level="a">Testing the Robustness of Online Word
        Segmentation: Effects of Linguistic Diversity and Phonetic
        Variation</title>
        <author>
          <persName key="alpage-2009-idm402038353920">
            <foreName>Luc</foreName>
            <surname>Boruta</surname>
            <initial>L.</initial>
          </persName>
          <persName>
            <foreName>Sharon</foreName>
            <surname>Peperkamp</surname>
            <initial>S.</initial>
          </persName>
          <persName key="alpage-2008-idm542378770960">
            <foreName>Benoît</foreName>
            <surname>Crabbé</surname>
            <initial>B.</initial>
          </persName>
          <persName>
            <foreName>Emmanuel</foreName>
            <surname>Dupoux</surname>
            <initial>E.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Proceedings of CogSci 2011</title>
        <imprint>
          <dateStruct>
            <year>2011</year>
          </dateStruct>
        </imprint>
        <meeting id="cid388165">
          <title>Annual Conference of the Cognitive Science Society</title>
          <num>33</num>
          <abbr type="sigle">COGSCI</abbr>
        </meeting>
      </monogr>
      <note type="bnote">submitted</note>
    </biblStruct>
    <biblStruct dedoublkey="4876" id="alpage-2010-bid54" type="inproceedings" rend="year" n="cite:candito:2010:hal-00495196:1">
      <identifiant type="hal" value="hal-00495196"/>
      <analytic>
        <title level="a">Statistical French dependency parsing:
        treebank conversion and first results</title>
        <author>
          <persName key="alpage-2008-idm542378777200">
            <foreName>Marie</foreName>
            <surname>Candito</surname>
            <initial>M.</initial>
          </persName>
          <persName key="alpage-2008-idm542378770960">
            <foreName>Benoît</foreName>
            <surname>Crabbé</surname>
            <initial>B.</initial>
          </persName>
          <persName key="alpage-2008-idm542378764240">
            <foreName>Pascal</foreName>
            <surname>Denis</surname>
            <initial>P.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Seventh International Conference on
        Language Resources and Evaluation - LREC 2010</title>
        <loc>Malte La Valette</loc>
        <imprint>
          <publisher>
            <orgName>European Language Resources Association
            (ELRA)</orgName>
          </publisher>
          <dateStruct>
            <month>May</month>
            <year>2010</year>
          </dateStruct>
          <biblScope type="pages">1840-1847</biblScope>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/hal-00495196/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>hal-00495196/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid289398">
          <title>International Conference on Language Resources and Evaluation</title>
          <num>7</num>
          <abbr type="sigle">LREC</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="2834" id="alpage-2010-bid60" type="inproceedings" rend="year" n="cite:candito:2010:hal-00514815:1">
      <identifiant type="hal" value="hal-00514815"/>
      <analytic>
        <title level="a">Benchmarking of Statistical Dependency
        Parsers for French</title>
        <author>
          <persName key="alpage-2008-idm542378777200">
            <foreName>Marie</foreName>
            <surname>Candito</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>Joakim</foreName>
            <surname>Nivre</surname>
            <initial>J.</initial>
          </persName>
          <persName key="alpage-2008-idm542378764240">
            <foreName>Pascal</foreName>
            <surname>Denis</surname>
            <initial>P.</initial>
          </persName>
          <persName key="alpage-2009-idm402038316144">
            <foreName>Enrique</foreName>
            <surname>Henestroza Anguiano</surname>
            <initial>E.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">23rd International Conference on
        Computational Linguistics - COLING 2010</title>
        <loc>Chine Beijing</loc>
        <imprint>
          <publisher>
            <orgName>Coling 2010 Organizing Committee</orgName>
          </publisher>
          <dateStruct>
            <month>Aug</month>
            <year>2010</year>
          </dateStruct>
          <biblScope type="pages">108-116</biblScope>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/hal-00514815/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>hal-00514815/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid115519">
          <title>International Conference on Computational Linguistics</title>
          <num>23</num>
          <abbr type="sigle">COLING</abbr>
        </meeting>
      </monogr>
      <note type="bnote">9 pages</note>
      <affiliation>
        <country>SE</country>
      </affiliation>
    </biblStruct>
    <biblStruct dedoublkey="4401" id="alpage-2010-bid58" type="inproceedings" rend="year" n="cite:candito:2010:hal-00495177:1">
      <identifiant type="hal" value="hal-00495177"/>
      <analytic>
        <title level="a">Parsing word clusters</title>
        <author>
          <persName key="alpage-2008-idm542378777200">
            <foreName>Marie</foreName>
            <surname>Candito</surname>
            <initial>M.</initial>
          </persName>
          <persName key="alpage-2008-idm542378729584">
            <foreName>Djamé</foreName>
            <surname>Seddah</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">NAACL/HLT-2010 Workshop on Statistical
        Parsing of Morphologically Rich Languages - SPMRL
        2010</title>
        <loc>États-Unis Los Angeles</loc>
        <imprint>
          <publisher>
            <orgName type="organisation">Association for
            Computational Linguistics</orgName>
          </publisher>
          <dateStruct>
            <month>Jun</month>
            <year>2010</year>
          </dateStruct>
          <biblScope type="pages">76-84</biblScope>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/hal-00495177/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>hal-00495177/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid388128">
          <title>Workshop on Statistical Parsing of Morphologically Rich Languages</title>
          <num>1</num>
          <abbr type="sigle">SPMRL</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="4463" id="alpage-2010-bid71" type="inproceedings" rend="year" n="cite:danlos:2010:inria-00521235:1">
      <identifiant type="hal" value="inria-00521235"/>
      <analytic>
        <title level="a">Ponctuations fortes abusives</title>
        <author>
          <persName key="alpage-2008-idm542378767840">
            <foreName>Laurence</foreName>
            <surname>Danlos</surname>
            <initial>L.</initial>
          </persName>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Traitement Automatique des Langues
        Naturelles : TALN 2010</title>
        <loc>Canada Montréal</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00521235/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00521235/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid50084">
          <title>Conférence Annuelle sur le Traitement Automatique des Langues Naturelles</title>
          <num>17</num>
          <abbr type="sigle">TALN</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="2512" id="alpage-2010-bid83" type="inproceedings" rend="year" n="cite:danlos:2010:inria-00511397:1">
      <identifiant type="hal" value="inria-00511397"/>
      <analytic>
        <title level="a">Analyse discursive des incises de
        citation</title>
        <author>
          <persName key="alpage-2008-idm542378767840">
            <foreName>Laurence</foreName>
            <surname>Danlos</surname>
            <initial>L.</initial>
          </persName>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
          <persName key="alpage-2009-idm402038280912">
            <foreName>Rosa</foreName>
            <surname>Stern</surname>
            <initial>R.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">2ème Congrès Mondial de Linguistique
        Française - CMLF 2010</title>
        <loc>États-Unis La Nouvelle Orléans</loc>
        <imprint>
          <publisher>
            <orgName type="organisation">Institut de Linguistique
            Française</orgName>
          </publisher>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00511397/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00511397/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid55237">
          <title>Congrès Mondial de Linguistique Française</title>
          <num>2</num>
          <abbr type="sigle">CMLF</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="2995" id="alpage-2010-bid67" type="inproceedings" rend="year" n="cite:denis:2010:inria-00511586:1">
      <analytic>
        <title level="a">Comparison of different algebras for
        inducing the temporal structure of texts</title>
        <author>
          <persName key="alpage-2008-idm542378764240">
            <foreName>Pascal</foreName>
            <surname>Denis</surname>
            <initial>P.</initial>
          </persName>
          <persName key="alpage-2009-idm402038296432">
            <foreName>Philippe</foreName>
            <surname>Muller</surname>
            <initial>P.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <editor role="editor">
          <persName>
            <foreName/>
            <surname>Coling 2010 Organizing Committee</surname>
            <initial/>
          </persName>
        </editor>
        <title level="m">Proceedings of the 23rd International
        Conference on Computational Linguistics - Coling
        2010</title>
        <loc>Chine Beijing</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <biblScope type="pages">250-258</biblScope>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://www.aclweb.org/anthology/C10-1029.pdf" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>www. 
          <allowbreak/>aclweb. 
          <allowbreak/>org/ 
          <allowbreak/>anthology/ 
          <allowbreak/>C10-1029. 
          <allowbreak/>pdf</ref>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00511586/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00511586/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid115519">
          <title>International Conference on Computational Linguistics</title>
          <num>23</num>
          <abbr type="sigle">COLING</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="3453" id="alpage-2010-bid85" type="inproceedings" rend="year" n="cite:denis:2010:inria-00514364:1">
      <identifiant type="hal" value="inria-00514364"/>
      <analytic>
        <title level="a">Exploitation d'une ressource lexicale pour
        la construction d'un étiqueteur morpho-syntaxique
        état-de-l'art du français</title>
        <author>
          <persName key="alpage-2008-idm542378764240">
            <foreName>Pascal</foreName>
            <surname>Denis</surname>
            <initial>P.</initial>
          </persName>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Traitement automatique des langues
        naturelles</title>
        <loc>Canada Montréal</loc>
        <imprint>
          <publisher>
            <orgName type="organisation">Association pour le
            Traitement Automatique des Langues</orgName>
          </publisher>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00514364/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00514364/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid50084">
          <title>Conférence Annuelle sur le Traitement Automatique des Langues Naturelles</title>
          <num>17</num>
          <abbr type="sigle">TALN</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="3453" id="alpage-2010-bid92" type="inproceedings" rend="year" n="cite:denis:2010:inria-00521231:1">
      <identifiant type="hal" value="inria-00521231"/>
      <analytic>
        <title level="a">Exploitation d'une ressource lexicale pour
        la construction d'un étiqueteur morphosyntaxique
        état-de-l'art du français</title>
        <author>
          <persName key="alpage-2008-idm542378764240">
            <foreName>Pascal</foreName>
            <surname>Denis</surname>
            <initial>P.</initial>
          </persName>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Traitement Automatique des Langues
        Naturelles : TALN 2010</title>
        <loc>Canada Montréal</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00521231/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00521231/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid50084">
          <title>Conférence Annuelle sur le Traitement Automatique des Langues Naturelles</title>
          <num>17</num>
          <abbr type="sigle">TALN</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="3794" id="alpage-2010-bid80" type="inproceedings" rend="year" n="cite:fort:2010:hal-00484294:1">
      <identifiant type="hal" value="hal-00484294"/>
      <analytic>
        <title level="a">Influence of Pre-annotation on POS-tagged
        Corpus Development</title>
        <author>
          <persName key="calligramme-2006-idm133559948416">
            <foreName>Karën</foreName>
            <surname>Fort</surname>
            <initial>K.</initial>
          </persName>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">The Fourth ACL Linguistic Annotation
        Workshop</title>
        <loc>Suède Uppsala</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/hal-00484294/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>hal-00484294/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid351579">
          <title>Linguistic Annotation Workshop</title>
          <num>4</num>
          <abbr type="sigle">LAW</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="4481" id="alpage-2010-bid86" type="inproceedings" rend="year" n="cite:fox:2010:inria-00515393:1">
      <analytic>
        <title level="a">Predicting the Position of Attributive
        Adjectives in the French NP</title>
        <author>
          <persName>
            <foreName>Gwendoline</foreName>
            <surname>Fox</surname>
            <initial>G.</initial>
          </persName>
          <persName key="alpage-2009-idm402038273904">
            <foreName>Juliette</foreName>
            <surname>Thuilier</surname>
            <initial>J.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <editor role="editor">
          <persName>
            <foreName>Marija</foreName>
            <surname>Slavkovik</surname>
            <initial>M.</initial>
          </persName>
        </editor>
        <title level="m">Student session of the European Summer
        School for Logic, Language and Information</title>
        <loc>Danemark Copenhague</loc>
        <imprint>
          <publisher>
            <orgName type="organisation">Marija Slavkovik</orgName>
          </publisher>
          <dateStruct>
            <month>Sep</month>
            <year>2010</year>
          </dateStruct>
          <biblScope type="pages">173-183</biblScope>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://marija.gforge.uni.lu/proceedings.pdf" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>marija. 
          <allowbreak/>gforge. 
          <allowbreak/>uni. 
          <allowbreak/>lu/ 
          <allowbreak/>proceedings. 
          <allowbreak/>pdf</ref>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00515393/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00515393/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid70768">
          <title>European Summer School in Logic, Language and Information</title>
          <num>22</num>
          <abbr type="sigle">ESSLLI</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="2979" subtype="nonparu" id="alpage-2010-bid84" type="inproceedings" rend="year" n="cite:muller:2010:inria-00511599:1">
      <analytic>
        <title level="a">Comparaison de ressources lexicales pour
        l'extraction de synonymes</title>
        <author>
          <persName key="alpage-2009-idm402038296432">
            <foreName>Philippe</foreName>
            <surname>Muller</surname>
            <initial>P.</initial>
          </persName>
          <persName>
            <foreName>Philippe</foreName>
            <surname>Langlais</surname>
            <initial>P.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Traitement Automatique des Langues
        Naturelles - TALN 2010</title>
        <loc>Canada Montréal</loc>
        <imprint>
          <publisher>
            <orgName type="organisation">Association pour le
            Traitement Automatique des Langues</orgName>
          </publisher>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://www.iro.umontreal.ca/~felipe/TALN2010/Xml/Papers/all/taln2010_submission_124.pdf" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>www. 
          <allowbreak/>iro. 
          <allowbreak/>umontreal. 
          <allowbreak/>ca/ 
          <allowbreak/>~felipe/ 
          <allowbreak/>TALN2010/ 
          <allowbreak/>Xml/ 
          <allowbreak/>Papers/ 
          <allowbreak/>all/ 
          <allowbreak/>taln2010_submission_124. 
          <allowbreak/>pdf</ref>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00511599/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00511599/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid50084">
          <title>Conférence Annuelle sur le Traitement Automatique des Langues Naturelles</title>
          <num>17</num>
          <abbr type="sigle">TALN</abbr>
        </meeting>
      </monogr>
      <note type="bnote">papier court</note>
      <affiliation>
        <country>CA</country>
      </affiliation>
    </biblStruct>
    <biblStruct dedoublkey="3477" id="alpage-2010-bid81" type="inproceedings" rend="year" n="cite:nakamuradelloye:2010:hal-00511481:1">
      <identifiant type="hal" value="hal-00511481"/>
      <analytic>
        <title level="a">Extraction des chemins entre deux entités
        nommées en vue de l'acquisition des patrons de
        relations</title>
        <author>
          <persName key="alpage-2010-idm152476230416">
            <foreName>Yayoi</foreName>
            <surname>Nakamura-Delloye</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">21es Journées francophones d'Ingénierie
        des Connaissances - IC2010</title>
        <loc>France Nîmes</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <biblScope type="pages">P120_Poster62</biblScope>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/hal-00511481/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>hal-00511481/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid344524">
          <title>Journées Francophones d'Ingénierie des Connaissances</title>
          <num>21</num>
          <abbr type="sigle">IC</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="4907" id="alpage-2010-bid101" type="inproceedings" rend="year" n="cite:nakamuradelloye:2010:hal-00540541:1">
      <identifiant type="hal" value="hal-00540541"/>
      <analytic>
        <title level="a">Subordonnants japonais : réflexion sur les
        caractères substantifs des mots</title>
        <author>
          <persName key="alpage-2010-idm152476230416">
            <foreName>Yayoi</foreName>
            <surname>Nakamura-Delloye</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="no" x-proceedings="no">
        <title level="m">Colloque international Morphologie,
        syntaxe et sémantique des subordonnants</title>
        <loc>France Clermont-Ferrand</loc>
        <imprint>
          <dateStruct>
            <month>Mar</month>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/hal-00540541/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>hal-00540541/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid388065">
          <title>Colloque International Morphologie, Syntaxe et Sémantique des Subordonnants</title>
          <num>2010</num>
          <abbr type="sigle"/>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="3411" id="alpage-2010-bid103" type="inproceedings" rend="year" n="cite:nakamuradelloye:2010:hal-00540543:1">
      <identifiant type="hal" value="hal-00540543"/>
      <analytic>
        <title level="a">Étude contrastive français-japonais :
        comportements syntaxiques des interrogatifs et
        indéfinis</title>
        <author>
          <persName key="alpage-2010-idm152476230416">
            <foreName>Yayoi</foreName>
            <surname>Nakamura-Delloye</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="no" x-proceedings="no">
        <title level="m">Neuvième colloque de la société française
        des études japonaises</title>
        <loc>France Paris</loc>
        <imprint>
          <dateStruct>
            <month>Dec</month>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/hal-00540543/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>hal-00540543/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid388323">
          <title>Colloque de la Société Française d'Etudes Japonaises</title>
          <num>9</num>
          <abbr type="sigle"/>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="3414" id="alpage-2010-bid102" type="inproceedings" rend="year" n="cite:nakamuradelloye:2010:hal-00540542:1">
      <identifiant type="hal" value="hal-00540542"/>
      <analytic>
        <title level="a">Étude sur les connecteurs syntaxiques
        inter-propositionnels du japonais : définition et
        catégorisation</title>
        <author>
          <persName key="alpage-2010-idm152476230416">
            <foreName>Yayoi</foreName>
            <surname>Nakamura-Delloye</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="no" x-proceedings="no">
        <title level="m">XXIIIèmes Journées de Linguistique d'Asie
        Orientale</title>
        <loc>France Paris</loc>
        <imprint>
          <dateStruct>
            <month>Jul</month>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/hal-00540542/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>hal-00540542/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid388260">
          <title>Journées de Linguistique d'Asie Orientale</title>
          <num>23</num>
          <abbr type="sigle">JLAO</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="3451" subtype="nonparu" id="alpage-2010-bid82" type="inproceedings" rend="year" n="cite:nakamuradelloye:2010:hal-00511541:1">
      <identifiant type="hal" value="hal-00511541"/>
      <analytic>
        <title level="a">Exploitation de résultats d'analyse
        syntaxique pour extraction semi-supervisée des chemins de
        relations</title>
        <author>
          <persName key="alpage-2010-idm152476230416">
            <foreName>Yayoi</foreName>
            <surname>Nakamura-Delloye</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="alpage-2009-idm402038308688">
            <foreName>Éric</foreName>
            <surname>Villemonte de La Clergerie</surname>
            <initial>É.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">17e Conférence sur le Traitement
        Automatique des Langues Naturelles - TALN 2010</title>
        <loc>Canada Montréal</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <biblScope type="pages">taln2010_submission_164</biblScope>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/hal-00511541/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>hal-00511541/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid50084">
          <title>Conférence Annuelle sur le Traitement Automatique des Langues Naturelles</title>
          <num>17</num>
          <abbr type="sigle">TALN</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="3123" id="alpage-2010-bid96" type="inproceedings" rend="year" n="cite:nicolas:2010:inria-00521241:1">
      <identifiant type="hal" value="inria-00521241"/>
      <analytic>
        <title level="a">Creating and maintaining language
        resources: the main guidelines of the Victoria
        project</title>
        <author>
          <persName key="atoll-2006-idm57727902672">
            <foreName>Lionel</foreName>
            <surname>Nicolas</surname>
            <initial>L.</initial>
          </persName>
          <persName>
            <foreName>Miguel</foreName>
            <surname>Molinero</surname>
            <initial>M.</initial>
          </persName>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
          <persName>
            <foreName>Nieves</foreName>
            <surname>Fernández Formoso</surname>
            <initial>N.</initial>
          </persName>
          <persName>
            <foreName>Vanesa</foreName>
            <surname>Vidal Castro</surname>
            <initial>V.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Workshop on Language Resources: From
        Storyboard to Sustainability and LR Lifecycle Management
        (LREC 2010 workshop)</title>
        <loc>Malte Valletta</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00521241/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00521241/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid388227">
          <title>Workshop on Language Resources: From Storyboard to Sustainability and LR Lifecycle Management</title>
          <num>2010</num>
          <abbr type="sigle">LRSLM</abbr>
        </meeting>
      </monogr>
      <affiliation>
        <country>ES</country>
      </affiliation>
    </biblStruct>
    <biblStruct dedoublkey="3914" id="alpage-2010-bid70" type="inproceedings" rend="year" n="cite:roze:2010:inria-00511615:1">
      <identifiant type="hal" value="inria-00511615"/>
      <analytic>
        <title level="a">LEXCONN: a French Lexicon of Discourse
        Connectives</title>
        <author>
          <persName key="alpage-2009-idm402038290176">
            <foreName>Charlotte</foreName>
            <surname>Roze</surname>
            <initial>C.</initial>
          </persName>
          <persName key="alpage-2008-idm542378767840">
            <foreName>Laurence</foreName>
            <surname>Danlos</surname>
            <initial>L.</initial>
          </persName>
          <persName key="alpage-2009-idm402038296432">
            <foreName>Philippe</foreName>
            <surname>Muller</surname>
            <initial>P.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Multidisciplinary Approaches to Discourse
        - MAD 2010</title>
        <loc>France Moissac</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://w3.workshop-mad2010.univ-tlse2.fr/MAD_files/papers/RozeDanlosMuller.pdf" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>w3. 
          <allowbreak/>workshop-mad2010. 
          <allowbreak/>univ-tlse2. 
          <allowbreak/>fr/ 
          <allowbreak/>MAD_files/ 
          <allowbreak/>papers/ 
          <allowbreak/>RozeDanlosMuller. 
          <allowbreak/>pdf</ref>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00511615/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00511615/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid329870">
          <title>International Workshop on Multidisciplinary Approaches to Discourse</title>
          <num>8</num>
          <abbr type="sigle">MAD</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="5232" id="alpage-2010-bid90" type="inproceedings" rend="year" n="cite:sagot:2010:inria-00521229:1">
      <identifiant type="hal" value="inria-00521229"/>
      <analytic>
        <title level="a">Verbes de citation et Tables du
        Lexique-Grammaire</title>
        <author>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
          <persName key="alpage-2008-idm542378767840">
            <foreName>Laurence</foreName>
            <surname>Danlos</surname>
            <initial>L.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">International Conference on Lexis and
        Grammar</title>
        <loc>Serbie Belgrade</loc>
        <imprint>
          <dateStruct>
            <month>Sep</month>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00521229/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00521229/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid42656">
          <title>Colloque international sur le Lexique et la Grammaire</title>
          <num>29</num>
          <abbr type="sigle">CLG</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="2447" id="alpage-2010-bid89" type="inproceedings" rend="year" n="cite:sagot:2010:inria-00515461:1">
      <identifiant type="hal" value="inria-00515461"/>
      <analytic>
        <title level="a">A Lexicon of French Quotation Verbs for
        Automatic Quotation Extraction</title>
        <author>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
          <persName key="alpage-2008-idm542378767840">
            <foreName>Laurence</foreName>
            <surname>Danlos</surname>
            <initial>L.</initial>
          </persName>
          <persName key="alpage-2009-idm402038280912">
            <foreName>Rosa</foreName>
            <surname>Stern</surname>
            <initial>R.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">7th international conference on Language
        Resources and Evaluation - LREC 2010</title>
        <loc>Malte Valletta</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00515461/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00515461/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid289398">
          <title>International Conference on Language Resources and Evaluation</title>
          <num>7</num>
          <abbr type="sigle">LREC</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="5003" id="alpage-2010-bid26" type="inproceedings" rend="year" n="cite:sagot:2010:inria-00521242:1">
      <identifiant type="hal" value="inria-00521242"/>
      <analytic>
        <title level="a">The Lefff, a freely available and
        large-coverage morphological and syntactic lexicon for
        French</title>
        <author>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">7th international conference on Language
        Resources and Evaluation (LREC 2010)</title>
        <loc>Malte Valletta</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00521242/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00521242/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid289398">
          <title>International Conference on Language Resources and Evaluation</title>
          <num>7</num>
          <abbr type="sigle">LREC</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="4337" id="alpage-2010-bid66" type="inproceedings" rend="year" n="cite:sagot:2010:inria-00515455:1">
      <identifiant type="hal" value="inria-00515455"/>
      <analytic>
        <title level="a">Optimal rank reduction for Linear
        Context-Free Rewriting Systems with Fan-Out Two</title>
        <author>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
          <persName key="alpage-2008-idm542378733072">
            <foreName>Giorgio</foreName>
            <surname>Satta</surname>
            <initial>G.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">48th Annual Meeting of the Association for
        Computational Linguistics - ACL 2010</title>
        <loc>Suède Uppsala</loc>
        <imprint>
          <dateStruct>
            <month>Jul</month>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00515455/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00515455/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid33303">
          <title>Annual Meeting of the Association for Computational Linguistics</title>
          <num>48</num>
          <abbr type="sigle">ACL</abbr>
        </meeting>
      </monogr>
      <affiliation>
        <country>IT</country>
      </affiliation>
    </biblStruct>
    <biblStruct dedoublkey="2488" id="alpage-2010-bid97" type="inproceedings" rend="year" n="cite:sagot:2010:inria-00521243:1">
      <identifiant type="hal" value="inria-00521243"/>
      <analytic>
        <title level="a">A morphological lexicon for the Persian
        language</title>
        <author>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
          <persName>
            <foreName>Géraldine</foreName>
            <surname>Walther</surname>
            <initial>G.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">7th international conference on Language
        Resources and Evaluation (LREC 2010)</title>
        <loc>Malte Valletta</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00521243/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00521243/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid289398">
          <title>International Conference on Language Resources and Evaluation</title>
          <num>7</num>
          <abbr type="sigle">LREC</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="3238" id="alpage-2010-bid73" type="inproceedings" rend="year" n="cite:sagot:2010:inria-00521233:1">
      <identifiant type="hal" value="inria-00521233"/>
      <analytic>
        <title level="a">Développement de ressources pour le
        persan: lexique morphologique et chaîne de traitements de
        surface</title>
        <author>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
          <persName>
            <foreName>Géraldine</foreName>
            <surname>Walther</surname>
            <initial>G.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Traitement Automatique des Langues
        Naturelles : TALN 2010</title>
        <loc>Canada Montréal</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00521233/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00521233/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid50084">
          <title>Conférence Annuelle sur le Traitement Automatique des Langues Naturelles</title>
          <num>17</num>
          <abbr type="sigle">TALN</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="3908" id="alpage-2010-bid57" type="inproceedings" rend="year" n="cite:seddah:2010:inria-00525754:1">
      <identifiant type="hal" value="inria-00525754"/>
      <analytic>
        <title level="a">Lemmatization and Statistical Lexicalized
        Parsing of Morphologically-Rich Languages</title>
        <author>
          <persName key="alpage-2008-idm542378729584">
            <foreName>Djamé</foreName>
            <surname>Seddah</surname>
            <initial>D.</initial>
          </persName>
          <persName>
            <foreName>Grzegorz</foreName>
            <surname>Chrupala</surname>
            <initial>G.</initial>
          </persName>
          <persName>
            <foreName>Özlem</foreName>
            <surname>Çetinoglu</surname>
            <initial>Ö.</initial>
          </persName>
          <persName>
            <foreName>Josef</foreName>
            <surname>van Genabith</surname>
            <initial>J.</initial>
          </persName>
          <persName key="alpage-2008-idm542378777200">
            <foreName>Marie</foreName>
            <surname>Candito</surname>
            <initial>M.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Proceedings of the NAACL/HLT Workshop on
        Statistical Parsing of Morphologically Rich Languages -
        SPMRL 2010</title>
        <loc>États-Unis Los Angeles, CA</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00525754/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00525754/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid388128">
          <title>Workshop on Statistical Parsing of Morphologically Rich Languages</title>
          <num>1</num>
          <abbr type="sigle">SPMRL</abbr>
        </meeting>
      </monogr>
      <affiliation>
        <country>IE</country>
      </affiliation>
    </biblStruct>
    <biblStruct dedoublkey="3094" id="alpage-2010-bid91" type="inproceedings" rend="year" n="cite:seddah:2010:inria-00521230:1">
      <identifiant type="hal" value="inria-00521230"/>
      <analytic>
        <title level="a">Control Verbs, Argument Cluster
        Coordination and MCTAG</title>
        <author>
          <persName key="alpage-2008-idm542378729584">
            <foreName>Djamé</foreName>
            <surname>Seddah</surname>
            <initial>D.</initial>
          </persName>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
          <persName key="alpage-2008-idm542378767840">
            <foreName>Laurence</foreName>
            <surname>Danlos</surname>
            <initial>L.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">10th International Conference on Tree
        Adjoining Grammars and Related Formalisms (TAG+10)</title>
        <loc>États-Unis New Haven</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00521230/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00521230/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid336728">
          <title>International Workshop on Tree Adjoining Grammars and Related Formalisms</title>
          <num>10</num>
          <abbr type="sigle">TAG</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="3463" id="alpage-2010-bid16" type="inproceedings" rend="year" n="cite:seddah:2010:inria-00525753:1">
      <identifiant type="hal" value="inria-00525753"/>
      <analytic>
        <title level="a">Exploring the Spinal-Stig Model for
        Parsing French</title>
        <author>
          <persName key="alpage-2008-idm542378729584">
            <foreName>Djamé</foreName>
            <surname>Seddah</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Proceedings of the 7th International
        Conference on Language Resources and Evaluation (LREC
        2010)</title>
        <loc>Malte Valletta</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00525753/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00525753/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid289398">
          <title>International Conference on Language Resources and Evaluation</title>
          <num>7</num>
          <abbr type="sigle">LREC</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="3225" id="alpage-2010-bid93" type="inproceedings" rend="year" n="cite:stern:2010:inria-00521234:1">
      <identifiant type="hal" value="inria-00521234"/>
      <analytic>
        <title level="a">Détection et résolution d'entités nommées
        dans des dépêches d'agence</title>
        <author>
          <persName key="alpage-2009-idm402038280912">
            <foreName>Rosa</foreName>
            <surname>Stern</surname>
            <initial>R.</initial>
          </persName>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Traitement Automatique des Langues
        Naturelles : TALN 2010</title>
        <loc>Canada Montréal</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00521234/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00521234/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid50084">
          <title>Conférence Annuelle sur le Traitement Automatique des Langues Naturelles</title>
          <num>17</num>
          <abbr type="sigle">TALN</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="4638" id="alpage-2010-bid95" type="inproceedings" rend="year" n="cite:stern:2010:inria-00521240:1">
      <identifiant type="hal" value="inria-00521240"/>
      <analytic>
        <title level="a">Resources for Named Entity Recognition and
        Resolution in News Wires</title>
        <author>
          <persName key="alpage-2009-idm402038280912">
            <foreName>Rosa</foreName>
            <surname>Stern</surname>
            <initial>R.</initial>
          </persName>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Entity 2010 Workshop at LREC 2010</title>
        <loc>Malte Valletta</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00521240/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00521240/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid379784">
          <title>Workshop on Methodologies and Resources for Processing Spatial Language</title>
          <num>2010</num>
          <abbr type="sigle">LREC</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="2649" id="alpage-2010-bid87" type="inproceedings" rend="year" n="cite:thuilier:2010:inria-00515411:1">
      <identifiant type="hal" value="inria-00515411"/>
      <analytic>
        <title level="a">Approche quantitative en syntaxe :
        l'exemple de l'alternance de position de l'adjectif
        épithète en français</title>
        <author>
          <persName key="alpage-2009-idm402038273904">
            <foreName>Juliette</foreName>
            <surname>Thuilier</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Gwendoline</foreName>
            <surname>Fox</surname>
            <initial>G.</initial>
          </persName>
          <persName key="alpage-2008-idm542378770960">
            <foreName>Benoît</foreName>
            <surname>Crabbé</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Traitement Automatique des Langues
        Naturelles</title>
        <loc>Canada Montréal</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00515411/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00515411/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid50084">
          <title>Conférence Annuelle sur le Traitement Automatique des Langues Naturelles</title>
          <num>17</num>
          <abbr type="sigle">TALN</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="3563" id="alpage-2010-bid88" type="inproceedings" rend="year" n="cite:thuilier:2010:inria-00515415:1">
      <identifiant type="hal" value="inria-00515415"/>
      <identifiant type="doi" value="10.1051/cmlf/2010161"/>
      <analytic>
        <title level="a">Fréquence, longueur et préférences
        lexicales dans le choix de la position de l'adjectif
        épithète en français</title>
        <author>
          <persName key="alpage-2009-idm402038273904">
            <foreName>Juliette</foreName>
            <surname>Thuilier</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Gwendoline</foreName>
            <surname>Fox</surname>
            <initial>G.</initial>
          </persName>
          <persName key="alpage-2008-idm542378770960">
            <foreName>Benoît</foreName>
            <surname>Crabbé</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <editor role="editor">
          <persName>
            <foreName>Franck</foreName>
            <surname>Neveu</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Valelia</foreName>
            <surname>Muni Toke</surname>
            <initial>V.</initial>
          </persName>
          <persName>
            <foreName>Thomas</foreName>
            <surname>Klingler</surname>
            <initial>T.</initial>
          </persName>
          <persName>
            <foreName>Jacques</foreName>
            <surname>Durand</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Lorenza</foreName>
            <surname>Mondada</surname>
            <initial>L.</initial>
          </persName>
          <persName>
            <foreName>Sophie</foreName>
            <surname>Prévost</surname>
            <initial>S.</initial>
          </persName>
        </editor>
        <title level="m">2ème Congrès Mondial de Linguistique
        Française</title>
        <loc>États-Unis La Nouvelle-Orléans</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00515415/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00515415/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid55237">
          <title>Congrès Mondial de Linguistique Française</title>
          <num>2</num>
          <abbr type="sigle">CMLF</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="3563" id="alpage-2010-bid100" type="inproceedings" rend="year" n="cite:thuilier:2010:inria-00525768:1">
      <identifiant type="hal" value="inria-00525768"/>
      <identifiant type="doi" value="10.1051/cmlf/2010161"/>
      <analytic>
        <title level="a">Fréquence, longueur et préférences
        lexicales dans le choix de la position de l'adjectif
        épithète en français</title>
        <author>
          <persName key="alpage-2009-idm402038273904">
            <foreName>Juliette</foreName>
            <surname>Thuilier</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Gwendoline</foreName>
            <surname>Fox</surname>
            <initial>G.</initial>
          </persName>
          <persName key="alpage-2008-idm542378770960">
            <foreName>Benoît</foreName>
            <surname>Crabbé</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Congrès Mondial de Linguistique Française
        - CMLF 2010</title>
        <loc>États-Unis New Orleans</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <biblScope type="pages">2197-2210</biblScope>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00525768/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00525768/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid55237">
          <title>Congrès Mondial de Linguistique Française</title>
          <num>2</num>
          <abbr type="sigle">CMLF</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="4878" id="alpage-2010-bid99" type="inproceedings" rend="year" n="cite:tsarfaty:2010:inria-00525751:1">
      <identifiant type="hal" value="inria-00525751"/>
      <analytic>
        <title level="a">Statistical Parsing of Morphologically
        Rich Languages (SPMRL) What, How and Whither</title>
        <author>
          <persName>
            <foreName>Reut</foreName>
            <surname>Tsarfaty</surname>
            <initial>R.</initial>
          </persName>
          <persName key="alpage-2008-idm542378729584">
            <foreName>Djamé</foreName>
            <surname>Seddah</surname>
            <initial>D.</initial>
          </persName>
          <persName>
            <foreName>Yoav</foreName>
            <surname>Goldberg</surname>
            <initial>Y.</initial>
          </persName>
          <persName>
            <foreName>Sandra</foreName>
            <surname>Kübler</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Yannick</foreName>
            <surname>Versley</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="alpage-2008-idm542378777200">
            <foreName>Marie</foreName>
            <surname>Candito</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>Jennifer</foreName>
            <surname>Foster</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Ines</foreName>
            <surname>Rehbein</surname>
            <initial>I.</initial>
          </persName>
          <persName>
            <foreName>Lamia</foreName>
            <surname>Tounsi</surname>
            <initial>L.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Proceedings of the NAACL HLT 2010 First
        Workshop on Statistical Parsing of Morphologically-Rich
        Languages</title>
        <loc>États-Unis Los Angeles</loc>
        <imprint>
          <publisher>
            <orgName>Association for Computational
            Linguistics</orgName>
          </publisher>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <biblScope type="pages">1–12</biblScope>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00525751/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00525751/ 
          <allowbreak/>en</ref>
        </imprint>
      </monogr>
      <affiliation>
        <country>SE</country>
        <country>IL</country>
        <country>US</country>
        <country>DE</country>
        <country>IE</country>
      </affiliation>
    </biblStruct>
    <biblStruct dedoublkey="3498" id="alpage-2010-bid74" type="inproceedings" rend="year" n="cite:walther:2010:hal-00510999:1">
      <identifiant type="hal" value="hal-00510999"/>
      <analytic>
        <title level="a">Fast Development of Basic NLP Tools:
        Towards a Lexicon and a POS Tagger for Kurmanji
        Kurdish</title>
        <author>
          <persName>
            <foreName>Géraldine</foreName>
            <surname>Walther</surname>
            <initial>G.</initial>
          </persName>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
          <persName key="calligramme-2006-idm133559948416">
            <foreName>Karën</foreName>
            <surname>Fort</surname>
            <initial>K.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">International Conference on Lexis and
        Grammar</title>
        <loc>Serbie Belgrade</loc>
        <imprint>
          <dateStruct>
            <month>Sep</month>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/hal-00510999/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>hal-00510999/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid42656">
          <title>Colloque international sur le Lexique et la Grammaire</title>
          <num>29</num>
          <abbr type="sigle">CLG</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="3232" id="alpage-2010-bid72" type="inproceedings" rend="year" n="cite:walther:2010:inria-00521238:1">
      <identifiant type="hal" value="inria-00521238"/>
      <analytic>
        <title level="a">Developing a large-scale lexicon for a
        less-resourced language: general methodology and
        preliminary experiments on Sorani Kurdish</title>
        <author>
          <persName>
            <foreName>Géraldine</foreName>
            <surname>Walther</surname>
            <initial>G.</initial>
          </persName>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">SaLTMiL Workshop on Creation and use of
        basic lexical resources for less-resourced languages (LREC
        2010 workshop)</title>
        <loc>Malte Valletta</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00521238/en" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00521238/ 
          <allowbreak/>en</ref>
        </imprint>
        <meeting id="cid388195">
          <title>SaLTMiL Workshop on Creation and Use of Basic Lexical Resources for Less-resourced Languages</title>
          <num>7</num>
          <abbr type="sigle">SaLTMiL</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="2882" id="alpage-2010-bid52" type="inproceedings" rend="year" n="cite:VILLEMONTEDELACLERGERIE:2010:INRIA-00551974:1">
      <identifiant type="hal" value="inria-00551974"/>
      <analytic>
        <title level="a">Building factorized TAGs with
        meta-grammars</title>
        <author>
          <persName key="alpage-2009-idm402038308688">
            <foreName>Éric</foreName>
            <surname>Villemonte de La Clergerie</surname>
            <initial>É.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">The 10th International Conference on Tree
        Adjoining Grammars and Related Formalisms - TAG+10</title>
        <loc>New Haven, CT États-Unis</loc>
        <imprint>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <biblScope type="pages">111-118</biblScope>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00551974/PDF/mgfull.pdf" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00551974/ 
          <allowbreak/>PDF/ 
          <allowbreak/>mgfull. 
          <allowbreak/>pdf</ref>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00551974/en/" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00551974/ 
          <allowbreak/>en/ 
          <allowbreak/></ref>
        </imprint>
        <meeting id="cid336728">
          <title>International Workshop on Tree Adjoining Grammars and Related Formalisms</title>
          <num>10</num>
          <abbr type="sigle">TAG</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="3100" id="alpage-2010-bid108" type="inproceedings" rend="year" n="cite:VILLEMONTEDELACLERGERIE:2010:INRIA-00551973:1">
      <identifiant type="hal" value="inria-00551973"/>
      <analytic>
        <title level="a">Convertir des dérivations TAG en
        dépendances</title>
        <author>
          <persName key="alpage-2009-idm402038308688">
            <foreName>Éric</foreName>
            <surname>Villemonte de La Clergerie</surname>
            <initial>É.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">17e Conférence sur le Traitement
        Automatique des Langues Naturelles - TALN 2010</title>
        <loc>Montreal Canada</loc>
        <imprint>
          <publisher>
            <orgName type="organisation">ATALA</orgName>
          </publisher>
          <dateStruct>
            <year>2010</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00551973/PDF/dep.pdf" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00551973/ 
          <allowbreak/>PDF/ 
          <allowbreak/>dep. 
          <allowbreak/>pdf</ref>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.inria.fr/inria-00551973/en/" type="hal" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>inria-00551973/ 
          <allowbreak/>en/ 
          <allowbreak/></ref>
        </imprint>
        <meeting id="cid50084">
          <title>Conférence Annuelle sur le Traitement Automatique des Langues Naturelles</title>
          <num>17</num>
          <abbr type="sigle">TALN</abbr>
        </meeting>
      </monogr>
      <note type="bnote">Projet SCRIBO, financement Pôle
      SYSTEM@TIC</note>
    </biblStruct>
    <biblStruct id="alpage-2010-bid13" type="inproceedings" rend="foot" n="footcite:abeille:04">
      <analytic>
        <title level="a">Enriching a French Treebank</title>
        <author>
          <persName>
            <foreName>Anne</foreName>
            <surname>Abeillé</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>Nicolas</foreName>
            <surname>Barrier</surname>
            <initial>N.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of LREC'04</title>
        <loc>Lisbon, Portugal</loc>
        <imprint>
          <dateStruct>
            <year>2004</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid0" type="incollection" rend="foot" n="footcite:Boullier:TSLT04">
      <analytic>
        <title level="a">Range Concatenation Grammars</title>
        <author>
          <persName key="atoll-2006-idm57727947600">
            <foreName>Pierre</foreName>
            <surname>Boullier</surname>
            <initial>P.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <editor role="editor">
          <persName>
            <foreName>Harry</foreName>
            <surname>Bunt</surname>
            <initial>H.</initial>
          </persName>
          <persName>
            <foreName>John</foreName>
            <surname>Carroll</surname>
            <initial>J.</initial>
          </persName>
          <persName key="alpage-2008-idm542378733072">
            <foreName>Giorgio</foreName>
            <surname>Satta</surname>
            <initial>G.</initial>
          </persName>
        </editor>
        <title level="m">New Developments in Parsing
        Technology</title>
        <title level="s">Text, Speech and Language
        Technology</title>
        <imprint>
          <biblScope type="volume">23</biblScope>
          <publisher>
            <orgName>Kluwer Academic Publishers</orgName>
          </publisher>
          <dateStruct>
            <year>2004</year>
          </dateStruct>
          <biblScope type="pages">269–289</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid46" type="book" rend="foot" n="footcite:bresnan82">
      <monogr>
        <title level="m">The mental representation of grammatical
        relations</title>
        <author>
          <persName>
            <foreName>Joan</foreName>
            <surname>Bresnan</surname>
            <initial>J.</initial>
          </persName>
        </author>
        <imprint>
          <publisher>
            <orgName>MIT press</orgName>
          </publisher>
          <dateStruct>
            <year>1982</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid42" type="incollection" rend="foot" n="footcite:bresnan2007">
      <analytic>
        <title level="a">Predicting the Dative Alternation</title>
        <author>
          <persName>
            <foreName>Joan</foreName>
            <surname>Bresnan</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Anna</foreName>
            <surname>Cueni</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>Tatiana</foreName>
            <surname>Nikitina</surname>
            <initial>T.</initial>
          </persName>
          <persName>
            <foreName>Harald</foreName>
            <surname>Baayen</surname>
            <initial>H.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Cognitive Foundations of
        Interpretation</title>
        <loc>Amsterdam</loc>
        <imprint>
          <publisher>
            <orgName>Royal Netherlands Academy of Science 
            <loc>Amsterdam</loc></orgName>
          </publisher>
          <dateStruct>
            <year>2007</year>
          </dateStruct>
          <biblScope type="pages">69-94</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid48" type="phdthesis" rend="foot" n="footcite:candito99">
      <monogr>
        <title level="m">Organisation modulaire et paramétrable de
        grammaires électroniques lexicalisées</title>
        <author>
          <persName key="alpage-2008-idm542378777200">
            <foreName>Marie</foreName>
            <surname>Candito</surname>
            <initial>M.</initial>
          </persName>
        </author>
        <imprint>
          <publisher>
            <orgName type="school">Université
            Paris 7</orgName>
          </publisher>
          <dateStruct>
            <year>1999</year>
          </dateStruct>
        </imprint>
      </monogr>
      <note type="typdoc">Ph. D. Thesis</note>
    </biblStruct>
    <biblStruct id="alpage-2010-bid17" type="inproceedings" rend="foot" n="footcite:ccdg:09short">
      <analytic>
        <title level="a">Analyse syntaxique du français : des
        constituants aux dépendances</title>
        <author>
          <persName key="alpage-2008-idm542378777200">
            <foreName>Marie</foreName>
            <surname>Candito</surname>
            <initial>M.</initial>
          </persName>
          <persName key="alpage-2008-idm542378770960">
            <foreName>Benoît</foreName>
            <surname>Crabbé</surname>
            <initial>B.</initial>
          </persName>
          <persName key="alpage-2008-idm542378764240">
            <foreName>Pascal</foreName>
            <surname>Denis</surname>
            <initial>P.</initial>
          </persName>
          <persName key="alpage-2009-idm402038319232">
            <foreName>François</foreName>
            <surname>Guérin</surname>
            <initial>F.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Proceedings of TALN'09</title>
        <loc>Senlis, France</loc>
        <imprint>
          <dateStruct>
            <year>2009</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid39" type="inproceedings" rend="foot" n="footcite:cardie:wagstaff:99">
      <analytic>
        <title level="a">Noun phrase coreference as
        clustering</title>
        <author>
          <persName>
            <foreName>Claire</foreName>
            <surname>Cardie</surname>
            <initial>C.</initial>
          </persName>
          <persName>
            <foreName>Kiri</foreName>
            <surname>Wagstaff</surname>
            <initial>K.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of the Joint SIGDAT Conference
        on Empirical Methods in Natural Language Processing and
        Very Large Corpora</title>
        <loc>University of Maryland, MD</loc>
        <imprint>
          <publisher>
            <orgName>Association for Computational
            Linguistics</orgName>
          </publisher>
          <dateStruct>
            <year>1999</year>
          </dateStruct>
          <biblScope type="pages">82–89</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid9" type="article" rend="foot" n="footcite:chiang:00">
      <analytic>
        <title level="a">Statistical parsing with an
        automatically-extracted Tree Adjoining Grammar</title>
        <author>
          <persName>
            <foreName>David</foreName>
            <surname>Chiang</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">Proceedings of the 38th Annual Meeting on
        Association for Computational Linguistics</title>
        <imprint>
          <dateStruct>
            <year>2000</year>
          </dateStruct>
          <biblScope type="pages">456–463</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid45" type="book" rend="foot" n="footcite:chomsky65">
      <monogr>
        <title level="m">Aspects of the theory of Syntax</title>
        <author>
          <persName>
            <foreName>Noam</foreName>
            <surname>Chomsky</surname>
            <initial>N.</initial>
          </persName>
        </author>
        <imprint>
          <publisher>
            <orgName>MIT press</orgName>
          </publisher>
          <dateStruct>
            <year>1965</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid59" type="inproceedings" rend="foot" n="footcite:chrupala:08short">
      <analytic>
        <title level="a">Learning Morphology with Morfette</title>
        <author>
          <persName>
            <foreName>Grzegorz</foreName>
            <surname>Chrupała</surname>
            <initial>G.</initial>
          </persName>
          <persName>
            <foreName>Georgiana</foreName>
            <surname>Dinu</surname>
            <initial>G.</initial>
          </persName>
          <persName>
            <foreName>Josef</foreName>
            <surname>van Genabith</surname>
            <initial>J.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of LREC2008</title>
        <imprint>
          <dateStruct>
            <year>2008</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid8" type="phdthesis" rend="foot" n="footcite:collins:99">
      <monogr>
        <title level="m">Head Driven Statistical Models for Natural
        Language Parsing</title>
        <author>
          <persName>
            <foreName>Michael</foreName>
            <surname>Collins</surname>
            <initial>M.</initial>
          </persName>
        </author>
        <imprint>
          <publisher>
            <orgName type="school">University of
            Pennsylvania</orgName>
            <address>
              <addrLine>Philadelphia</addrLine>
            </address>
          </publisher>
          <dateStruct>
            <year>1999</year>
          </dateStruct>
        </imprint>
      </monogr>
      <note type="typdoc">Ph. D. Thesis</note>
    </biblStruct>
    <biblStruct id="alpage-2010-bid49" type="inproceedings" rend="foot" n="footcite:crabbe05lacl">
      <analytic>
        <title level="a">Grammatical Development with XMG</title>
        <author>
          <persName key="alpage-2008-idm542378770960">
            <foreName>Benoît</foreName>
            <surname>Crabbé</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Logical Aspects of Computational
        Linguistics (LACL)</title>
        <loc>Bordeaux</loc>
        <imprint>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">84-100</biblScope>
        </imprint>
      </monogr>
      <note type="bnote">Published in the Lecture Notes in Computer
      Science series (LNCS/LNAI), vol. 3492, Springer Verlag</note>
    </biblStruct>
    <biblStruct id="alpage-2010-bid14" type="inproceedings" rend="foot" n="footcite:crabbe:08">
      <analytic>
        <title level="a">Expériences D'Analyse Syntaxique
        Statistique Du Français</title>
        <author>
          <persName key="alpage-2008-idm542378770960">
            <foreName>Benoît</foreName>
            <surname>Crabbé</surname>
            <initial>B.</initial>
          </persName>
          <persName key="alpage-2008-idm542378777200">
            <foreName>Marie</foreName>
            <surname>Candito</surname>
            <initial>M.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Actes de la 15ème Conférence sur le
        Traitement Automatique des Langues Naturelles
        (TALN'08)</title>
        <loc>Avignon, France</loc>
        <imprint>
          <dateStruct>
            <year>2008</year>
          </dateStruct>
          <biblScope type="pages">45–54</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid30" type="inproceedings" rend="foot" n="footcite:danlos06cd">
      <analytic>
        <title level="a">Discourse Verbs and Discourse Periphrastic
        Links</title>
        <author>
          <persName key="alpage-2008-idm542378767840">
            <foreName>Laurence</foreName>
            <surname>Danlos</surname>
            <initial>L.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Second International Workshop on
        Constraints in Discourse</title>
        <loc>Maynooth, Ireland</loc>
        <imprint>
          <dateStruct>
            <year>2006</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid31" type="inproceedings" rend="foot" n="footcite:danlos07taln">
      <analytic>
        <title level="a">D-STAG : un formalisme pour le
        discours basé sur les TAG synchrones</title>
        <author>
          <persName key="alpage-2008-idm542378767840">
            <foreName>Laurence</foreName>
            <surname>Danlos</surname>
            <initial>L.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of TALN 2007</title>
        <loc>Toulouse, France</loc>
        <imprint>
          <dateStruct>
            <year>2007</year>
          </dateStruct>
        </imprint>
      </monogr>
      <note type="bnote">to appear</note>
    </biblStruct>
    <biblStruct id="alpage-2010-bid56" type="inproceedings" rend="foot" n="footcite:melt:09short">
      <analytic>
        <title level="a">Coupling an annotated corpus and a
        morphosyntactic lexicon for state-of-the-art POS tagging
        with less human effort</title>
        <author>
          <persName key="alpage-2008-idm542378764240">
            <foreName>Pascal</foreName>
            <surname>Denis</surname>
            <initial>P.</initial>
          </persName>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Proceedings of PACLIC 2009</title>
        <loc>Hong Kong, China</loc>
        <imprint>
          <dateStruct>
            <year>2009</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://atoll.inria.fr/~sagot/pub/paclic09tagging.pdf" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>atoll. 
          <allowbreak/>inria. 
          <allowbreak/>fr/ 
          <allowbreak/>~sagot/ 
          <allowbreak/>pub/ 
          <allowbreak/>paclic09tagging. 
          <allowbreak/>pdf</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid24" type="inproceedings" rend="foot" n="footcite:fiser07">
      <analytic>
        <title level="a">Leveraging Parallel Corpora and Existing
        Wordnets for Automatic Construction of the Slovene
        Wordnet</title>
        <author>
          <persName>
            <foreName>Darja</foreName>
            <surname>Fišer</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of L&amp;TC'07</title>
        <loc>Poznań, Poland</loc>
        <imprint>
          <dateStruct>
            <year>2007</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid23" type="inproceedings" rend="foot" n="footcite:ide02">
      <analytic>
        <title level="a">Sense Discrimination with Parallel
        Corpora</title>
        <author>
          <persName>
            <foreName>Nancy</foreName>
            <surname>Ide</surname>
            <initial>N.</initial>
          </persName>
          <persName>
            <foreName>Tomaž</foreName>
            <surname>Erjavec</surname>
            <initial>T.</initial>
          </persName>
          <persName>
            <foreName>Dan</foreName>
            <surname>Tufiș</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proc. of ACL'02 Workshop on Word Sense
        Disambiguation</title>
        <imprint>
          <dateStruct>
            <year>2002</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid63" type="article" rend="foot" n="footcite:kallmeyer:TLMCTAGSN">
      <analytic>
        <title level="a">Tree-Local Multicomponent Tree-Adjoining
        Grammars with Shared Nodes</title>
        <author>
          <persName>
            <foreName>Laura</foreName>
            <surname>Kallmeyer</surname>
            <initial>L.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">Computational Linguistics</title>
        <imprint>
          <biblScope type="volume">31</biblScope>
          <biblScope type="number">2</biblScope>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">187–226</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid44" type="phdthesis" rend="foot" n="footcite:keller2000">
      <monogr>
        <title level="m">Gradience in Grammar: Experimental and
        Computational Aspects of Degrees of Grammaticality</title>
        <author>
          <persName>
            <foreName>Frank</foreName>
            <surname>Keller</surname>
            <initial>F.</initial>
          </persName>
        </author>
        <imprint>
          <publisher>
            <orgName type="school">University of
            Edinburgh</orgName>
          </publisher>
          <dateStruct>
            <year>2000</year>
          </dateStruct>
        </imprint>
      </monogr>
      <note type="typdoc">Ph. D. Thesis</note>
    </biblStruct>
    <biblStruct id="alpage-2010-bid5" type="inproceedings" rend="foot" n="footcite:manning:03">
      <analytic>
        <title level="a">Accurate Unlexicalized Parsing</title>
        <author>
          <persName>
            <foreName>Dan</foreName>
            <surname>Klein</surname>
            <initial>D.</initial>
          </persName>
          <persName>
            <foreName>Christopher D.</foreName>
            <surname>Manning</surname>
            <initial>C. D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of the 41st Meeting of the
        Association for Computational Linguistics</title>
        <imprint>
          <dateStruct>
            <year>2003</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid37" type="inproceedings" rend="foot" n="footcite:Luo:07">
      <analytic>
        <title level="a">Coreference or not: a twin model for
        coreference resolution</title>
        <author>
          <persName>
            <foreName>X.</foreName>
            <surname>Luo</surname>
            <initial>X.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of HLT-NAACL 2007</title>
        <loc>Rochester, NY</loc>
        <imprint>
          <dateStruct>
            <year>2007</year>
          </dateStruct>
          <biblScope type="pages">73–80</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid79" type="inproceedings" rend="foot" n="footcite:Martin:09">
      <analytic>
        <title level="a">Learning Phonemes with a
        Pseudo-Lexicon</title>
        <author>
          <persName>
            <foreName>Andrew</foreName>
            <surname>Martin</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>Sharon</foreName>
            <surname>Peperkamp</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Emmanuel</foreName>
            <surname>Dupoux</surname>
            <initial>E.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Workshop on Computational Modelling of
        Sound Pattern Acquisition</title>
        <loc>Edmonton, Canada</loc>
        <imprint>
          <dateStruct>
            <year>2009</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid35" type="inproceedings" rend="foot" n="footcite:mccallum:wellner:04">
      <analytic>
        <title level="a">Conditional Models of Identity Uncertainty
        with Application to Noun Coreference</title>
        <author>
          <persName>
            <foreName>A.</foreName>
            <surname>McCallum</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>B.</foreName>
            <surname>Wellner</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of NIPS 2004</title>
        <imprint>
          <dateStruct>
            <year>2004</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid12" type="inproceedings" rend="foot" n="footcite:mcdonald:pereira:06">
      <analytic>
        <title level="a">Online Learning of Approximate Dependency
        Parsing Algorithms</title>
        <author>
          <persName>
            <foreName>Ryan T.</foreName>
            <surname>McDonald</surname>
            <initial>R. T.</initial>
          </persName>
          <persName>
            <foreName>Fernando C. N.</foreName>
            <surname>Pereira</surname>
            <initial>F. C. N.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proc. of EACL'06</title>
        <imprint>
          <dateStruct>
            <year>2006</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid34" type="inproceedings" rend="foot" n="footcite:ng:cardie:02a">
      <analytic>
        <title level="a">Improving Machine Learning Approaches to
        Coreference Resolution</title>
        <author>
          <persName>
            <foreName>Vincent</foreName>
            <surname>Ng</surname>
            <initial>V.</initial>
          </persName>
          <persName>
            <foreName>Claire</foreName>
            <surname>Cardie</surname>
            <initial>C.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of ACL 2002</title>
        <imprint>
          <dateStruct>
            <year>2002</year>
          </dateStruct>
          <biblScope type="pages">104–111</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid36" type="inproceedings" rend="foot" n="footcite:ng:05b">
      <analytic>
        <title level="a">Machine Learning for Coreference
        Resolution: From Local Classification to Global
        Ranking</title>
        <author>
          <persName>
            <foreName>Vincent</foreName>
            <surname>Ng</surname>
            <initial>V.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of ACL 2005</title>
        <loc>Ann Arbor, MI</loc>
        <imprint>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">157–164</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid40" type="inproceedings" rend="foot" n="footcite:ng:08">
      <analytic>
        <title level="a">Unsupervised Models for Coreference
        Resolution</title>
        <author>
          <persName>
            <foreName>Vincent</foreName>
            <surname>Ng</surname>
            <initial>V.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of EMNLP 2008</title>
        <imprint>
          <dateStruct>
            <year>2008</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid11" type="inproceedings" rend="foot" n="footcite:nivre-scholz:2004:COLING">
      <analytic>
        <title level="a">Deterministic Dependency Parsing of
        English Text</title>
        <author>
          <persName>
            <foreName>Joakim</foreName>
            <surname>Nivre</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Mario</foreName>
            <surname>Scholz</surname>
            <initial>M.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of Coling 2004</title>
        <loc>Geneva, Switzerland</loc>
        <imprint>
          <publisher>
            <orgName>COLING</orgName>
          </publisher>
          <dateStruct>
            <month>Aug 23–Aug 27</month>
            <year>2004</year>
          </dateStruct>
          <biblScope type="pages">64–70</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid78" type="article" rend="foot" n="footcite:Peperkamp:06">
      <analytic>
        <title level="a">The acquisition of allophonic rules:
        statistical learning with linguistic constraints</title>
        <author>
          <persName>
            <foreName>Sharon</foreName>
            <surname>Peperkamp</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Rozenn</foreName>
            <surname>Le Calvez</surname>
            <initial>R.</initial>
          </persName>
          <persName>
            <foreName>Jean-Pierre</foreName>
            <surname>Nadal</surname>
            <initial>J.-P.</initial>
          </persName>
          <persName>
            <foreName>Emmanuel</foreName>
            <surname>Dupoux</surname>
            <initial>E.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">Cognition</title>
        <imprint>
          <biblScope type="volume">101</biblScope>
          <biblScope type="number">3</biblScope>
          <dateStruct>
            <year>2006</year>
          </dateStruct>
          <biblScope type="pages">B31–B41</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid6" type="inproceedings" rend="foot" n="footcite:petrov:06">
      <analytic>
        <title level="a">Learning Accurate, Compact, and
        Interpretable Tree Annotation</title>
        <author>
          <persName>
            <foreName>Slav</foreName>
            <surname>Petrov</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Leon</foreName>
            <surname>Barrett</surname>
            <initial>L.</initial>
          </persName>
          <persName>
            <foreName>Romain</foreName>
            <surname>Thibaux</surname>
            <initial>R.</initial>
          </persName>
          <persName>
            <foreName>Dan</foreName>
            <surname>Klein</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of the 21st International
        Conference on Computational Linguistics and 44th Annual
        Meeting of the Association for Computational
        Linguistics</title>
        <loc>Sydney, Australia</loc>
        <imprint>
          <publisher>
            <orgName>Association for Computational
            Linguistics</orgName>
          </publisher>
          <dateStruct>
            <month>July</month>
            <year>2006</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid7" type="inproceedings" rend="foot" n="footcite:petrov-klein:07">
      <analytic>
        <title level="a">Improved Inference for Unlexicalized
        Parsing</title>
        <author>
          <persName>
            <foreName>Slav</foreName>
            <surname>Petrov</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Dan</foreName>
            <surname>Klein</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Human Language Technologies 2007: The
        Conference of the North American Chapter of the Association
        for Computational Linguistics; Proceedings of the Main
        Conference</title>
        <loc>Rochester, New York</loc>
        <imprint>
          <publisher>
            <orgName>Association for Computational
            Linguistics</orgName>
          </publisher>
          <dateStruct>
            <month>April</month>
            <year>2007</year>
          </dateStruct>
          <biblScope type="pages">404–411</biblScope>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://www.aclweb.org/anthology/N/N07/N07-1051" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>www. 
          <allowbreak/>aclweb. 
          <allowbreak/>org/ 
          <allowbreak/>anthology/ 
          <allowbreak/>N/ 
          <allowbreak/>N07/ 
          <allowbreak/>N07-1051</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid47" type="book" rend="foot" n="footcite:pollard94">
      <monogr>
        <title level="m">Head Driven Phrase Structure
        Grammar</title>
        <author>
          <persName key="calligramme-2008-idm354935285920">
            <foreName>Carl</foreName>
            <surname>Pollard</surname>
            <initial>C.</initial>
          </persName>
          <persName>
            <foreName>Ivan</foreName>
            <surname>Sag</surname>
            <initial>I.</initial>
          </persName>
        </author>
        <imprint>
          <publisher>
            <orgName>University of Chicago Press</orgName>
          </publisher>
          <dateStruct>
            <year>1994</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid21" type="inproceedings" rend="foot" n="footcite:resnik97">
      <analytic>
        <title level="a">A perspective on word sense disambiguation
        methods and their evaluation</title>
        <author>
          <persName>
            <foreName>Philip</foreName>
            <surname>Resnik</surname>
            <initial>P.</initial>
          </persName>
          <persName>
            <foreName>David</foreName>
            <surname>Yarowsky</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">ACL SIGLEX Workshop on Tagging Text with
        Lexical Semantics: Why, What, and How?</title>
        <loc>Washington, D.C., USA</loc>
        <imprint>
          <dateStruct>
            <year>1997</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid1" type="inproceedings" rend="foot" n="footcite:sagot04a">
      <analytic>
        <title level="a">Les RCG comme formalisme grammatical pour
        la linguistique</title>
        <author>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
          <persName key="atoll-2006-idm57727947600">
            <foreName>Pierre</foreName>
            <surname>Boullier</surname>
            <initial>P.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Actes de TALN'04</title>
        <loc>Fès, Maroc</loc>
        <imprint>
          <dateStruct>
            <year>2004</year>
          </dateStruct>
          <biblScope type="pages">403–412</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid55" type="article" rend="foot" n="footcite:TAL08:sxpipe">
      <analytic>
        <title level="a">SxPipe 2: architecture pour le traitement
        présyntaxique de corpus bruts</title>
        <author>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
          <persName key="atoll-2006-idm57727947600">
            <foreName>Pierre</foreName>
            <surname>Boullier</surname>
            <initial>P.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">Traitement Automatique des Langues
        (T.A.L.)</title>
        <imprint>
          <biblScope type="volume">50</biblScope>
          <biblScope type="number">1</biblScope>
          <dateStruct>
            <year>2009</year>
          </dateStruct>
        </imprint>
      </monogr>
      <note type="bnote">to appear</note>
    </biblStruct>
    <biblStruct id="alpage-2010-bid25" type="inproceedings" rend="foot" n="footcite:LREC06:Lefff">
      <identifiant type="hal" value="docs"/>
      <analytic>
        <title level="a">The Lefff 2 syntactic lexicon for French:
        architecture, acquisition, use</title>
        <author>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
          <persName key="signes-2006-idm424409784176">
            <foreName>Lionel</foreName>
            <surname>Clément</surname>
            <initial>L.</initial>
          </persName>
          <persName key="alpage-2009-idm402038308688">
            <foreName>Éric</foreName>
            <surname>Villemonte de La Clergerie</surname>
            <initial>É.</initial>
          </persName>
          <persName key="atoll-2006-idm57727947600">
            <foreName>Pierre</foreName>
            <surname>Boullier</surname>
            <initial>P.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proc. of LREC'06</title>
        <imprint>
          <dateStruct>
            <year>2006</year>
          </dateStruct>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://hal.archives-ouvertes.fr/docs/00/41/30/71/PDF/LREC06b.pdf" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>hal. 
          <allowbreak/>archives-ouvertes. 
          <allowbreak/>fr/ 
          <allowbreak/>docs/ 
          <allowbreak/>00/ 
          <allowbreak/>41/ 
          <allowbreak/>30/ 
          <allowbreak/>71/ 
          <allowbreak/>PDF/ 
          <allowbreak/>LREC06b. 
          <allowbreak/>pdf</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid27" type="inproceedings" rend="foot" n="footcite:sagot08ontolex">
      <analytic>
        <title level="a">Building a free French wordnet from
        multilingual resources</title>
        <author>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
          <persName>
            <foreName>Darja</foreName>
            <surname>Fišer</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Actes de Ontolex 2008</title>
        <loc>Marrakech, Maroc</loc>
        <imprint>
          <dateStruct>
            <year>2008</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid18" type="inproceedings" rend="foot" n="footcite:TSD05">
      <analytic>
        <title level="a">Automatic acquisition of a Slovak lexicon
        from a raw corpus</title>
        <author>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Lecture Notes in Artificial Intelligence
        3658 (© Springer-Verlag), Proceedings of TSD'05</title>
        <loc>Karlovy Vary, Czech Republic</loc>
        <imprint>
          <dateStruct>
            <month>September</month>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">156–163</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid2" type="inproceedings" rend="foot" n="footcite:sagot05:LACL">
      <analytic>
        <title level="a">Linguistic facts as predicates over ranges
        of the sentence</title>
        <author>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Lecture Notes in Computer Science 3492 (©
        Springer-Verlag), Proceedings of LACL'05</title>
        <loc>Bordeaux, France</loc>
        <imprint>
          <dateStruct>
            <month>April</month>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">271–286</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid28" type="inproceedings" rend="foot" n="footcite:LTCbest:polish">
      <analytic>
        <title level="a">Building a morphosyntactic lexicon and a
        pre-syntactic processing chain for Polish</title>
        <author>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">LNAI 5603, selected papers presented at
        the LTC 2007 conference</title>
        <imprint>
          <publisher>
            <orgName>Springer</orgName>
          </publisher>
          <dateStruct>
            <year>2009</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid61" type="inproceedings" rend="foot" n="footcite:TAG06">
      <analytic>
        <title level="a">Modeling and Analysis of Elliptic
        Coordination by Dynamic Exploitation of Derivation Forests
        in LTAG parsing</title>
        <author>
          <persName key="alpage-2008-idm542378729584">
            <foreName>Djamé</foreName>
            <surname>Seddah</surname>
            <initial>D.</initial>
          </persName>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of TAG+8</title>
        <loc>Sydney, Australia</loc>
        <imprint>
          <dateStruct>
            <month>July</month>
            <year>2006</year>
          </dateStruct>
          <biblScope type="pages">147–152</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid62" type="inproceedings" rend="foot" n="footcite:seddah:08">
      <analytic>
        <title level="a">The Use of MCTAG to Process Elliptic
        Coordination</title>
        <author>
          <persName key="alpage-2008-idm542378729584">
            <foreName>Djamé</foreName>
            <surname>Seddah</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" x-proceedings="yes">
        <title level="m">Proceedings of the Ninth International
        Workshop on Tree Adjoining Grammars and Related Formalisms
        (TAG+9)</title>
        <loc>Tübingen, Germany</loc>
        <imprint>
          <dateStruct>
            <month>June</month>
            <year>2008</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid33" type="article" rend="foot" n="footcite:soon_et_al:01">
      <analytic>
        <title level="a">A machine learning approach to coreference
        resolution of noun phrases</title>
        <author>
          <persName>
            <foreName>W. M.</foreName>
            <surname>Soon</surname>
            <initial>W. M.</initial>
          </persName>
          <persName>
            <foreName>H. T.</foreName>
            <surname>Ng</surname>
            <initial>H. T.</initial>
          </persName>
          <persName>
            <foreName>D.</foreName>
            <surname>Lim</surname>
            <initial>D.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">Computational Linguistics</title>
        <imprint>
          <biblScope type="volume">27</biblScope>
          <biblScope type="number">4</biblScope>
          <dateStruct>
            <year>2001</year>
          </dateStruct>
          <biblScope type="pages">521–544</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid4" type="inproceedings" rend="foot" n="footcite:MG:TALN05">
      <analytic>
        <title level="a">Comment obtenir plus des
        Méta-Grammaires</title>
        <author>
          <persName key="atoll-2006-idm57727935376">
            <foreName>François</foreName>
            <surname>Thomasset</surname>
            <initial>F.</initial>
          </persName>
          <persName key="alpage-2009-idm402038308688">
            <foreName>Éric</foreName>
            <surname>Villemonte de La Clergerie</surname>
            <initial>É.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of TALN'05</title>
        <loc>Dourdan, France</loc>
        <imprint>
          <publisher>
            <orgName type="organisation">ATALA</orgName>
          </publisher>
          <dateStruct>
            <month>June</month>
            <year>2005</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid75" type="article" rend="foot" n="footcite:Vallabha:07">
      <analytic>
        <title level="a">Unsupervised learning of vowel categories
        from infant-directed speech</title>
        <author>
          <persName>
            <foreName>Gautam</foreName>
            <surname>Vallabha</surname>
            <initial>G.</initial>
          </persName>
          <persName>
            <foreName>James</foreName>
            <surname>McClelland</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Ferran</foreName>
            <surname>Pons</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Janet</foreName>
            <surname>Werker</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Shigeaki</foreName>
            <surname>Amano</surname>
            <initial>S.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">Proceedings of the National Academy of
        Sciences</title>
        <imprint>
          <biblScope type="volume">104</biblScope>
          <biblScope type="number">33</biblScope>
          <dateStruct>
            <year>2007</year>
          </dateStruct>
          <biblScope type="pages">13273–13278</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct id="alpage-2010-bid19" type="inproceedings" rend="foot" n="footcite:noord04">
      <analytic>
        <title level="a">Error Mining for Wide-Coverage Grammar
        Engineering</title>
        <author>
          <persName>
            <foreName>Gertjan</foreName>
            <surname>van Noord</surname>
            <initial>G.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proc. of ACL 2004</title>
        <loc>Barcelona, Spain</loc>
        <imprint>
          <dateStruct>
            <year>2004</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <!-- Footnote citation "varadarajan-khudanpur-dupoux:2008:ACLShort":
         short paper in the ACL-08: HLT proceedings, pages 165–168.
         All three authors are listed as persName children of one author element. -->
    <biblStruct id="alpage-2010-bid76" type="inproceedings" rend="foot" n="footcite:varadarajan-khudanpur-dupoux:2008:ACLShort">
      <analytic>
        <title level="a">Unsupervised Learning of Acoustic Sub-word
        Units</title>
        <author>
          <persName>
            <foreName>Balakrishnan</foreName>
            <surname>Varadarajan</surname>
            <initial>B.</initial>
          </persName>
          <persName>
            <foreName>Sanjeev</foreName>
            <surname>Khudanpur</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Emmanuel</foreName>
            <surname>Dupoux</surname>
            <initial>E.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of ACL-08: HLT, Short
        Papers</title>
        <loc>Columbus, Ohio</loc>
        <imprint>
          <publisher>
            <orgName>Association for Computational
            Linguistics</orgName>
          </publisher>
          <dateStruct>
            <month>June</month>
            <year>2008</year>
          </dateStruct>
          <biblScope type="pages">165–168</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <!-- Footnote citation "vwj87b": Vijay-Shanker, Weir and Joshi, ACL 1987,
         pages 104–111. The DOI appears twice: as the identifiant value and as
         the xlink:href of the ref element inside the imprint. The ref text is
         the same URL split by allowbreak elements (presumably permitted
         line-break points for rendering; confirm against the DTD); do not
         reflow it, the whitespace is part of the text content.
         NOTE(review): loc holds "Stroudsburg, PA, USA", which looks like the
         publisher's address rather than the meeting venue, whereas other
         entries put the conference city in loc. Confirm which is intended. -->
    <biblStruct id="alpage-2010-bid65" type="inproceedings" rend="foot" n="footcite:vwj87b">
      <identifiant type="doi" value="10.3115/981175.981190"/>
      <analytic>
        <title level="a">Characterizing structural descriptions
        produced by various grammatical formalisms</title>
        <author>
          <persName>
            <foreName>K.</foreName>
            <surname>Vijay-Shanker</surname>
            <initial>K.</initial>
          </persName>
          <persName>
            <foreName>David J.</foreName>
            <surname>Weir</surname>
            <initial>D. J.</initial>
          </persName>
          <persName>
            <foreName>Aravind K.</foreName>
            <surname>Joshi</surname>
            <initial>A. K.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of the 25th annual meeting on
        Association for Computational Linguistics</title>
        <loc>Stroudsburg, PA, USA</loc>
        <imprint>
          <publisher>
            <orgName>Association for Computational
            Linguistics</orgName>
          </publisher>
          <dateStruct>
            <year>1987</year>
          </dateStruct>
          <biblScope type="pages">104–111</biblScope>
          <ref xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="http://dx.doi.org/10.3115/981175.981190" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http:// 
          <allowbreak/>dx. 
          <allowbreak/>doi. 
          <allowbreak/>org/ 
          <allowbreak/>10. 
          <allowbreak/>3115/ 
          <allowbreak/>981175. 
          <allowbreak/>981190</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <!-- Footnote citation "wasow2002": book entry. There is no analytic
         level, so title and author sit directly under monogr. -->
    <biblStruct id="alpage-2010-bid43" type="book" rend="foot" n="footcite:wasow2002">
      <monogr>
        <title level="m">Postverbal behavior</title>
        <author>
          <persName>
            <foreName>Tom</foreName>
            <surname>Wasow</surname>
            <initial>T.</initial>
          </persName>
        </author>
        <imprint>
          <publisher>
            <orgName>CSLI</orgName>
          </publisher>
          <dateStruct>
            <year>2002</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <!-- Footnote citation "weir:88": PhD thesis entry. The awarding school is
         encoded as publisher/orgName with type="school" plus an address;
         the supervisor and document type are carried by the two trailing
         note elements (types "bnote" and "typdoc"). -->
    <biblStruct id="alpage-2010-bid64" type="phdthesis" rend="foot" n="footcite:weir:88">
      <monogr>
        <title level="m">Characterizing mildly context-sensitive
        grammar formalisms</title>
        <author>
          <persName>
            <foreName>David J.</foreName>
            <surname>Weir</surname>
            <initial>D. J.</initial>
          </persName>
        </author>
        <imprint>
          <publisher>
            <orgName type="school">University of
            Pennsylvania</orgName>
            <address>
              <addrLine>Philadelphia, PA, USA</addrLine>
            </address>
          </publisher>
          <dateStruct>
            <year>1988</year>
          </dateStruct>
        </imprint>
      </monogr>
      <note type="bnote">Supervisor-Aravind K. Joshi</note>
      <note type="typdoc">Ph. D. Thesis</note>
    </biblStruct>
    <!-- Footnote citation "yamada:03": workshop paper by Yamada and Matsumoto
         (IWPT 2003). The entry records only the year; it has no loc and no
         page range. -->
    <biblStruct id="alpage-2010-bid10" type="inproceedings" rend="foot" n="footcite:yamada:03">
      <analytic>
        <title level="a">Statistical Dependency Analysis with
        Support Vector Machines</title>
        <author>
          <persName>
            <foreName>Hiroyasu</foreName>
            <surname>Yamada</surname>
            <initial>H.</initial>
          </persName>
          <persName>
            <foreName>Yuji</foreName>
            <surname>Matsumoto</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">The 8th International Workshop of Parsing
        Technologies (IWPT2003)</title>
        <imprint>
          <dateStruct>
            <year>2003</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <!-- Footnote citation "ATALA09:frmg": paper in the electronic proceedings
         of an ATALA workshop day, October 2009. Each persName carries a key
         attribute in the same format as the person keys of the team section
         (presumably linking authors to team members; confirm). The monogr
         element is flagged x-international-audience="no" and
         x-proceedings="yes". -->
    <biblStruct id="alpage-2010-bid51" type="inproceedings" rend="foot" n="footcite:ATALA09:frmg">
      <analytic>
        <title level="a">FRMG: évolutions d'un analyseur syntaxique
        TAG du français</title>
        <author>
          <persName key="alpage-2009-idm402038308688">
            <foreName>Éric</foreName>
            <surname>Villemonte de La Clergerie</surname>
            <initial>É.</initial>
          </persName>
          <persName key="atoll-2006-idm57727917280">
            <foreName>Benoît</foreName>
            <surname>Sagot</surname>
            <initial>B.</initial>
          </persName>
          <persName key="atoll-2006-idm57727902672">
            <foreName>Lionel</foreName>
            <surname>Nicolas</surname>
            <initial>L.</initial>
          </persName>
          <persName key="signes-2006-idm424409744960">
            <foreName>Marie-Laure</foreName>
            <surname>Guénot</surname>
            <initial>M.-L.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="no" x-proceedings="yes">
        <title level="m">Actes électroniques de la Journée ATALA
        sur "Quels analyseurs syntaxiques pour le français
        ?"</title>
        <imprint>
          <publisher>
            <orgName type="organisation">ATALA</orgName>
          </publisher>
          <dateStruct>
            <month>October</month>
            <year>2009</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <!-- Footnote citation "DyALog:CSLP05": single-author workshop paper
         (CSLP'05, Barcelona, October 2005). No page range is recorded. -->
    <biblStruct id="alpage-2010-bid50" type="inproceedings" rend="foot" n="footcite:DyALog:CSLP05">
      <analytic>
        <title level="a">DyALog: a Tabular Logic Programming based
        environment for NLP</title>
        <author>
          <persName key="alpage-2009-idm402038308688">
            <foreName>Éric</foreName>
            <surname>Villemonte de La Clergerie</surname>
            <initial>É.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of 2nd International Workshop
        on Constraint Solving and Language Processing
        (CSLP'05)</title>
        <loc>Barcelona, Spain</loc>
        <imprint>
          <dateStruct>
            <month>October</month>
            <year>2005</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <!-- Footnote citation "MG:IWPT05": single-author paper in the IWPT'05
         proceedings (Vancouver, October 2005), pages 190–191. -->
    <biblStruct id="alpage-2010-bid3" type="inproceedings" rend="foot" n="footcite:MG:IWPT05">
      <analytic>
        <title level="a">From Metagrammars to Factorized TAG/TIG
        Parsers</title>
        <author>
          <persName key="alpage-2009-idm402038308688">
            <foreName>Éric</foreName>
            <surname>Villemonte de La Clergerie</surname>
            <initial>É.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of IWPT'05</title>
        <loc>Vancouver, Canada</loc>
        <imprint>
          <dateStruct>
            <month>October</month>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">190–191</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <!-- Footnote citation "vossen99": book entry for EuroWordNet.
         The person name is split into foreName / surname / initial like
         every other persName in this bibliography, instead of packing
         "Vossen, P." into surname and leaving the other two elements empty. -->
    <biblStruct id="alpage-2010-bid22" type="book" rend="foot" n="footcite:vossen99">
      <monogr>
        <title level="m">EuroWordNet: a multilingual database with
        lexical semantic networks for European Languages</title>
        <author>
          <persName>
            <foreName>Piek</foreName>
            <surname>Vossen</surname>
            <initial>P.</initial>
          </persName>
        </author>
        <imprint>
          <publisher>
            <orgName>Kluwer, Dordrecht</orgName>
          </publisher>
          <dateStruct>
            <year>1999</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
  </biblio>
</raweb>
