<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE raweb PUBLIC "-//INRIA//DTD" "raweb2.dtd">
<raweb xmlns:html="http://www.w3.org/1999/xhtml" xmlns:xlink="http://www.w3.org/1999/xlink" xml:lang="en" year="2005">
  <identification id="axis" isproject="true">
    <shortname>AxIS</shortname>
    <projectName>User-Centered Design, Improvement and Analysis of Information Systems</projectName>
    <theme>COG</theme>
    <team id="uid1">
      <participants category="Team_Leader">
        <person key="axis-2005-id18078">
          <firstname>Brigitte</firstname>
          <lastname>Trousse</lastname>
          <moreinfo>Research Scientist (CR1), Inria Sophia Antipolis</moreinfo>
        </person>
      </participants>
      <participants category="Team_Vice-Leader">
        <person key="axis-2005-id18098">
          <firstname>Yves</firstname>
          <lastname>Lechevallier</lastname>
          <moreinfo>Research Scientist (DR2), Inria Rocquencourt</moreinfo>
        </person>
      </participants>
      <participants category="Administrative_Assistants">
        <person key="axis-2005-id18118">
          <firstname>Stéphanie</firstname>
          <lastname>Aubin</lastname>
          <moreinfo>TR Inria, Inria Rocquencourt</moreinfo>
        </person>
        <person key="aoste-2005-id18118">
          <firstname>Sophie</firstname>
          <lastname>Honnorat</lastname>
          <moreinfo>AI Inria, part-time, Inria Sophia Antipolis</moreinfo>
        </person>
      </participants>
      <participants category="Research_Scientists">
        <person key="axis-2005-id18152">
          <firstname>Thierry</firstname>
          <lastname>Despeyroux</lastname>
          <moreinfo>Research Scientist (CR1), Inria Rocquencourt</moreinfo>
        </person>
        <person key="axis-2005-id18166">
          <firstname>Florent</firstname>
          <lastname>Masséglia</lastname>
          <moreinfo>Research Scientist (CR2), Inria Sophia Antipolis</moreinfo>
        </person>
        <person key="axis-2005-id18259">
          <firstname>Fabrice</firstname>
          <lastname>Rossi</lastname>
          <moreinfo>Research Scientist (CR1), on secondment from October 15, Inria Rocquencourt</moreinfo>
        </person>
        <person key="axis-2005-id18195">
          <firstname>Bernard</firstname>
          <lastname>Senach</lastname>
          <moreinfo>Research Scientist (CR1), since November, Inria Sophia Antipolis</moreinfo>
        </person>
        <person key="axis-2005-id18210">
          <firstname>Anne-Marie</firstname>
          <lastname>Vercoustre</lastname>
          <moreinfo>Research Scientist (DR2), 75 %, Inria Rocquencourt</moreinfo>
        </person>
      </participants>
      <participants category="Research_Scientists_(partners)">
        <person key="axis-2005-id18230">
          <firstname>Mireille</firstname>
          <lastname>Arnoux</lastname>
          <moreinfo>Assistant Prof., Univ. Bretagne Occidentale, Inria Sophia Antipolis</moreinfo>
        </person>
        <person key="axis-2005-id18244">
          <firstname>Marc</firstname>
          <lastname>Csernel</lastname>
          <moreinfo>Assistant Prof., Univ. Paris IX Dauphine, Inria Rocquencourt</moreinfo>
        </person>
        <person key="axis-2005-id18259">
          <firstname>Fabrice</firstname>
          <lastname>Rossi</lastname>
          <moreinfo>Assistant Prof., Univ. Paris IX Dauphine, until October 15, Inria Rocquencourt</moreinfo>
        </person>
        <person key="axis-2005-id18273">
          <firstname>Brieuc</firstname>
          <lastname>Conan-Guez</lastname>
          <moreinfo>Assistant Prof., Univ. Metz, until January 31, Inria Rocquencourt</moreinfo>
        </person>
      </participants>
      <participants category="Technical_Staff">
        <person key="axis-2005-id18293">
          <firstname>Mihai</firstname>
          <lastname>Jurca</lastname>
          <moreinfo>Development engineer, EPIA project, until August 31, Inria Sophia Antipolis</moreinfo>
        </person>
        <person key="axis-2005-id18308">
          <firstname>Aicha</firstname>
          <lastname>El Golli</lastname>
          <moreinfo>Research engineer,EPIA project, until October 31, Inria Rocquencourt</moreinfo>
        </person>
        <person key="axis-2005-id18416">
          <firstname>Doru</firstname>
          <lastname>Tanasa</lastname>
          <moreinfo>Research engineer, EPIA project, since November 15, Inria Sophia Antipolis</moreinfo>
        </person>
      </participants>
      <participants category="Ph._D._Students">
        <person key="axis-2005-id18343">
          <firstname>Abdourahamane</firstname>
          <lastname>Baldé</lastname>
          <moreinfo>Univ. of Paris IX Dauphine, Inria Rocquencourt</moreinfo>
        </person>
        <person key="axis-2005-id18357">
          <firstname>Hicham</firstname>
          <lastname>Behja</lastname>
          <moreinfo>France-Morocco Cooperation (STIC-GL network), Univ. Hassan II Ben M'Sik, Casablanca, Morocco, Inria Sophia Antipolis</moreinfo>
        </person>
        <person key="axis-2005-id18372">
          <firstname>Sergiu</firstname>
          <lastname>Chelcea</lastname>
          <moreinfo>Univ. Nice Sophia Antipolis (UNSA-STIC), Inria Sophia Antipolis</moreinfo>
        </person>
        <person key="axis-2005-id18387">
          <firstname>Alzennyr</firstname>
          <lastname>Da Silva</lastname>
          <moreinfo>Univ. Paris IX Dauphine, from October 1st, Inria Rocquencourt</moreinfo>
        </person>
        <person key="axis-2005-id18635">
          <firstname>Alice</firstname>
          <lastname>Marascu</lastname>
          <moreinfo>Univ. Nice Sophia Antipolis (UNSA-STIC), since October 1st, Inria Sophia Antipolis</moreinfo>
        </person>
        <person key="axis-2005-id18416">
          <firstname>Doru</firstname>
          <lastname>Tanasa</lastname>
          <moreinfo>Univ. Nice Sophia Antipolis (UNSA-STIC), until June 30, Inria Sophia Antipolis</moreinfo>
        </person>
      </participants>
      <participants category="Visiting_Scientists">
        <person key="axis-2005-id18436">
          <firstname>Teresa</firstname>
          <lastname>Bernarda Ludermir</lastname>
          <moreinfo>Prof., Federal Univ. of Pernambuco, Brazil, April, Inria Rocquencourt</moreinfo>
        </person>
        <person key="axis-2005-id18451">
          <firstname>Francisco</firstname>
          <lastname>De Carvalho</lastname>
          <moreinfo>Prof., Federal Univ. of Pernambuco, Brazil, April, September-November, Inria Rocquencourt</moreinfo>
        </person>
        <person key="axis-2005-id18466">
          <firstname>Elvira</firstname>
          <lastname>Romano</lastname>
          <moreinfo>PhD student, Univ. Federico II, Naples, November-December, Inria Rocquencourt</moreinfo>
        </person>
        <person key="axis-2005-id18481">
          <firstname>Rosanna</firstname>
          <lastname>Verde</lastname>
          <moreinfo>Prof., University of Napoli, Italy, March-May, Inria Rocquencourt</moreinfo>
        </person>
        <person key="axis-2005-id18496">
          <firstname>Osmar</firstname>
          <lastname>Zaiane</lastname>
          <moreinfo>Associate Prof., University of Alberta, Canada, June, Inria Sophia Antipolis</moreinfo>
        </person>
      </participants>
      <participants category="Student_Interns">
        <person key="axis-2005-id18516">
          <firstname>Rémi</firstname>
          <lastname>Busseuil</lastname>
          <moreinfo>ENS Cachan, June-July, Inria Sophia Antipolis</moreinfo>
        </person>
        <person key="axis-2005-id18530">
          <firstname>Patrick</firstname>
          <lastname>Chastellan</lastname>
          <moreinfo>Univ. Montpellier, June-September, Inria Sophia Antipolis &amp; LIRMM</moreinfo>
        </person>
        <person key="axis-2005-id18545">
          <firstname>Alzennyr</firstname>
          <lastname>da Silva</lastname>
          <moreinfo>Federal Univ. of Pernambuco, Brazil, April-September, Inria Sophia Antipolis and Rocquencourt</moreinfo>
        </person>
        <person key="axis-2005-id18560">
          <firstname>Marina</firstname>
          <lastname>Dufresne</lastname>
          <moreinfo>Univ. Paris XIII Institut Galilée, March-July, Inria Rocquencourt</moreinfo>
        </person>
        <person key="axis-2005-id18576">
          <firstname>Calin</firstname>
          <lastname>Garboni</lastname>
          <moreinfo>Univ. of Timisoara, May-Nov, Inria Sophia Antipolis</moreinfo>
        </person>
        <person key="axis-2005-id18591">
          <firstname>Saba</firstname>
          <lastname>Gul</lastname>
          <moreinfo>MIT, since September, Inria Rocquencourt</moreinfo>
        </person>
        <person key="axis-2005-id18605">
          <firstname>Selma</firstname>
          <lastname>Kebbache</lastname>
          <moreinfo>Univ. Paris I Panthéon-Sorbonne, June-August, Inria Rocquencourt</moreinfo>
        </person>
        <person key="axis-2005-id18621">
          <firstname>Nicomedes</firstname>
          <lastname>Lopes Calvacanti Junior</lastname>
          <moreinfo>Federal Univ. of Pernambuco, Brazil, October-March, Inria Rocquencourt</moreinfo>
        </person>
        <person key="axis-2005-id18635">
          <firstname>Alice</firstname>
          <lastname>Marascu</lastname>
          <moreinfo>Univ. Nice Sophia Antipolis (UNSA), January-July, Inria Sophia Antipolis</moreinfo>
        </person>
        <person key="axis-2005-id18650">
          <firstname>Mounir</firstname>
          <lastname>Fegas</lastname>
          <moreinfo>Univ. Paris Sud XI LRI, April-September, Inria Rocquencourt</moreinfo>
        </person>
        <person key="axis-2005-id18664">
          <firstname>Sofiane</firstname>
          <lastname>Sellah</lastname>
          <moreinfo>Univ. Lyon II, March-June, Inria Sophia Antipolis</moreinfo>
        </person>
        <person key="axis-2005-id18678">
          <firstname>Sattisvar</firstname>
          <lastname>Tandabany</lastname>
          <moreinfo>Univ. Orsay - ENS Lyon, March-June, Inria Sophia Antipolis</moreinfo>
        </person>
      </participants>
    </team>
    <UR name="Sophia"/>
    <UR name="Rocquencourt"/>
  </identification>
  <presentation id="uid3">
    <bodyTitle>Overall Objectives</bodyTitle>
    <subsection level="1" id="uid4">
      <bodyTitle>Objectives</bodyTitle>
      <keyword>information system</keyword>
      <keyword>user-centered design</keyword>
      <keyword>evaluation</keyword>
      <keyword>knowledge discovery</keyword>
      <keyword>KDD</keyword>
      <keyword>data mining</keyword>
      <keyword>usage mining</keyword>
      <keyword>document mining</keyword>
      <keyword>semantics checking</keyword>
      <keyword>semantic Web</keyword>
      <keyword>knowledge management</keyword>
      <keyword>information retrieval</keyword>
      <keyword>recommender system</keyword>
      <keyword>Web mining</keyword>
      <keyword>semantic Web</keyword>
      <keyword>data stream mining</keyword>
      <p>AxIS leads research in the area of Information Systems (ISs) with a special interest for evolving ISs such as Web based-information Systems. Our ultimate goal is to improve the overall quality of ISs, to support designers during the design process and to ensure ease of use to end users. We
      are convinced that to reach this goal, according to the constant evolution of web based ISs, it is necessary to anticipate the usage and the maintenance very early in the design process. Four main applicative objectives are then addressed by the team:</p>
      <simplelist>
        <li id="uid5">
          <p>supporting the design, validation/evaluation, maintenance, of evolving ISs (cf. section 
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid20" location="intern" xyref="1958661692013"/>);</p>
        </li>
        <li id="uid6">
          <p>developing methods and tools to support both the usage analysis (cf. section 
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid23" location="intern" xyref="1958661692013"/>) and the use of ISs (cf. sections 
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid41" location="intern" xyref="1958661692013"/>);</p>
        </li>
        <li id="uid7">
          <p>developing methods and tools to facilitate the improvement or the re-design of an IS by confrontating static analysis with the usage analysis;</p>
        </li>
        <li id="uid8">
          <p>and finally, at the knowledge level, supporting the knowledge acquisition in designing and evaluating ISs in order to annotate such complex processes and to facilitate the reuse of past experiences.</p>
        </li>
      </simplelist>
      <p>To achieve such objectives, an interdisciplinary approach is necessary and in fact, the AxIS team, which was created in July 2003, regroups people coming from different domains in computer sciences: Artificial Intelligence, Data Mining &amp; Analysis, Software Engineering, all of them
      being involved in the world of XML documents and information systems.</p>
      <p>The research topics related to our objectives are presented in Figure 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid9" location="intern" xyref="1958661692013"/>according to three points of view:</p>
      <object id="uid9">
        <table>
          <tr>
            <td>
              <ressource aux="image_1.png" xylemeAttach="1" media="WEB" xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="Images/2005-figGeneral_eng" type="float" width="140mm" xyref="2450704430027"/>
            </td>
          </tr>
        </table>
        <caption>Global View of AxIS Research Topics</caption>
      </object>
      <simplelist>
        <li id="uid10">
          <p>the structure and content point of view related to the design and the evaluation of static aspects of ISs (architecture, documents),</p>
        </li>
        <li id="uid11">
          <p>the usage point of view related to dynamic aspects of ISs i.e. both the design of support tools (information retrieval support tools, recommender systems), the IS use and then the usage analysis (usage mining).</p>
        </li>
        <li id="uid12">
          <p>the knowledge management point of view related to the capitalization of knowledge and experience in the evaluation process of IS: this concerns the expertise of combining the evaluation results according to different points of view and more generally the KDD
          <footnote id="uid13" anchored="yes" place="foot">KDD: Knowledge Discovery from Databases</footnote>expertise applied on information systems data.</p>
        </li>
      </simplelist>
    </subsection>
  </presentation>
  <fondements id="uid14">
    <bodyTitle>Scientific Foundations</bodyTitle>
    <subsection level="1" id="uid15">
      <bodyTitle>Introduction</bodyTitle>
      <p>This section details the questions that we want to answer to:</p>
      <simplelist>
        <li id="uid16">
          <p>How to support the semantics specification and the design of hypertext information systems (cf. section 
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid20" location="intern" xyref="1958661692013"/>)?</p>
        </li>
        <li id="uid17">
          <p>How to evaluate information systems by applying KDD technics on usage data (cf. section 
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid24" location="intern" xyref="1958661692013"/>)?</p>
        </li>
        <li id="uid18">
          <p>How to synthesize and exhibit information by applying KDD technics on documents (cf. section 
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid40" location="intern" xyref="1958661692013"/>)?</p>
        </li>
        <li id="uid19">
          <p>How to support users in their information retrieval task and how to design information systems supporting the evolution of user practices (cf. section 
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid41" location="intern" xyref="1958661692013"/>)?</p>
        </li>
      </simplelist>
      <p>The second and third questions concern ``informatio systems data mining''.</p>
    </subsection>
    <subsection level="1" id="uid20">
      <bodyTitle>Semantics and Design of Hypertext Information Systems</bodyTitle>
      <keyword>semantics</keyword>
      <keyword>formal semantics</keyword>
      <keyword>semantic Web</keyword>
      <keyword>semantics checking</keyword>
      <keyword>information system design</keyword>
      <p>Designing and maintaining hypertext information systems, such as Web sites, is a real challenge. On the Web, it is much easier to find inconsistent pieces of information than a well structured site. Our goal is to study and build tools to support the design, development and maintenance of
      complex but coherent sites. Our approach is multi-disciplinary, involving Software Engineering and Artificial Intelligence techniques. There is a strong relation between structured documents (such as Web sites) and a program; the Web is a good candidate to experiment with some of the
      technologies that have been developed in software engineering.</p>
      <p>Most of the efforts deployed in the Web domain are related to languages for documents presentation (HTML, CSS, XSL) and structure (XML), to Web sites modeling and Web services (UML), but not to the formal semantics of Web sites to support their quality and evolution. The initiative led by
      the W3C consortium on Semantic Web (XML, RDF, RDF Schema) and ontologies aims at a different objective related to resource discovery. The term ``semantics'' has at least two significations:</p>
      <simplelist>
        <li id="uid21">
          <p>the meaning of words and texts,</p>
        </li>
        <li id="uid22">
          <p>the study of propositions in a deductive theory.</p>
        </li>
      </simplelist>
      <p>To address the first definition of the word semantics, we use taggers, thesaurus, ontologies, to go deeper into the semantics of plain text.</p>
      <p>But we are especially interested with the latter definition, trying to give a formal semantics to Web sites.</p>
      <p>We distinguish between the static aspects of a site that may involve a set of global constraints (not only syntactic, but also semantic and context dependent) to be verified, and the dynamic aspects. Dynamic aspects formalize the navigation in a Web site which also needs to be specified
      and validated (cf. the execution of a program).</p>
      <p>Our approach is related to the Semantic Web but yet different. The main goal of the Semantic Web is to ease computer-based information retrieval, formalizing data that is mostly textual, for further discovery. We are concerned in the first place by the way Web sites are designed and
      constructed, taking into account their semantics, development and evolution. In this respect we are closer to what is called 
      <i>content management</i>and we would like to check if a particular Web site does follow a predefined specification. We use approaches and techniques based on logic programming and formal semantics of programming languages, in particular operational semantics.</p>
    </subsection>
    <subsection level="1" id="uid23">
      <bodyTitle>Information Systems Data Mining</bodyTitle>
      <keyword>usage mining</keyword>
      <keyword>content mining</keyword>
      <keyword>structure mining</keyword>
      <keyword>document mining</keyword>
      <keyword>user behaviour</keyword>
      <keyword>data warehouse</keyword>
      <keyword>data mining</keyword>
      <subsection level="2" id="uid24">
        <bodyTitle>Usage Mining</bodyTitle>
        <p>The main motivations of usage mining in the context of ISs or search engines are double :</p>
        <simplelist>
          <li id="uid25">
            <p>supporting the re-design process of ISs or search engines by a better understanding of the user practices and by comparing the structure of the IS with the results of the usage analysis;</p>
          </li>
          <li id="uid26">
            <p>supporting the information retrieval by reusing the practices of user groups, what is called ``collaborative filtering'' via the design of adaptive recommender systems or ISs (cf. section 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid41" location="intern" xyref="1958661692013"/>).</p>
          </li>
        </simplelist>
        <p>Usage mining correponds to data mining (or more generally to KDD) applied to usage data. By usage data, we mean the traces of user behaviours in log files.</p>
        <p noindent="true">Let us consider the KDD process represented by Fig. 2.</p>
        <p>This process is made of four main steps:</p>
        <orderedlist>
          <li id="uid27">
            <p><b>data selection</b>aims at extraction from the database or datawarehouse the information needed by the data mining step.</p>
          </li>
          <li id="uid28">
            <p><b>data transformation</b>will then use parsers in order to create data tables which can be used by the data mining algorithms.</p>
          </li>
          <li id="uid29">
            <p><b>data mining</b>techniques range from sequential patterns to association rules or cluster discovery.</p>
          </li>
          <li id="uid30">
            <p>finally the last step will allow the 
            <b>re-use of the obtained</b>results into a usage 
            <b>analysis</b>process.</p>
          </li>
        </orderedlist>
        <object id="uid31">
          <table>
            <tr>
              <td>
                <ressource aux="image_2.png" xylemeAttach="2" media="WEB" xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="Images/ECD-eng" type="float" width="10.5cm" xyref="1445430006014"/>
              </td>
            </tr>
          </table>
          <caption>Steps of the KDD Process</caption>
        </object>
        <p>Let us zoom on five following research topics involved in the first third steps:</p>
        <subsection level="3" id="uid32">
          <bodyTitle>Data selection and transformation</bodyTitle>
          <p>We insist on the importance of the pre-processing step in the KDD process composed of selection and transformation sub-steps.</p>
          <p>The considered KDD methods applied on usage data will rely on the notion of user session, represented through a tabular model (items), an association rules model (itemsets) or a graph model. This notion of session enables us to act in the appropriate level during the process of
          knowledge extraction from log files. Our goal is to build summaries and generate statistics on these summaries. At this level of formalization we can consider rules and graphs, define hierarchical structures on variables, extract sequences and thus build new types of data by using KDD
          methods.</p>
          <p>Actually, as the analysis methods come from various research fields (data analysis, statistics, data mining, AI., ...), a data transformation from input to output is needed and will be managed by the parsers. The input data will come from databases or from standard formatted file (XML)
          or a private format.</p>
        </subsection>
        <subsection level="3" id="uid33">
          <bodyTitle>Data mining: extracting association rules</bodyTitle>
          <p>Our preprocessing tools (or generalization operators) given in the previous paragraph were designed to build summaries and also generate statistics on these summaries. At this level of formalization we can consider rules and graphs, define hierarchical structures on variables, extract
          sequences and thus build new types of data by using methods for extracting frequent itemsets or association rules.</p>
          <p>These methods were first presented in 1993 by R. Agrawal, T. Imielinski and A. Swami (researchers in databases at the IBM research center, Almaden). They are available in market software for data mining (IBM's intelligent miner or SAS's enterprise miner).</p>
          <p>Our approach will rely on work coming from the field of generalization operators and data aggregation. These summaries can be integrated in a recommendation mechanism for the user help. We propose to adapt frequent itemset research methods or association rules discovery methods to the
          Web Usage Mining problem. We may get inspired by methods coming from the genomist methods (which present common characteristics with our field). If the goal of the analysis can be written in a decisional framework then the clustering methods will identify usage groups based on the
          extracted rules.</p>
        </subsection>
        <subsection level="3" id="uid34">
          <bodyTitle>Data mining: discovering sequential patterns</bodyTitle>
          <p>Knowing the user can be based on sequential pattern (which are inter transactions patterns) discovery. Sequential patterns offer a strong correlation with Web Usage Mining (and more generally with usage analysis problems) purposes. Our goal is to provide extraction methods which are as
          efficient as possible, and also to improve the relevance of their results. For this purpose, we plan to enhance the sequential pattern extraction methods by taking into account the context where those methods are involved. This can be done:</p>
          <simplelist>
            <li id="uid35">
              <p>First of all by analyzing the causes of a sequential pattern extraction failure on large access logs. It is necessary to understand and incorporate the great variety of potential behaviours on a Web site. This variety is mainly due to the large size of the trees representing the
              Web sites and the very large number of combination of navigations on those sites.</p>
            </li>
            <li id="uid36">
              <p>It is also necessary to incorporate all the available information related to the usage. Taking into account several information sources in a single sequential pattern extraction process is a challenge and can lead to numerous opportunities.</p>
            </li>
            <li id="uid37">
              <p>Finally, sequential pattern mining methods will have to get adapted to a new and growing domain: data streams. In fact, in numerous practical cases, data cannot be stored more than a specified time (and even not at all). Data mining methods will have to provide solution in order to
              respect the specific constraints related to this domain (no multiple scan over the data, no blocking actions, etc.).</p>
            </li>
          </simplelist>
        </subsection>
        <subsection level="3" id="uid38">
          <bodyTitle>Data mining: clustering approach to reduce the volume of data in data warehouses</bodyTitle>
          <p>Clustering is one of the most popular technique in knowledge acquisition and it is applied in various fields including data mining and statistical data analysis. This task organizes a set of individuals into clusters in such a way that individual within a given cluster have a high
          degree of similarity, while individuals belonging to different clusters have a high degree of dissimilarity.</p>
          <p>The definition of 'homogeneous' cluster depends on a particular algorithm: this is indeed a simple structure, which, in the absence of a priori knowledge about the multidimensional shape of the data, may be a reasonable starting point towards the discovery of richer and more complex
          structures</p>
          <p>Clustering methods reduce the volume of data in data warehouses, preserving the possibility to perform needed analysis. The rapid accumulation of large databases of increasing complexity poses a number of new problems that traditional algorithms are not equipped to address. One
          important feature of modern data collection is the ever increasing size of a typical database: it is not so unusual to work with databases containing from a few thousands to a few millions of individuals and hundreds or thousands of variables. Now, most clustering algorithms of the
          traditional type are severely limited regarding the number of individuals they can comfortably handle.</p>
          <p>Cluster analysis may be divided into hierarchical and partitioning methods. Hierarchical methods yield complete hierarchy, i.e., a nested sequence of partitions of the input data. Hierarchical methods can be agglomerative or divisive. Agglomerative methods yield a sequence of nested
          partitions starting with the trivial clustering in which each individual is in a unique cluster and ending with the trivial clustering in which all individuals are in the same cluster. A divisive method starts with all individuals in a single cluster and performs splitting until a
          stopping criterion is met. Partitioning methods aim at obtaining a partition of the set of individuals into a fixed number of clusters. These methods identify the partition that optimizes (usually locally) an adequacy criterion.</p>
        </subsection>
        <subsection level="3" id="uid39">
          <bodyTitle>Data mining: reusing usage analysis experiences</bodyTitle>
          <p>This topic aims at re-using previous analysis results into current analysis: in the short run we will work on an incremental approach of the discovery of sequential motives; in the longer run our approach will be based upon case-based reasoning. Nowadays very fast algorithms have been
          developed which efficiently search for dependences between attributes (research algorithms with association rules), or dependences between behaviours (research algorithms with sequential motives) within large databases.</p>
          <p>Unfortunately, even though these algorithms are very efficient, and depending on the size of the database, it can sometimes take up to several days to retrieve relevant and useful information. Furthermore, the variation of parameters provided to the user requires to re-start the
          algorithms without taking previous results into account. Similarly, when new data is added or suppressed from the base, it is often necessary to re-start the retrieval process to maintain the extracted knowledge.</p>
          <p>Considering the size of the handled data, it is essential to propose both an interactive (parameters variation) and incremental (data variation in the base) approach in order to rapidly meet the needs of the end user.</p>
          <p>This problematic is currently considered as an open research problem within the framework of Data Mining; and even though a few solutions exist, they are not quite satisfactory because they only provide a partial solution to the problem.</p>
        </subsection>
      </subsection>
      <subsection level="2" id="uid40">
        <bodyTitle>Content and Structure Document Mining</bodyTitle>
        <keyword>document mining</keyword>
        <keyword>clustering</keyword>
        <keyword>classification</keyword>
        <p>With the increasing amount of available information, sophisticated tools for supporting users in finding useful information are needed. In addition to tools for retrieving relevant documents, there is a need for tools that synthesize and exhibit information that is not explicitly
        contained in the document collection, using document mining techniques. Document mining objectives include extracting structured information from rough text.</p>
        <p noindent="true">The involved techniques from the KDD process are thus mainly clustering and classification. Our goal is to explore the possibilities of those techniques for document mining such as described below.</p>
        <p>Classification aims at associating documents to one or several predefined categories, while the objective of clustering is to identify emerging classes that are not known in advance. Traditional approaches for document classification and clustering rely on various statistical models, and
        representation of documents are mostly based on bags of words.</p>
        <p>Recently much attention has been drawn towards using the structure of XML documents to improve information retrieval, classification and clustering, and more generally information mining. In the last four years, the INEX (Initiative for the Evaluation of XML retrieval) has focused on
        system performance in retrieving elements of documents rather than full documents and evaluated the benefits for end users. Other works are interested in clustering large collections of documents using representations of documents that involve both the structure and the content of
        documents, or the structure only (
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid0" location="biblio" xyref="1958661692013"/>, 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid1" location="biblio" xyref="1958661692013"/>, 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid2" location="biblio" xyref="1958661692013"/>, 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid3" location="biblio" xyref="1958661692013"/>).</p>
        <p>Approaches for combining structure and text range from adding a flat representation of the structure to the classical vector space model or combining different classifiers for different tags or media, to defining a more complex structured vector models 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid4" location="biblio" xyref="1958661692013"/>, possibly involving attributes and links.</p>
        <p>When using the structure only, the objective is generally to organize large and heterogeneous collections of documents into smaller collections (clusters) that can be stored and searched more effectively. Part of the objective is to identify substructures that characterize the documents
        in a cluster and to build a representative of the cluster 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid5" location="biblio" xyref="1958661692013"/>, possibly a schema or a DTD.</p>
        <p>Since XML documents are represented as trees, the problem of clustering XML documents is the same as clustering trees. One can identify two main approaches: 1) identify frequent common sub-patterns between trees and group together documents that share the same patterns; 2) define a
        similarity measure between trees that can be used with a standard clustering algorithm. A possible distance can be calculated by associating a cost function to the edit distance between two trees. However, it is well known that algorithms working on trees have complexity issues. Therefore
        some models replace the original trees by structural summaries or s-graphs that only retain the intrinsic structure of the tree: for example, reducing a list of elements to a single element, flattening recursive structures, etc.</p>
        <p>A common drawback of those approaches above is that they reduce documents to their intrinsic patterns (sub-patterns, or summaries) and do not take into account an important characteristic of XML documents, - the notion of list of elements and more precisely the number of elements in
        those lists. While it may be fine for clustering heterogeneous collection, suppressing lists of elements may result in losing document properties that could be interesting for other types of XML mining.</p>
      </subsection>
    </subsection>
    <subsection level="1" id="uid41">
      <bodyTitle>Supporting Information Retrieval with adaptive recommender systems</bodyTitle>
      <keyword>recommender system</keyword>
      <keyword>personalization</keyword>
      <keyword>collaborative filtering</keyword>
      <keyword>hypermedia</keyword>
      <keyword>user profile</keyword>
      <keyword>KDD</keyword>
      <keyword>CBR</keyword>
      <keyword>case-based reasoning</keyword>
      <keyword>experience management</keyword>
      <keyword>reuse of past experiences</keyword>
      <keyword>social navigation</keyword>
      <keyword>search engine</keyword>
      <keyword>search access</keyword>
      <keyword>indexing</keyword>
      <keyword>user behaviour</keyword>
      <p>We think that information retrieval support tools as recommender systems are very useful in very large information systems. The objective of a recommender system is to help system users to make their choices in a field where they have little information for sorting and evaluating the
      possible alternatives 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid6" location="biblio" xyref="1958661692013"/>, 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid7" location="biblio" xyref="1958661692013"/>, 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid8" location="biblio" xyref="1958661692013"/>.</p>
      <p>A recommender system can be divided into three basic entities (cf Figure 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid42" location="intern" xyref="1958661692013"/>): the group of recommendations producer agents, the module of recommendation computation and the group of
      recommendations consumers.</p>
      <object id="uid42">
        <table>
          <tr>
            <td>
              <ressource aux="image_3.png" xylemeAttach="3" media="WEB" xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="Images/picture-rec" type="float" width="8.25cm" xyref="1769428481010"/>
            </td>
          </tr>
        </table>
        <caption>Architecture of a Recommender System</caption>
      </object>
      <p>A major challenge in the field of recommender systems design is the following: How to produce adaptive recommendations of high quality minimizing the effort of producers and the consumers?</p>
      <p>Two main complementary approaches are proposed in the literature:</p>
      <orderedlist>
        <li id="uid43">
          <p>approaches based on the content and the machine learning of user profiles and</p>
        </li>
        <li id="uid44">
          <p>approaches known as a collaborative filtering based on data mining techniques.</p>
        </li>
      </orderedlist>
      <p>The user profile is a structure of data that describes user's centers of interest in the space of the objects which can be recommended. The user profile is a structure built in the first approach or specified by the user in the second approach.</p>
      <p>The user profile is used either to filter available objects (content-based filtering), or to recommend to a user something that satisfied previous users with a similar profile (collaborative filtering) 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid7" location="biblio" xyref="1958661692013"/>.</p>
      <p>In the Axis project, we continue the development of a hybrid approach for recommendations based on the analysis of visited content and on collaborative filtering; The past behaviours of a user group are used to calculate the recommendations (collaborative filtering). Like this this
      approach is able to support some usage evolutions without a complete re-design.Also the usage analysis of such recommender systems may be very useful to support designers in an possible re-design or improvment of their IS.</p>
      <p>Approaches based on data mining are mainly statistical approaches where the sequence of events in the history is not taken into account for the calculation of recommendations. There are some early examples in the field of navigation assistance on the Web: the FootPrints system 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid9" location="biblio" xyref="1958661692013"/>and the system of Yan et al. 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid10" location="biblio" xyref="1958661692013"/>.</p>
      <p>The implementation challenges of our approach relate to the following aspects:</p>
      <simplelist>
        <li id="uid45">
          <p>providing techniques of identification and extraction of relevant behaviours (i.e. the learning behaviours or case behaviours) starting from raw data of past behaviours,</p>
        </li>
        <li id="uid46">
          <p>defining methods and measures of similarities between behaviours,</p>
        </li>
        <li id="uid47">
          <p>defining inference techniques of adaptive recommendations starting from the identified relevant past behaviours (or starting from the reminded cases).</p>
        </li>
      </simplelist>
      <p>We study the class of recommender systems, based on the re-use of a user group's past experiences, using case based reasoning techniques (CBR).</p>
      <p>Let us remind what is 
      <b>Case-Based Reasoning (CBR)</b>. It is a problem solving paradigm based on the reuse by analogy of past experiences, called ``cases''. In order to be found, a case is generally indexed according to certain relevant and discriminating characteristics, called ``indices''; these indices
      determine in which situation (or context) a case can be re-used.</p>
      <p>Case-Based Reasoning 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid11" location="biblio" xyref="1958661692013"/>usually breaks up into four principal phases:</p>
      <orderedlist>
        <li id="uid48">
          <p>a ``retrieve'' phase for cases having similarities (i.e. similar indices) with the current problem,</p>
        </li>
        <li id="uid49">
          <p>a ``re-use'' phase where a solution to the current problem is built, based on cases identified in the previous phase,</p>
        </li>
        <li id="uid50">
          <p>a ``revise'' phase where the solution may be refined with an evaluation process,</p>
        </li>
        <li id="uid51">
          <p>a ``retain'' phase that updates the elements of the reasoning by taking into account the experiment which has been just carried out and which could thus be used for future reasoning.</p>
        </li>
      </orderedlist>
      <p>Difficult problems in CBR are related to: definition and representation of a case, organization of the database containing the cases, various used indexing methods and definition of ``good'' similarities measurements for the case search, link between the steps research and adaptation (the
      best retrieved case being the most easily adaptable case), definition of an adaptation strategy starting with the found case(s), training of new indices, etc.</p>
      <p>We focus on two types of recommender systems:</p>
      <simplelist>
        <li id="uid52">
          <p>systems where the calculation of recommendations is based on the re-use of an users group's experiences in searching for information in a hypertext information system like the Web or on an Internet/Intranet site. These systems aim at an adaptive assistance to the search for information
          activity ;</p>
        </li>
        <li id="uid53">
          <p>systems where the calculation of recommendations is based on the re-use of past experiences of experts, in order to provide an assistance to the design process.</p>
        </li>
      </simplelist>
      <p>We explore all three problems previously described by using case-based reasoning (CBR) techniques and more generally KDD techniques.</p>
      <p noindent="true">We pursue the evaluation of our results in CBR, in particular the indexing model by behavioral situation, the object-oriented framework CBR*Tools and toolbox Broadway*Tools via our current contracts (cf. section 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid142" location="intern" xyref="1958661692013"/>). Moreover, we pursue the study of sessions indexing techniques and plan to use some sequential pattern extraction
      and clustering algorithms for the on-line and off-line analysis of the Web users usage.</p>
    </subsection>
  </fondements>
  <domaine id="uid54">
    <bodyTitle>Application Domains</bodyTitle>
    <subsection level="1" id="uid55">
      <bodyTitle>Panorama overview</bodyTitle>
      <keyword>Telecommunications e-CRM</keyword>
      <keyword>e-business</keyword>
      <keyword>e-marketing</keyword>
      <keyword>adaptive interface</keyword>
      <keyword>adaptive service personalization</keyword>
      <keyword>information retrieval</keyword>
      <keyword>web usage mining</keyword>
      <keyword>web design</keyword>
      <keyword>Education</keyword>
      <keyword>Transportation</keyword>
      <keyword>Life Sciences</keyword>
      <keyword>Aeronautics</keyword>
      <keyword>Health</keyword>
      <keyword>Engineering</keyword>
      <keyword>Environment</keyword>
      <p>The project explores any applicative field on design, evaluation and improvement of a huge hypermedia information systems, for which end-users are of primary concern. We currently focus on web-based information systems (internet, intranet), or parts of such ISs, offering one of the
      following characteristics:</p>
      <orderedlist>
        <li id="uid56">
          <p>presence or wanted integration of services of assistance in the collaborative search of information and personalization (ranking, filtering, addition of links, etc.);</p>
        </li>
        <li id="uid57">
          <p>frequent evolution of the content (information, ontology), generating many maintenance problems, for example:</p>
          <simplelist>
            <li id="uid58">
              <p>a web-based IS containing information about the activities of a group of people, for example an institute (Inria), a company, a scientific community, an European network on the internet or intranet, etc.</p>
            </li>
            <li id="uid59">
              <p>a web-based IS indexing a wide range of productions (documents, products) resulting from the Web or a company, according to a thematic criteria, eg. the search engines (Yahoo, Voila), the internet guides for specific targets (FT Educado) or portals (scientific communities).</p>
            </li>
          </simplelist>
        </li>
        <li id="uid60">
          <p>interpretation of the user satisfaction (according to the designer point of view) or explicit user satisfaction, as it is the case for example for business sites, e-learning sites, and also for search engines.</p>
        </li>
      </orderedlist>
      <p>In summary, our fields of interest are the following:</p>
      <simplelist>
        <li id="uid61">
          <p>semantic specification and checking of an information system,</p>
        </li>
        <li id="uid62">
          <p>usage analysis of an information system (internet, intranet),</p>
        </li>
        <li id="uid63">
          <p>document mining (XML documents, texts, Web pages)</p>
        </li>
        <li id="uid64">
          <p>re-designing of an information system based on usage analysis,</p>
        </li>
        <li id="uid65">
          <p>adaptive recommender systems for supporting information retrieval, Collaborative search of Information on the internet.</p>
        </li>
      </simplelist>
      <p>Ultimately, it should be noted that other fields (Life Science, health, transports, etc.) may be subject to the study since they provide an experimental framework for the validation of our research work in KDD, and in the reuse of experiences in story management: this type of approach may
      be relevant in applications that are badly solved in automatic of control type (e.g. nutrition of plants under greenhouses, control in robotics).</p>
    </subsection>
  </domaine>
  <logiciels id="uid66">
    <bodyTitle>Software</bodyTitle>
    <subsection level="1" id="uid67">
      <bodyTitle>Introduction</bodyTitle>
      <p>AxIS has developed several packages 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-sop.inria.fr/axis/software.html" location="extern" xyref="4092803861005">http://www-sop.inria.fr/axis/software.html</ref>:</p>
      <simplelist>
        <li id="uid68">
          <p>for classification and clustering : SODAS 2 Softawre (CF. section 
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid70" location="intern" xyref="1958661692013"/>), Clustering Toolbox (cf. section 
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid71" location="intern" xyref="1958661692013"/>),</p>
        </li>
        <li id="uid69">
          <p>as well as frameworks for Case-Based Reasoning (cf. CBR*Tools section 
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid75" location="intern" xyref="1958661692013"/>) and Recommender systems (cf. section 
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid76" location="intern" xyref="1958661692013"/>).</p>
        </li>
      </simplelist>
    </subsection>
    <subsection level="1" id="uid70">
      <bodyTitle>SODAS 2 Software</bodyTitle>
      <participants category="None">
        <person key="axis-2005-id18098">
          <firstname>Yves</firstname>
          <lastname>Lechevallier</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
        <person key="axis-2005-id18244">
          <firstname>Marc</firstname>
          <lastname>Csernel</lastname>
        </person>
      </participants>
      <p>The ASSO project designs methods, methodology and software tools for extracting knowledge from multidimensional complex data.</p>
      <p>The SODAS 2 Software 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid12" location="biblio" xyref="1958661692013"/>is the result of the European project called ``ASSO''(Analysis System of Symbolic Official data), that started in
      January 2001 for 36 monthsXS. It supports the analysis of multidimensional complex data (numerical and non numerical) coming from databases mainly in satistical offices and administration using Symbolic Data Analysis 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid13" location="biblio" xyref="1958661692013"/>.</p>
      <p>SODAS 2 is an improved version of the SODAS software developed in the previous SODAS project, following users' requests. This new software is more operational and attractive. It proposes innovative methods and demonstrates that the underlying techniques meet the needs of statistical
      offices. It uses the SOM library 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid14" location="biblio" xyref="1958661692013"/>.</p>
      <p>SODAS allows for the analysis of summarised data, called Symbolic Data. This software is now in the registration process at APP. The latest executive version (version 2.50) of the SODAS 2 software, with its user manual (PDF format), can be downloaded at 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.info.fundp.ac.be/asso/" location="extern" xyref="1701844304026">http://www.info.fundp.ac.be/asso/sodaslink.htm</ref></p>
    </subsection>
    <subsection level="1" id="uid71">
      <bodyTitle>Clustering Toolbox and Classification Software</bodyTitle>
      <participants category="None">
        <person key="axis-2005-id18244">
          <firstname>Marc</firstname>
          <lastname>Csernel</lastname>
        </person>
        <person key="axis-2005-id18372">
          <firstname>Sergiu</firstname>
          <lastname>Chelcea</lastname>
        </person>
        <person key="PASUSERID">
          <firstname>Francesco</firstname>
          <lastname>de Carvalho</lastname>
        </person>
        <person key="axis-2005-id18308">
          <firstname>Aicha</firstname>
          <lastname>El Golli</lastname>
        </person>
        <person key="axis-2005-id18273">
          <firstname>Brieuc</firstname>
          <lastname>Conan-Guez</lastname>
        </person>
        <person key="axis-2005-id18293">
          <firstname>Mihai</firstname>
          <lastname>Jurca</lastname>
        </person>
        <person key="axis-2005-id18098">
          <firstname>Yves</firstname>
          <lastname>Lechevallier</lastname>
          <moreinfo>co-correspondant</moreinfo>
        </person>
        <person key="axis-2005-id18078">
          <firstname>Brigitte</firstname>
          <lastname>Trousse</lastname>
          <moreinfo>co-correspondant</moreinfo>
        </person>
      </participants>
      <p>For clustering, we maintained a clustering toolbox, written in C++ and Java, which groups clustering methods developed by the team over time, and uses the SOM library developed by M. Csernel. This library proposes a common data interface to every algorithm. This toolbox supports
      developers in integrating various classification methods and testing and comparing with other methods. Now it integrates various methods:</p>
      <simplelist>
        <li id="uid72">
          <p>from AxIS Rocquencourt: 1) a partitionning clustering method on complex data tables called SCluster 
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid12" location="biblio" xyref="1958661692013"/>, 2) an adapted version of the SOM on the dissimilarity tables called DSOM 
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid15" location="biblio" xyref="1958661692013"/>(cf. section 
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid107" location="intern" xyref="1958661692013"/>) and Div (in C++) 
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid16" location="biblio" xyref="1958661692013"/>;</p>
        </li>
        <li id="uid73">
          <p>two partitionning clustering methods on the dissimilarity tables: 1) CDis (in C++) 
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid12" location="biblio" xyref="1958661692013"/>issued from a collaboration between AxIS Rocquencourt team and Recife University, Brazil and 2) CCClust (in C++)
          issued from a collaboration between AxIS Rocquencourt team and Recife University, Brazil;</p>
        </li>
        <li id="uid74">
          <p>2-3 AHC (in Java)
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid17" location="biblio" xyref="1958661692013"/>(cf. section 
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid112" location="intern" xyref="1958661692013"/>) from AxIS Sophia Antipolis.</p>
        </li>
      </simplelist>
      <p>We developed a Web interface for this clustering toolbox for the following methods: SCluster, Div, Cdis, CCClust. 2-3 AHC is available as a Java applet which runs the 
      <span align="left" class="smallcap">hierarchies visualisation toolbox</span>. The aim of this online interface is in a short term to allow other team members (and in the near future Internet users) to use these classification methods to process their own data via the Web. The Web interface is
      developed in C++, run on our Apache internal Web server.</p>
      <p>For classification of functional data, we developed a functional Multi-Layer Perceptron Method called FNET (cf. section 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid108" location="intern" xyref="1958661692013"/>).</p>
    </subsection>
    <subsection level="1" id="uid75">
      <bodyTitle>CBR*Tools</bodyTitle>
      <participants category="None">
        <person key="axis-2005-id18372">
          <firstname>Sergiu</firstname>
          <lastname>Chelcea</lastname>
        </person>
        <person key="axis-2005-id18293">
          <firstname>Mihai</firstname>
          <lastname>Jurca</lastname>
        </person>
        <person key="axis-2005-id18078">
          <firstname>Brigitte</firstname>
          <lastname>Trousse</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
      </participants>
      <p>CBR*Tools is an object-oriented framework 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid18" location="biblio" xyref="1958661692013"/>, 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid19" location="biblio" xyref="1958661692013"/>for Case-Based Reasoning which is specified with the UMT notation (Rational Rose) and written in Java. It offers a
      set of abstract classes to models the main concepts necessary to develop applications integrating case-based reasoning techniques: case, case base, index, measurements of similarity, reasoning control. It also offers a set of concrete classes which implements many traditional methods (closest
      neighbors indexing, Kd-tree indexing 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid20" location="biblio" xyref="1958661692013"/>, prototypes indexing 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid21" location="biblio" xyref="1958661692013"/>, neuronal approach based indexing, standards similarities measurements). CBR*Tools currently contains more than 240
      classes divided in two main categories: the core package for basic functionality and the time package for the specific management of the behavioral situations. The programming of a new application is done by specialization of existing classes, objects aggregation or by using the parameters of
      the existing classes.</p>
      <p>CBR*Tools aims application fields where the re-use of cases indexed by behavioral situations is required. The CBR*Tools framework was evaluated via the design and the implementation of five applications (Broadway-Web, educaid, BeCKB, Broadway-Predict, 
      <span align="left" class="smallcap">CASA</span>and 
      <span align="left" class="smallcap">RA2001</span>). We showed that, for each application, the thorough expertise necessary to use CBR*Tools relates to only 20% to 40% of the hot spots thus validating the assistance brought by our platform on design as well as on the implementation, thanks to
      the re-use of its abstract architecture and its components (index, similarity).</p>
      <p>CBR*Tools is concerned by our two current contracts: EPIA (cf. section 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid143" location="intern" xyref="1958661692013"/>) and MobiVip (cf. section 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid147" location="intern" xyref="1958661692013"/>).</p>
      <p>CBR*Tools is planned to be available in 2006 for research, teaching and academic purpose under the INRIA license. The user manual can be downloaded at the URL: 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-sop.inria.fr/axis/cbrtools/manual/" location="extern" xyref="318003096012">http://www-sop.inria.fr/axis/cbrtools/manual/</ref>.</p>
    </subsection>
    <subsection level="1" id="uid76">
      <bodyTitle>Broadway*Tools</bodyTitle>
      <participants category="None">
        <person key="axis-2005-id18293">
          <firstname>Mihai</firstname>
          <lastname>Jurca</lastname>
        </person>
        <person key="axis-2005-id18078">
          <firstname>Brigitte</firstname>
          <lastname>Trousse</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
      </participants>
      <p>Broadway*Tools is a toolbox used to facilitate the creation of adaptive recommendation systems for information retrieval on the Web or in a Internet/intranet information system. This toolbox offers different servers, including a server that calculates recommendations based on the
      observation of the user sessions and on the re-use of user groups' former sessions. A recommender system created with Broadway*tools observes navigations of various users and gather the evaluations and annotations of those users to draw up a list of relevant recommendations (Web documents,
      keywords, etc).</p>
      <p>Different recommender systems have been developed:</p>
      <simplelist>
        <li id="uid77">
          <p>for supporting Web browsing with Broadway-Web,</p>
        </li>
        <li id="uid78">
          <p>for supporting browsing inside a Web-based information system with educaid (France Telecom Lannion - Inria contract), e-behaviour (Color Action, use of the mouse and eye-tracking events),</p>
        </li>
        <li id="uid79">
          <p>for supporting query formulation with Be-CBKB (XRCE-Inria contract), etc.</p>
        </li>
      </simplelist>
      <p>Broadway*Tools concerned our two current contracts: EPIA (cf. section 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid143" location="intern" xyref="1958661692013"/>and MobiVip (cf. section 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid147" location="intern" xyref="1958661692013"/>).</p>
    </subsection>
  </logiciels>
  <resultats id="uid80">
    <bodyTitle>New Results</bodyTitle>
    <subsection level="1" id="uid81">
      <bodyTitle>Introduction</bodyTitle>
      <keyword>KDD</keyword>
      <keyword>preprocessing</keyword>
      <keyword>data transformation</keyword>
      <keyword>metadata</keyword>
      <keyword>knowledge management</keyword>
      <keyword>viewpoint</keyword>
      <keyword>ontology</keyword>
      <keyword>annotation</keyword>
      <keyword>reusability</keyword>
      <keyword>distances</keyword>
      <keyword>dissimilarities</keyword>
      <p>This year we obtained original results as previous years in our three research topics: data transformation and knowledge management, data mining and web usage mining methods. Let us note first results in document mining (cf. the content and structure point of view of an IS) and in data
      stream mining (cf. the usage point of view of an IS).</p>
      <p>In section 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid82" location="intern" xyref="1958661692013"/>, we describe new results on data transformation and knowledge representation. For the latter, we have studied the
      use of metadata (cf. the KM point of view), in particular in two ongoing PhD thesis related semantic web and KDD, conducted by H. Behja and A. Baldé. Metadata have been used or annotating global KDD processes in terms of viewpoints to support the management and the reuse of past KDD
      experiences (cf. section 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid93" location="intern" xyref="1958661692013"/>), 2) for supporting the interpretation of extracted clusters. Moreover this year we have proposed and studied new
      distances and dissimilarities in various applicative contexts: XML Sanskrit documents (section 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid84" location="intern" xyref="1958661692013"/>), tourist itineraries (section 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid85" location="intern" xyref="1958661692013"/>) and Web navigations and content (cf section 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid83" location="intern" xyref="1958661692013"/>).</p>
      <p>On data mining methods (cf. section 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid106" location="intern" xyref="1958661692013"/>), we published new results on self organizing maps (cf. section 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid107" location="intern" xyref="1958661692013"/>), on functional data analysis (cf. section 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid108" location="intern" xyref="1958661692013"/>), on a new partitioning dynamic clustering method (cf. section 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid111" location="intern" xyref="1958661692013"/>) and on an agglomerative 2-3 Hierarchical Clustering in the context of Chelcea'PhD thesis (cf. section 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid112" location="intern" xyref="1958661692013"/>). This year we started a new research topic related to KDD in the context of data streams (cf. section 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid114" location="intern" xyref="1958661692013"/>).</p>
      <p>Finally on information systems data mining, we started this year to work on visualization problems and we proposed different representations of the organization of a web site based on usage data (cf. section 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid122" location="intern" xyref="1958661692013"/>). We also obtained our first results on XML document mining and XML search: we studied content and/or structure
      mining for clustering or classifying XML documents (cf. sections 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid132" location="intern" xyref="1958661692013"/>, 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid133" location="intern" xyref="1958661692013"/>) as well as the improvement of the relevance in XML search (cf. section 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid138" location="intern" xyref="1958661692013"/>). More classically we pursued our researches on intersites web usage mining in the context of the ECML/PKDD 2005
      discovery Challenge (cf. section 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid125" location="intern" xyref="1958661692013"/>) and in extracting dense periods of sequential patterns (cf. section 
      <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid127" location="intern" xyref="1958661692013"/>).</p>
    </subsection>
    <subsection level="1" id="uid82">
      <bodyTitle>Data Transformation and Knowledge Management in KDD</bodyTitle>
      <subsection level="2" id="uid83">
        <bodyTitle>Dissimilarities for Web Usage Mining</bodyTitle>
        <participants category="None">
          <person key="axis-2005-id18259">
            <firstname>Fabrice</firstname>
            <lastname>Rossi</lastname>
          </person>
          <person key="axis-2005-id18451">
            <firstname>Francisco</firstname>
            <lastname>De Carvalho</lastname>
          </person>
          <person key="axis-2005-id18098">
            <firstname>Yves</firstname>
            <lastname>Lechevallier</lastname>
          </person>
          <person key="axis-2005-id18387">
            <firstname>Alzennyr</firstname>
            <lastname>Da Silva</lastname>
          </person>
        </participants>
        <keyword>Dissimilarities</keyword>
        <keyword>Web Usage Mining</keyword>
        <keyword>Clustering</keyword>
        <keyword>Validation</keyword>
        <keyword>Benchmark</keyword>
        <p>Many Web Usage Mining methods rely on clustering algorithms in order to produce homogeneous classes of documents (when the content of the web site is analyzed) and/or of users (when browsing behaviors are analysed). Information extracted from web server logs are complex and noisy, but
        can be used to define usage based dissimilarities between users of the site or between pages of the site. There are however many possibilities to define this type of dissimilarity measure.</p>
        <p>We have defined a benchmark site that allows to compare dissimilarity measures via the clustering results they produce. The benchmark consists in one year of log of the web site of the CIn, the laboratory of Francisco De Carvalho. This site is small (91 pages) and is very well organized.
        This allows to define a meaningful semantic structure and to build an expert partition of its content. Then, this expert partition can be compared to the results of a clustering algorithm applied to the dissimilarity matrix constructed with a specific measure.</p>
        <p>The results that will be published in the EGC 2006 conference show that the Jaccard index and the ``term frequency inverse document frequency'' approach obtain quite good results, whereas the cosine measure performs badly. It seems also that better results could be obtained by taking
        into account the structure of the site together with usage data.</p>
      </subsection>
      <subsection level="2" id="uid84">
        <bodyTitle>Distances for Clustering Homogeneous XML Documents</bodyTitle>
        <participants category="None">
          <person key="axis-2005-id18244">
            <firstname>Marc</firstname>
            <lastname>Csernel</lastname>
          </person>
          <person key="axis-2005-id18372">
            <firstname>Sergiu</firstname>
            <lastname>Chelcea</lastname>
          </person>
          <person key="axis-2005-id18098">
            <firstname>Yves</firstname>
            <lastname>Lechevallier</lastname>
          </person>
          <person key="axis-2005-id18678">
            <firstname>Sattisvar</firstname>
            <lastname>Tandabany</lastname>
          </person>
          <person key="axis-2005-id18078">
            <firstname>Brigitte</firstname>
            <lastname>Trousse</lastname>
          </person>
        </participants>
        <keyword>distance</keyword>
        <keyword>text comparison</keyword>
        <keyword>Sanskrit</keyword>
        <keyword>transliteration</keyword>
        <p>In the context of a research project with India and some others French partners, about a hundred ancient manuscripts written in Sanskrit, all arisen from the same text (the Benares Glose), should be compared in order to make a critical edition and provide some classification between the
        manuscripts (cf. section 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid100" location="intern" xyref="1958661692013"/>).</p>
        <p>During his internship, S. Tandabany developed some tools that were required for clustering homogeneous XML Sanskrit Documents. First, a modified longest common substring algorithm is proposed to deal with Sanskrit characters. Then, as in Sanskrit inversions of characters are not always
        meaningful, a detection of possible inversions is applied. Finally, the Agglomerative 2-3 Hierarchical classification (cf. section 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid112" location="intern" xyref="1958661692013"/>) is used as the classification algorithm. To do this, we proposed a new distance between texts taking into
        account some Sanskrit specificities and allowing the addition of meta-data (worn state and shape of the manuscripts as objects, annotations about words forgotten, etc.). The text is splitted into paragraphs, ``sub-distances'' are computed between each corresponding paragraph, taking into
        account adds, deletions, transformations and inversions. Then, some constraints needed to obtain a distance (triangular inequality) are removed to get a dissimilarity instead of a distance for the 2-3AHC. The impact of these modifications on the classification was analysed. Finally, our
        results are highlighted with some experiments and examples 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid22" location="biblio" xyref="1958661692013"/>.</p>
      </subsection>
      <subsection level="2" id="uid85">
        <bodyTitle>Distances for Clustering Downtown Tourist Itineraries</bodyTitle>
        <participants category="None">
          <person key="axis-2005-id18516">
            <firstname>Rémi</firstname>
            <lastname>Busseuil</lastname>
          </person>
          <person key="axis-2005-id18372">
            <firstname>Sergiu</firstname>
            <lastname>Chelcea</lastname>
          </person>
          <person key="axis-2005-id18078">
            <firstname>Brigitte</firstname>
            <lastname>Trousse</lastname>
          </person>
        </participants>
        <keyword>Tourist itineraries</keyword>
        <keyword>Clustering</keyword>
        <keyword>Distance</keyword>
        <keyword>2-3 AHC</keyword>
        <p>In the context of the MobiVIP project (cf. section 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid147" location="intern" xyref="1958661692013"/>), during Rémi Busseuil's internship we studied the possibility of clustering tourists itineraries in the town
        center (Antibes in this case). Thus, a software for tourist itineraries generation and clustering was developed (in Visual .NET), taking into account not only the geographical characteristics of an itinerary, but also the symbolical ones: street type, buildings type, etc. This new use of
        semantical data, opens new directions for the road itineraries recommendations, by addressing new issues like the purpose of the itinerary or the nature of the crossed areas.</p>
        <p>Clustering itineraries has many advantages besides the possibility of choosing the most suitable one: it is also an analysis and comparison tool. This can have multiple applications: route or destination prediction, traffic anticipation, etc. As clustering algorithm, we used the
        Agglomerative 2-3 Hierarchical Classification (2-3 AHC) algorithm. The 2-3 AHC has the advantage of being easily visualized compared to a classical clustering method.</p>
        <p>In order to compare different itineraries, we basically divided each itinerary into fragments and then we computed a distance/dissimilarity value using the Longest Common Subsequence algorithm (LCS) and a spread function developed in 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid22" location="biblio" xyref="1958661692013"/>. Different ways of defining the dissimilarity and of comparing the fragment were tested.</p>
        <p>An example of clustering 40 itineraries issued from 4 different profession types is presented in Figure 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid86" location="intern" xyref="1958661692013"/>bellow.</p>
        <object id="uid86">
          <table>
            <tr>
              <td>
                <ressource aux="image_4.png" xylemeAttach="4" media="WEB" xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="Images/2005-23ahc_trajets-2" type="float" scale="0.3" xyref="1525765019005"/>
              </td>
            </tr>
          </table>
          <caption>2-3 AHC classification on 40 itineraries</caption>
        </object>
      </subsection>
      <subsection level="2" id="uid87">
        <bodyTitle>Semantics Tools for XML documents</bodyTitle>
        <participants category="None">
          <person key="axis-2005-id18152">
            <firstname>Thierry</firstname>
            <lastname>Despeyroux</lastname>
          </person>
        </participants>
        <p>The main goal of the Semantic Web is to ease a computer-based data mining and discovery, formalizing data that is mostly textual. Our approach is different as we are concerned in the way Web sites are constructed, taking into account their development and their semantics. In this respect
        we are closer to what is called content management.</p>
        <p>Our formal approach is based on the analogy between Web sites and programs when there are represented as terms, although differences between Web sites and programs can be pointed out :</p>
        <simplelist>
          <li id="uid88">
            <p>Web sites may be spread along a great number of files.</p>
          </li>
          <li id="uid89">
            <p>Information is scattered, with many forward references.</p>
          </li>
          <li id="uid90">
            <p>We may need to use external resources to define the static semantics (thesaurus, ontologies, taggers, image analysis program, etc.).</p>
          </li>
        </simplelist>
        <p>We are developing a specification language to express global constraints in Web sites or in a collection of XML documents in an operational way.</p>
        <p>An initial version of this language as been described in 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid23" location="biblio" xyref="1958661692013"/>, together with its application to a real sized collection of documents: the Inria scientific activity report for
        the years 2001 and 2001.</p>
        <p>The language and its implementation has been developped and improved in 2005, in particular for efficiency. At the same time our XML core parser has been extended to allow parsing of HXTML documents.</p>
        <p>The same language has been used to extract information in XML documents. This has been the case to choose and extract words from different part of XML documents. These words was first passed to a tagger, then used to cluster the different documents. A first experiment has been done in
        2004 and has been presented to the EG2005 conference 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid24" location="biblio" xyref="1958661692013"/>, 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid25" location="biblio" xyref="1958661692013"/>(cf. section 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid132" location="intern" xyref="1958661692013"/>).</p>
        <p>In a more long term experiment, we have initiated a regular monitoring of the Inria activity reports to see how the number of bad URLs in these reports evoluates. This monitoring, started in december 2004 and then performed every two weeks, takes into account the activity report for
        2002, 2003 and 2004.</p>
      </subsection>
      <subsection level="2" id="uid91">
        <bodyTitle>Metadata Extraction for Supporting the Interpretation of Clusters</bodyTitle>
        <participants category="None">
          <person key="axis-2005-id18343">
            <firstname>Abdourahamane</firstname>
            <lastname>Baldé</lastname>
          </person>
          <person key="axis-2005-id18098">
            <firstname>Yves</firstname>
            <lastname>Lechevallier</lastname>
          </person>
          <person key="axis-2005-id18078">
            <firstname>Brigitte</firstname>
            <lastname>Trousse</lastname>
          </person>
        </participants>
        <keyword>metadata</keyword>
        <keyword>XQuery</keyword>
        <keyword>clustering's interpreting</keyword>
        <keyword>RDF</keyword>
        <keyword>Dublin Core</keyword>
        <keyword>PMML</keyword>
        <p>This work was conducted in the context of the PhD of A. Baldé.</p>
        <p>A huge volume of data is produced by many applications. Data mining techniques are part of knowledge discovery methods whose aim is to discover knowledge in large databases without predetermined information about the application field which is well-known as KDD. But data mining is a
        complex process for an end-user and the main difficulties consist in the interpretation of the results. Metadata can help the interpretation process by providing additional information. Our objective is to facilitate the interpretation process and to point out that metadata can play a major
        role for this purpose. In spite of the visual representation of the results, the user should acquire a significant experience to be able to interpret the clusters. Data mining tools generally offer visualization modules which are not adapted to analysis. The original contributions of our
        work made in collaboration with Marie-Aude Aufaure (Supelec) concern new approaches to representing clustering's metadata and interpreting clustering's results by using metadata.</p>
        <p>First, we propose a metadata model that could be automatically exploited 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid26" location="biblio" xyref="1958661692013"/>. We also propose a tool in order to help the end-user to interpret the clusters obtained. This tool is based upon
        the architecture described in Figure 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid92" location="intern" xyref="1958661692013"/>.</p>
        <p>This architecture is composed by three layers: metadata model, metadata manager which manages metadata extraction and storage and manipulations performed on these metadata and user query layer using XQuery. In order to implement these queries, we use the Saxon processor. Saxon is a set
        of tools dedicated to XML documents processing: it has established a reputation for fast performance, the highest level of conformance to the W3C specifications. This method can be applied to a wide variety of data mining methods.</p>
        <object id="uid92">
          <table>
            <tr>
              <td>
                <ressource aux="image_5.png" xylemeAttach="5" media="WEB" xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="Images/2005-architecture" type="float" width="100mm" xyref="939389936002"/>
              </td>
            </tr>
          </table>
          <caption>metadata production architecture</caption>
        </object>
      </subsection>
      <subsection level="2" id="uid93">
        <bodyTitle>Viewpoint Managment for Annotating a KDD Process</bodyTitle>
        <participants category="None">
          <person key="axis-2005-id18357">
            <firstname>Hicham</firstname>
            <lastname>Behja</lastname>
          </person>
          <person key="axis-2005-id18078">
            <firstname>Brigitte</firstname>
            <lastname>Trousse</lastname>
          </person>
        </participants>
        <keyword>viewpoint</keyword>
        <keyword>complex data mining</keyword>
        <keyword>annotation</keyword>
        <keyword>metadata</keyword>
        <p>This work was performed in the context of the PhD of H. Behja (France-Morocco Cooperation - Software Engineering Network).</p>
        <p>Our goal is to make more explicit the notion of "viewpoint" from analysts during their activity and to propose a new approach to integrate the viewpoint notion in a multi-view Knowledge Discovery from Databases (KDD) analysis. We define a viewpoint in KDD as an analyst's perception of a
        KDD process, perception referring to its own knowledge 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid27" location="biblio" xyref="1958661692013"/>. Our purpose is to facilitate both reusability and adaptability of a KDD process, and to reduce his complexity
        whilst maintaining the trace of the past analysis viewpoints. The KDD process will be considered as a view generation and transformation process annotated by metadata to store the semantics of a KDD process.</p>
        <p>In 2004 we started with an analysis of the state of the art and identified three directions: 1) the use of the viewpoint notion in the Knowledge Engineering Community including object languages for knowledge representation, 2) modelling KDD process adopting a Semantic Web based approach
        and 3) the use of annotations of KDD processes. Then we designed and implemented an object oriented platform for KDD processes including the viewpoint notion (via design patterns and UML using Rational Rose). The current platform is based on the Weka library.</p>
        <p>In 2005 we proposed and implemented the knowledge conceptual model 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid28" location="biblio" xyref="1958661692013"/>integrating the viewpoint concept (cf. Figure 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid99" location="intern" xyref="1958661692013"/>). It is composed of four models structured in two types of knowledge:</p>
        <p>First, for the domain knowledge, the domain model that describes the analyzed domain knowledge in terms of objects, attributes, data, etc. and the analyst domain knowledge that will relate to the tasks carried out by the analyst; choice of methods, variables, etc. We propose a formal
        representation of the domain model as a datawarehouse that allows the business information to be viewed from many viewpoints. For our example of the HTTP log in Web Usage Mining (WUM), the used database design is the star schema.</p>
        <p>Second, for the strategic knowledge, we find:</p>
        <simplelist>
          <li id="uid94">
            <p>the task and method model which describes the KDD analyst domain knowledge. Here, the domain objects are methods, algorithms, parameters, etc. This model is a semi-formal generic ontology. For its construction we are mainly inspired from the DAMON system ontology for the data mining
            step, but we address all three KDD steps (preprocessing, data mining and postprocessing). This ontology is developed in Protégé-2000 system.</p>
          </li>
          <li id="uid95">
            <p>the viewpoint model which describes the viewpoint specification in terms of preferences related to the decision-making process in KDD (choice of the attributes, methods and systems, etc.). This viewpoint model, described by a RDF scheme, manipulates both the analyzed domain and the
            analyst domain:</p>
            <simplelist>
              <li id="uid96">
                <p>The viewpoint analyzed domain specifies the significant attributes for the expert from the analysed domain. This vision allows the analyst on the one hand to restrict the analyzed domain and on the other hand to guide the goal of the retrieval by defining a diagram on the raw
                data.</p>
              </li>
              <li id="uid97">
                <p>The viewpoint analyst domain allows to define a symbolic execution by choosing the methods and the algorithms for each KDD process step.</p>
              </li>
              <li id="uid98">
                <p>The viewpoint organizational model describes the organization of the viewpoints in terms of relations among them (in progress).</p>
              </li>
            </simplelist>
          </li>
        </simplelist>
        <object id="uid99">
          <table>
            <tr>
              <td>
                <ressource aux="image_6.png" xylemeAttach="6" media="WEB" xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="Images/2005-figureRAHicham" type="float" scale="0.7" xyref="173017940020"/>
              </td>
            </tr>
          </table>
          <caption>Conceptual model</caption>
        </object>
        <p>This work is accepted for publication in january 2006 in a special issue on ``Méthodes Avancées de Développement des SI'' of the french journal ISI (D. Rieu and G. Giraudin editors).</p>
      </subsection>
      <subsection level="2" id="uid100">
        <bodyTitle>Production and Display of a Critical Edition of Sanskrit documents</bodyTitle>
        <participants category="None">
          <person key="axis-2005-id18244">
            <firstname>Marc</firstname>
            <lastname>Csernel</lastname>
          </person>
          <person key="axis-2005-id18560">
            <firstname>Marina</firstname>
            <lastname>Dufresne</lastname>
          </person>
          <person key="axis-2005-id18098">
            <firstname>Yves</firstname>
            <lastname>Lechevallier</lastname>
          </person>
          <person key="PASUSERID">
            <firstname>Selma</firstname>
            <lastname>Khebache</lastname>
          </person>
        </participants>
        <keyword>Text comparison</keyword>
        <keyword>Sanskrit</keyword>
        <keyword>transliteration</keyword>
        <keyword>Critical Edition</keyword>
        <keyword>Unicode</keyword>
        <keyword>XML</keyword>
        <keyword>electronic display</keyword>
        <p>A critical edition is the edition of a well known text taking into account all possible versions of this text. Critical editions are particularly needed for texts issued from manuscripts where the variations can be very significant from one manuscript to the other.</p>
        <p noindent="true"><b>Production of critical edition of Sanskrit Text.</b>This is particularly important for the Indian subcontinent where at least one third of the manuscripts existing through the whole world are supposed to be found, the main part of them being written in Sanskrit. It was not an Indian
        tradition to deal with critical edition, so very few of them exist at present time. The idea is to provide a computer assisted construction of critical edition. Such tools exist for occidental languages, but, due to some Sanskrit specificities they could not suit our purpose:</p>
        <simplelist>
          <li id="uid101">
            <p>Sanskrit is written according to a transliterated alphabet.</p>
          </li>
          <li id="uid102">
            <p>Separation between words are mostly absent in a manuscript and their presence is not meaningful. The text is generally formed by a sequence of thousands of characters;</p>
          </li>
          <li id="uid103">
            <p>The writing of two words is different if there is a blank (or any separation) between them, or if they are following each other directly. This notion is called a sandhi.</p>
          </li>
        </simplelist>
        <p>In order to avoid the complexity problem induced by the thousands of characters sentences, and to be able to provide to the philologist the exact words where a difference occurs, we need either a lexicon, or a text where all the words appear separately. We will use the second solution
        and we call such a text a Padapatha according to a certain form of recitation used by the Sanskritist. Due to the sandhi, such a text is not readily comparable with the manuscript text. We must provide a pre-processing based on LEX to construct all the sandhi related to the padapatha in
        order to be able to provide a suitable comparison. For the comparison we use the Longest Common Subsequence (LCS) algorithm based on dynamic programming. The algorithm output will be used as input of the following project steps :</p>
        <simplelist>
          <li id="uid104">
            <p>Electronic display of critical edition of Sanskrit text</p>
          </li>
          <li id="uid105">
            <p>Cluster (cf. section 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid84" location="intern" xyref="1958661692013"/>) and Phylogenetic trees</p>
          </li>
        </simplelist>
        <p><b>Electronic display of critical edition of Sanskrit Text.</b>Traditionally critical editions are represented as particularly boring (for unfamiliar) books, where the text itself is very small, and where the notes are numerous and enormous. It's a philologist dream to see only the points
        they care about. An electronic form of critical edition could be a proper answer.</p>
        <p>But there are a lot of problems related to the Sanskrit we have to care about. Thanks to Unicode it is now possible to get some standard about the display of sandhi characters. But because of the ligature formation, two Sanskrit characters separated by a blank do not look similar as if
        they were put one after the other.</p>
        <p>Marina Dufresne during her internship (cf. section 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid300" location="intern" xyref="1958661692013"/>) developed a software tool what allows an interactive display of critical edition of Sankrit text starting from
        an XML text. This tool is not perfect but it has been greatly appreciated by the Sanskrit community. This work has bee done in collaboration with François Patte.</p>
      </subsection>
    </subsection>
    <subsection level="1" id="uid106">
      <bodyTitle>Data Mining Methods</bodyTitle>
      <keyword>symbolic data analysis</keyword>
      <keyword>unsupervised clustering</keyword>
      <keyword>Self Organizing Map</keyword>
      <keyword>complex data</keyword>
      <keyword>neural networks</keyword>
      <keyword>hierarchical clustering</keyword>
      <keyword>hierarchies</keyword>
      <subsection level="2" id="uid107">
        <bodyTitle>Self Organizing Maps on dissimilarity matrices</bodyTitle>
        <participants category="None">
          <person key="axis-2005-id18308">
            <firstname>Aicha</firstname>
            <lastname>El Golli</lastname>
          </person>
          <person key="axis-2005-id18098">
            <firstname>Yves</firstname>
            <lastname>Lechevallier</lastname>
          </person>
          <person key="axis-2005-id18259">
            <firstname>Fabrice</firstname>
            <lastname>Rossi</lastname>
          </person>
          <person key="axis-2005-id18621">
            <firstname>Nicomedes</firstname>
            <lastname>Lopes Calvacanti Junior</lastname>
          </person>
        </participants>
        <keyword>dissimilarity</keyword>
        <keyword>self organizing maps</keyword>
        <keyword>neural networks</keyword>
        <keyword>clustering</keyword>
        <keyword>visualization</keyword>
        <p>The standard Self Organizing Map (SOM) is restricted to vector data from 
        <span class="math" align="left"><hi rend="it">R</hi><sup><hi rend="it">n</hi></sup></span>. In our previous work 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid29" location="biblio" xyref="1958661692013"/>, 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid15" location="biblio" xyref="1958661692013"/>, we proposed an adapted version of the SOM, called the DSOM (for Dissimilarity SOM) that can be applied to any
        data for which a dissimilarity can be defined.</p>
        <p>In 2005, we improved DSOM by defining a new algorithm associated to an improved implementation. This implementation significantly reduces the execution time of the method without changing the results 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid30" location="biblio" xyref="1958661692013"/>. The new algorithm is based on a factorization technique applied to the computation of the criterion optimized by
        the method (the sum of weighted dissimilarities between a prototype candidate and the data to cluster). It is associated to an early stopping scheme and to some memorization techniques that leverage the iterative nature of the method.</p>
        <p>We have also applied the DSOM to usage-based web content clustering and visualization 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid31" location="biblio" xyref="1958661692013"/>, see section 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid122" location="intern" xyref="1958661692013"/>for details.</p>
      </subsection>
      <subsection level="2" id="uid108">
        <bodyTitle>Functional Data Analysis</bodyTitle>
        <participants category="None">
          <person key="axis-2005-id18259">
            <firstname>Fabrice</firstname>
            <lastname>Rossi</lastname>
          </person>
        </participants>
        <keyword>functional data</keyword>
        <keyword>neural networks</keyword>
        <keyword>curves classification</keyword>
        <keyword>support vector machines</keyword>
        <keyword>machine learning</keyword>
        <p>Functional Data Analysis is an extension of traditional data analysis to functional data. In this framework, each individual is described by one or several functions, rather than by a vector of 
        <span class="math" align="left"><hi rend="it">R</hi><sup><hi rend="it">n</hi></sup></span>. This approach allows to take into account the regularity of the observed functions.</p>
        <p>In 2005, we have extended our approach based on neural methods for functional data to the case of Support Vector Machines (SVMs) applied to function classification:</p>
        <simplelist>
          <li id="uid109">
            <p>in 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid32" location="biblio" xyref="1958661692013"/>, we have introduced functional kernels based on derivation operators and on B-spline smoothing. An
            application to spectrometric curves classification showed an improvement of these kernels over standard non functional kernels;</p>
          </li>
          <li id="uid110">
            <p>in 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid33" location="biblio" xyref="1958661692013"/>, we have studied the theoretical properties of a projection based functional kernel, in which functions are
            projected to a truncated Hilbert basis in a pre-processing step. The coordinates on this basis are handled by a standard SVM. We showed that this method, associated to a split sample procedure for the choice of the truncation level, is consistent (i.e., it can reach the Bayes error rate
            asymptotically). We also illustrated the method on several real world data set (speech recognition problems).</p>
          </li>
        </simplelist>
        <p>In 2005, our earlier work on functional multi-layer perceptrons has been published in international journals 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid34" location="biblio" xyref="1958661692013"/>, 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid35" location="biblio" xyref="1958661692013"/>, 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid36" location="biblio" xyref="1958661692013"/>.</p>
      </subsection>
      <subsection level="2" id="uid111">
        <bodyTitle>Partitioning Method: Adaptive Distances on Interval Data</bodyTitle>
        <participants category="None">
          <person key="PASUSERID">
            <firstname>F.A.T.</firstname>
            <lastname>de Carvalho</lastname>
          </person>
          <person key="axis-2005-id18098">
            <firstname>Yves</firstname>
            <lastname>Lechevallier</lastname>
          </person>
          <person key="PASUSERID">
            <firstname>Renata</firstname>
            <lastname>Souza</lastname>
          </person>
        </participants>
        <keyword>unsupervised clustering</keyword>
        <keyword>quantitative data</keyword>
        <keyword>dynamic clustering algorithm</keyword>
        <p>The main contribution 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid37" location="biblio" xyref="1958661692013"/>is the proposal of a new partitional dynamic clustering method for interval data based on the use of an adaptive
        Hausdorff distance at each iteration. The idea of dynamical clustering with adaptive distances is to associate a distance to each cluster, which is defined according to its intra-class structure. The advantage of this approach is that the clustering algorithm recognizes different shapes and
        sizes of clusters. Here the adaptive distance is a weighted sum of Hausdorff distances. Explicit formulas for the optimum class prototype, as well as for the weights of the adaptive distances, are found. When used for dynamic clustering of interval data, these prototypes and weights ensure
        that the clustering criterion decreases at each iteration.</p>
        <p>Let 
        <span class="math" align="left"><img width="13" height="13" align="bottom" border="0" src="../../images/img_Omega.png" alt="$ \Omega$"/></span>be a set of 
        <hi rend="italic">n</hi>objects indexed by 
        <hi rend="italic">i</hi>and described by 
        <hi rend="italic">p</hi>interval variables indexed by 
        <hi rend="italic">j</hi>. An 
        <i>interval variable</i>
        <hi rend="italic">X</hi>
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid13" location="biblio" xyref="1958661692013"/>is a correspondence defined from 
        <span class="math" align="left"><img width="13" height="13" align="bottom" border="0" src="../../images/img_Omega.png" alt="$ \Omega$"/></span>in 
        <span class="math" align="left"><img width="13" height="13" align="bottom" border="0" src="../../images/img_other_Re.png" alt="$ \Re$"/></span>such that for each 
        <span class="math" align="left"><hi rend="it">i</hi><img width="13" height="24" align="middle" border="0" src="../../images/img_other_in.png" alt="$ \in$"/><img width="13" height="13" align="bottom" border="0" src="../../images/img_Omega.png" alt="$ \Omega$"/>, 
        <hi rend="it">X</hi>(
        <hi rend="it">i</hi>) = [
        <hi rend="it">a</hi>, 
        <hi rend="it">b</hi>]
        <img width="13" height="24" align="middle" border="0" src="../../images/img_other_in.png" alt="$ \in$"/><img width="13" height="13" align="bottom" border="0" src="../../images/img_other_Im.png" alt="$ \Im$"/></span>, where 
        <span class="math" align="left"><img width="13" height="13" align="bottom" border="0" src="../../images/img_other_Im.png" alt="$ \Im$"/></span>is the set of closed intervals defined from 
        <span class="math" align="left"><img width="13" height="13" align="bottom" border="0" src="../../images/img_other_Re.png" alt="$ \Re$"/></span>, i.e., 
        <span class="math" align="left"><img width="13" height="13" align="bottom" border="0" src="../../images/img_other_Im.png" alt="$ \Im$"/>= {[
        <hi rend="it">a</hi>, 
        <hi rend="it">b</hi>]:
        <hi rend="it">a</hi>, 
        <hi rend="it">b</hi><img width="13" height="24" align="middle" border="0" src="../../images/img_other_in.png" alt="$ \in$"/><img width="13" height="13" align="bottom" border="0" src="../../images/img_other_Re.png" alt="$ \Re$"/>, 
        <hi rend="it">a</hi><img width="14" height="24" align="middle" border="0" src="../../images/img_other_le.png" alt="$ \le$"/><hi rend="it">b</hi>}</span>. Each object 
        <hi rend="italic">i</hi>is represented as a vector of intervals 
        <span class="math" align="left"><img align="middle" width="102" height="29" src="math_image_1.png" xylemeAttach="11" border="0" alt="Im1 ${x_i{=(}x_i^1,\#8943 ,x_i^p{)}}$"/></span>, where 
        <span class="math" align="left"><hi rend="it">x</hi><sub><hi rend="it">i</hi></sub><sup><hi rend="it">j</hi></sup>= [
        <hi rend="it">a</hi><sub><hi rend="it">i</hi></sub><sup><hi rend="it">j</hi></sup>, 
        <hi rend="it">b</hi><sub><hi rend="it">i</hi></sub><sup><hi rend="it">j</hi></sup>]
        <img width="13" height="24" align="middle" border="0" src="../../images/img_other_in.png" alt="$ \in$"/><img width="13" height="13" align="bottom" border="0" src="../../images/img_other_Im.png" alt="$ \Im$"/></span>.</p>
        <p>An interval data table 
        <span class="math" align="left">{
        <hi rend="it">x</hi>
        <sub><hi rend="it">i</hi></sub>
        <sup><hi rend="it">j</hi></sup>}
        <sub><hi rend="it">n</hi>×
        <hi rend="it">p</hi></sub></span>which is used by our clustering method is made up of 
        <hi rend="italic">n</hi>rows that represent 
        <hi rend="italic">n</hi>objects to be clustered and 
        <hi rend="italic">p</hi>columns that represent 
        <hi rend="italic">p</hi>interval variables. Each cell of this table contains an interval 
        <span class="math" align="left"><hi rend="it">x</hi><sub><hi rend="it">i</hi></sub><sup><hi rend="it">j</hi></sup>= [
        <hi rend="it">a</hi><sub><hi rend="it">i</hi></sub><sup><hi rend="it">j</hi></sup>, 
        <hi rend="it">b</hi><sub><hi rend="it">i</hi></sub><sup><hi rend="it">j</hi></sup>]
        <img width="13" height="24" align="middle" border="0" src="../../images/img_other_in.png" alt="$ \in$"/><img width="13" height="13" align="bottom" border="0" src="../../images/img_other_Im.png" alt="$ \Im$"/></span>. In our approach 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid37" location="biblio" xyref="1958661692013"/>a prototype 
        <span class="math" align="left"><hi rend="bold">y</hi><sub><hi rend="it">k</hi></sub></span>of cluster 
        <span class="math" align="left"><hi rend="it">C</hi><sub><hi rend="it">k</hi></sub><img width="13" height="24" align="middle" border="0" src="../../images/img_other_in.png" alt="$ \in$"/><hi rend="it">P</hi></span>is also represented as a vector of intervals 
        <span class="math" align="left"><img align="middle" width="103" height="29" src="math_image_2.png" xylemeAttach="12" border="0" alt="Im2 ${y_k{=(}y_k^1,\#8943 ,y_k^p{)}}$"/></span>, where 
        <span class="math" align="left"><hi rend="it">y</hi><sub><hi rend="it">k</hi></sub><sup><hi rend="it">j</hi></sup>= [
        <img width="12" height="12" align="bottom" border="0" src="../../images/img_alpha.png" alt="$ \alpha$"/><sub><hi rend="it">k</hi></sub><sup><hi rend="it">j</hi></sup>, 
        <img width="12" height="26" align="middle" border="0" src="../../images/img_beta.png" alt="$ \beta$"/><sub><hi rend="it">k</hi></sub><sup><hi rend="it">j</hi></sup>]
        <img width="13" height="24" align="middle" border="0" src="../../images/img_other_in.png" alt="$ \in$"/><img width="13" height="13" align="bottom" border="0" src="../../images/img_other_Im.png" alt="$ \Im$"/></span>.</p>
        <p>It is now a matter of choosing an adaptive distance between vectors of intervals and properly defining the representation step of the dynamic algorithm with adaptive distances given in the previous section. In other words, we will give an explicit formula for the prototype 
        <span class="math" align="left"><hi rend="bold">y</hi><sub><hi rend="it">k</hi></sub></span>and for the vector of weights 
        <span class="math" align="left"><img width="11" height="13" align="bottom" border="0" src="../../images/img_lambda.png" alt="$ \lambda$"/><sub><hi rend="it">k</hi></sub></span>that minimizes both the adequacy criterion 
        <span class="math" align="left"><img align="middle" width="153" height="33" src="math_image_3.png" xylemeAttach="13" border="0" alt="Im3 ${\#8721 _{j=1}^p\#955 _k^j\#8721 _{i\#8712 C_k}{d(}x_i^j,y_k^j{)}}$"/></span>.</p>
      </subsection>
      <subsection level="2" id="uid112">
        <bodyTitle>Agglomerative 2-3 Hierarchical Clustering: study and visualization</bodyTitle>
        <participants category="None">
          <person key="axis-2005-id18372">
            <firstname>Sergiu</firstname>
            <lastname>Chelcea</lastname>
          </person>
          <person key="axis-2005-id18293">
            <firstname>Mihai</firstname>
            <lastname>Jurca</lastname>
          </person>
          <person key="axis-2005-id18078">
            <firstname>Brigitte</firstname>
            <lastname>Trousse</lastname>
          </person>
        </participants>
        <keyword>2-3 AHC</keyword>
        <keyword>clustering</keyword>
        <keyword>aggregation index</keyword>
        <keyword>hierarchies</keyword>
        <p>This work was conducted in the context of the PhD of S. Chelcea.</p>
        <p>We have continued 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid38" location="biblio" xyref="1958661692013"/>this year our study of the Agglomerative 2-3 Hierarchical Clustering 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid39" location="biblio" xyref="1958661692013"/>, 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid40" location="biblio" xyref="1958661692013"/>as a part of Chelcea Sergiu's PhD thesis. A study of different aggregation indexes and cluster indexing measures
        combined with the 2-3 AHC algorithm execution has revealed a particular case of clusters merging, which can influence the resulting induced dissimilarity matrix. This case that we denoted 
        <i>blind merging</i>, is present when two clusters are merged whilst one of them is not maximal. Based on our previous theoretical study 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid41" location="biblio" xyref="1958661692013"/>, the next (intermediate) merging, will merge together two clusters possibly at a high indexing degree. This can
        be avoided by minimizing the final cluster's indexing degree when choosing the two merging clusters.</p>
        <p>A slightly modified version of a 2-3 AHC algorithm was proposed and implemented in order to avoid such situations. The interest of this new 2-3 algorithm variant is its resulting induced dissimilarity matrix which is ``better'' or equal to the classic ultrametric.</p>
        <p>We experimentally validated this new 2-3 AHC algorithm variant on different artificial datasets and we also integrated it into our 
        <span align="left" class="smallcap">Hierarchies Visualization Toolbox</span>
        <footnote id="uid113" anchored="yes" place="foot"><ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://axis.inria.fr" location="extern" xyref="2970334891012">http://axis.inria.fr/</ref></footnote>.</p>
        <p>This new 2-3 AHC algorithm variant was also applied and validated on other types of datasets: on Web Usage Data 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid38" location="biblio" xyref="1958661692013"/>, on Sanskrit XML documents 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid22" location="biblio" xyref="1958661692013"/>(see also Section 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid84" location="intern" xyref="1958661692013"/>) and on tourists itineraries 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid42" location="biblio" xyref="1958661692013"/>.</p>
      </subsection>
      <subsection level="2" id="uid114">
        <bodyTitle>Sequential Pattern Extraction in Data Streams</bodyTitle>
        <participants category="None">
          <person key="axis-2005-id18635">
            <firstname>Alice</firstname>
            <lastname>Marascu</lastname>
          </person>
          <person key="axis-2005-id18166">
            <firstname>Florent</firstname>
            <lastname>Masséglia</lastname>
          </person>
        </participants>
        <keyword>sequential pattern</keyword>
        <keyword>data stream</keyword>
        <keyword>sequence alignment</keyword>
        <p>This work was conducted in the context of the master of A. Marascu.</p>
        <p>In recent years, emerging applications introduced new constraints for data mining methods. These constraints are particularly linked to new kinds of data that can be considered as complex data. One typical kind of such data is known as 
        <i>data streams</i>. In a data stream processing, memory usage is restricted, new elements are generated continuously and have to be considered as fast as possible, no blocking operator can be performed and the data can be examined only once.</p>
        <p>At this time and to the best of our knowledge, no method has been proposed for mining sequential patterns in data streams. We argue that the main reason is the combinatory phenomenon related to sequential pattern mining. Actually, if itemset mining relies on a finite set of possible
        results (the set of combinations between items recorded in the data) this is not the case for sequential patterns where the set of results is infinite. In fact, due to the temporal aspect of sequential patterns, an item can be repeated without limitation leading to an infinite number of
        potential frequent sequences.</p>
        <p>The SMDS (Sequence Mining in Data Streams) method, proposed in 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid43" location="biblio" xyref="1958661692013"/>, 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid44" location="biblio" xyref="1958661692013"/>, is designed for extracting sequential patterns from a data stream. More precisely, our goal is to extract
        significant patterns that will be representative of Web usage streaming data. To this end, SMDS performs as follows:</p>
        <orderedlist>
          <li id="uid115">
            <p>cutting down the data stream into batches of fixed size. The following operations are then performed for each batch;</p>
          </li>
          <li id="uid116">
            <p>clustering the sequences of the batch;</p>
          </li>
          <li id="uid117">
            <p>for each cluster 
            <hi rend="italic">c</hi>, providing the alignment of the sequences embedded in 
            <hi rend="italic">c</hi>. The aligned sequence will be considered as a summary of 
            <hi rend="italic">c</hi>;</p>
          </li>
          <li id="uid118">
            <p>filtering the aligned sequence in order to keep 1) frequent items only and 2) aligned sequences obtained on clusters having size greater than 2 only;</p>
          </li>
          <li id="uid119">
            <p>maintaining a prefix tree structure that will keep the history of frequency for each extracted sequence (the operations on this structure may be 
            <span class="math" align="left"><hi rend="it">i</hi><hi rend="it">n</hi><hi rend="it">s</hi><hi rend="it">e</hi><hi rend="it">r</hi><hi rend="it">t</hi><hi rend="it">i</hi><hi rend="it">o</hi><hi rend="it">n</hi></span>, 
            <span class="math" align="left"><hi rend="it">u</hi><hi rend="it">p</hi><hi rend="it">d</hi><hi rend="it">a</hi><hi rend="it">t</hi><hi rend="it">e</hi></span>or 
            <span class="math" align="left"><hi rend="it">d</hi><hi rend="it">e</hi><hi rend="it">l</hi><hi rend="it">e</hi><hi rend="it">t</hi><hi rend="it">i</hi><hi rend="it">o</hi><hi rend="it">n</hi></span>).</p>
          </li>
        </orderedlist>
        <p>All those steps have to be performed as fast as possible in order to meet the constraints of a data stream environment. Approximation has been recognized as a key feature for this kind of applications, explaining our choice for an alignment method for extracting the summaries of
        clusters. The SMDS method is illustrated in figure 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid120" location="intern" xyref="1958661692013"/>. SMDS has been tested over both real and synthetic datasets. Experiments could show the efficiency of our
        approach and the relevance of the extracted patterns on the Web site of Inria Sophia Antipolis.</p>
        <object id="uid120">
          <table>
            <tr>
              <td>
                <ressource aux="image_7.png" xylemeAttach="7" media="WEB" xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="Images/2005-smds" type="float" width="100mm" xyref="1779399493000"/>
              </td>
            </tr>
          </table>
          <caption>The SMDS method</caption>
        </object>
      </subsection>
    </subsection>
    <subsection level="1" id="uid121">
      <bodyTitle>Web Usage Mining Methods</bodyTitle>
      <subsection level="2" id="uid122">
        <bodyTitle>Visualization</bodyTitle>
        <participants category="None">
          <person key="axis-2005-id18259">
            <firstname>Fabrice</firstname>
            <lastname>Rossi</lastname>
          </person>
          <person key="axis-2005-id18098">
            <firstname>Yves</firstname>
            <lastname>Lechevallier</lastname>
          </person>
          <person key="axis-2005-id18308">
            <firstname>Aicha</firstname>
            <lastname>El Golli</lastname>
          </person>
        </participants>
        <keyword>data visualization</keyword>
        <keyword>web usage mining</keyword>
        <keyword>graph visualization</keyword>
        <keyword>non linear projection</keyword>
        <keyword>dissimilarities</keyword>
        <keyword>self organizing map</keyword>
        <p>The analysis of the content of a web site based on usage data is an important task as it allows to obtain insight on the organization of the site and of its adequacy to user needs. The (dis)agreement between the prior structure of the site (in terms of hyperlinks) and the actual
        trajectories of the users is of particular interest. In many situations, users have to follow some complex paths in the site in order to reach the pages they are looking for, mainly because they are interested in topics that appeared unrelated to the creators of the site and thus remained
        unlinked. On the contrary, some hyperlinks are not used frequently, for instance because they link documents that are accessed by different user groups.</p>
        <p>In 2005 we have studied two general tools for visualizing the content of a site based on usage data:</p>
        <simplelist>
          <li id="uid123">
            <p>in 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid45" location="biblio" xyref="1958661692013"/>we have used the logical and hierarchical organization of the web site to simplify the representation of user
            trajectories. Simplified trajectories are used to calculate dissimilarities between URL groups defined thanks to the site hierarchy (groups are also called topics in section 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid125" location="intern" xyref="1958661692013"/>). The groups, which reflect the prior semantic structure of the site, are represented thanks to the minimum
            spanning tree induced by the dissimilarity matrix. This allows to explore the relationship between prior categories and user browsing patterns. The method was applied to the INRIA web site and gave satisfactory results;</p>
          </li>
          <li id="uid124">
            <p>in 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid31" location="biblio" xyref="1958661692013"/>we have applied the same general methodology for calculating dissimilarities between URL groups but we used an
            adapted version of the Self Organizing Map (SOM) to visualization clusters obtained via the dissimilarity matrix (see section 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid107" location="intern" xyref="1958661692013"/>for details on this version of the SOM).</p>
          </li>
        </simplelist>
      </subsection>
      <subsection level="2" id="uid125">
        <bodyTitle>InterSites Web Usage Mining: preprocessing methodology and crossed clustering</bodyTitle>
        <participants category="None">
          <person key="axis-2005-id18372">
            <firstname>Sergiu</firstname>
            <lastname>Chelcea</lastname>
          </person>
          <person key="axis-2005-id18387">
            <firstname>Alzennyr</firstname>
            <lastname>Da Silva</lastname>
          </person>
          <person key="axis-2005-id18098">
            <firstname>Yves</firstname>
            <lastname>Lechevallier</lastname>
          </person>
          <person key="axis-2005-id18416">
            <firstname>Doru</firstname>
            <lastname>Tanasa</lastname>
          </person>
          <person key="axis-2005-id18078">
            <firstname>Brigitte</firstname>
            <lastname>Trousse</lastname>
          </person>
          <person key="axis-2005-id18481">
            <firstname>Rosanna</firstname>
            <lastname>Verde</lastname>
          </person>
        </participants>
        <keyword>Web Usage Mining</keyword>
        <keyword>Complex data</keyword>
        <keyword>Preprocessing</keyword>
        <keyword>Crossed-clustering</keyword>
        <p>In the context of the ECML/PKDD 2005 Discovery Challenge, we improved 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid46" location="biblio" xyref="1958661692013"/>, 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid47" location="biblio" xyref="1958661692013"/>our preprocessing methodology for intersites Web Usage Mining 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid48" location="biblio" xyref="1958661692013"/>. A clickstream dataset was proposed in the Discovery Challenge this year for the first time. The dataset
        consisted in requests for page views on seven different e-commerce Web sites from the Czech Republic. A request contained a PHP SessionID automatically generated for each new user visit on each server (unique IDs).</p>
        <p>Based on Tanasa's preprocessing methodology 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid48" location="biblio" xyref="1958661692013"/>, we defined a new methodology to preprocess the provided datasets and to store it in a data warehouse. Since a
        user changing shops can have (during a single visit) multiple SessionIDs, one on each shop, we regrouped these PHP SessionIDs into intersite users visits. More precisely we regrouped SessionIDs belonging to a single user (same IP) into a 
        <i>Group of SessionIDs</i>, corresponding to the user's actual (intersite) visit. This was done by comparing the Referrer with the previously accessed URLs (in a reasonable time window), each time the user moves to another shop. We thus reduced by 23.88% the number of user visits.</p>
        <p>To analyze the traffic load in the seven shop sites, we grouped the requests in terms of 
        <i>Time Periods</i>(slices of date and hour). We cross-clustered these time periods against the visited products using a generalized dynamic algorithm 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid49" location="biblio" xyref="1958661692013"/>.</p>
        <p>The result consisted in the confusion table containing classes of periods and products (see Figure 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid126" location="intern" xyref="1958661692013"/>).</p>
        <object id="uid126">
          <table>
            <tr>
              <td>
                <ressource aux="image_8.png" xylemeAttach="8" media="WEB" xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="Images/2005-tab_confusion" type="float" scale="0.3" xyref="4292653802002"/>
              </td>
            </tr>
          </table>
          <caption>Confusion table for 7 classes of periods and 5 classes of products</caption>
        </object>
        <p>Such analyses allow us to identify best hours for marketing strategies, like fast promotions, online advices and publish banners, etc. Others analyses could be planned in the future, exploiting for example the link between the consumer activities and the time periods by shop or focusing
        on multi-shop user visits, etc.</p>
        <p>In fact we apply a previous work published in 2003: indeed we proposed in 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid49" location="biblio" xyref="1958661692013"/>a crossed clustering algorithm in order to partition a set of objects in a predefined number of classes and to
        determine, in the same time, a structure (taxonomy) on the categories of the object descriptors. This procedure is a simultaneous clustering algorithm on contingency tables. The convergence of the algorithm is guaranteed at the best partitions of the objects in 
        <hi rend="italic">r</hi>classes and of the categories of the descriptors in 
        <hi rend="italic">c</hi>groups, respectively. This algorithm extended the dynamical algorithms hereafter proposed in the context of the Web Usage Mining. In particular, we had already performed it on the Web Logs Data, coming from the HTTP log files of INRIA web server 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid50" location="biblio" xyref="1958661692013"/>.</p>
      </subsection>
      <subsection level="2" id="uid127">
        <bodyTitle>Extracting Dense Periods of Sequential Patterns</bodyTitle>
        <participants category="None">
          <person key="axis-2005-id18166">
            <firstname>Florent</firstname>
            <lastname>Masséglia</lastname>
          </person>
        </participants>
        <keyword>sequential patterns</keyword>
        <keyword>web usage mining</keyword>
        <keyword>period</keyword>
        <p>This work has been done in collaboration with the LGI2P and the LIRMM (see 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid175" location="intern" xyref="1958661692013"/>) and has been published in 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid51" location="biblio" xyref="1958661692013"/>. Existing Web Usage Mining techniques are currently based on an arbitrary division of the data (
        <i>e.g.</i>``one log per month'') or guided by presumed results (
        <i>e.g</i>``what is the customers behaviour for the period of Christmas purchases?''). Those approaches have two main drawbacks. First, they depend on this arbitrary organization of the data. Second, they cannot automatically extract ``seasons peaks'' among the stored data.</p>
        <p>The work presented in this section performs a specific data mining process (and particularly to extract frequent behaviours) in order to automatically discover the densest periods. Our method extracts, among the whole set of possible combinations, the frequent sequential patterns related
        to the extracted periods. A period will be considered as dense if it contains at least one frequent sequential pattern for the set of users connected to the Web site in that period.</p>
        <p>Our method is based on:</p>
        <orderedlist>
          <li id="uid128">
            <p>a new representation of the Web log file designed to retrieve the ``login'' and ``logout'' information associated to each user.</p>
          </li>
          <li id="uid129">
            <p>a rewriting of the log in order to build periods based on the information of step 1. A period will begin at the arrival of a new user or end at the departure of a ``connected'' user.</p>
          </li>
          <li id="uid130">
            <p>a heuristic designed for extracting approximate frequent sequences from each period built at step 2.</p>
          </li>
        </orderedlist>
        <p>The third step is based on 
        <span align="left" class="smallcap">Perio</span>, the heuristic we have developed for that purpose and it is widely inspired from genetic algorithms.</p>
      </subsection>
    </subsection>
    <subsection level="1" id="uid131">
      <bodyTitle>XML Document Mining and XML Search</bodyTitle>
      <subsection level="2" id="uid132">
        <bodyTitle>Structure and Content Mining</bodyTitle>
        <participants category="None">
          <person key="axis-2005-id18152">
            <firstname>Thierry</firstname>
            <lastname>Despeyroux</lastname>
          </person>
          <person key="axis-2005-id18650">
            <firstname>Mounir</firstname>
            <lastname>Fegas</lastname>
          </person>
          <person key="axis-2005-id18591">
            <firstname>Saba</firstname>
            <lastname>Gul</lastname>
          </person>
          <person key="axis-2005-id18098">
            <firstname>Yves</firstname>
            <lastname>Lechevallier</lastname>
          </person>
          <person key="axis-2005-id18210">
            <firstname>Anne-Marie</firstname>
            <lastname>Vercoustre</lastname>
          </person>
        </participants>
        <keyword>Document mining</keyword>
        <keyword>XML clustering</keyword>
        <keyword>XML classification</keyword>
        <p>XML documents are becoming ubiquitous because of their rich and flexible format that can be used for a variety of applications. Standard methods have been used to classify XML documents, reducing them to their textual parts. These approaches do not take advantage of the structure of XML
        documents that also carries important information.</p>
        <p>Last year we studied the impact of selecting different parts (sub-structures) of XML documents for specific clustering tasks. Our approach integrated techniques for extracting representative words from documents elements with unsupervised classification of documents. We illustrated and
        evaluated this approach with the collection of XML activity reports written by Inria research teams for year 2003. The objective was to cluster projects into larger groups (Themes), based on the keywords or different chapters of these activity reports. We then compared the results of
        clustering using different feature selections, with the official theme structure used by Inria between 1985 and 2003, and with the new one proposed officially in 2004. The results (published this year) show that the quality of clustering strongly depends on the selected document features 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid24" location="biblio" xyref="1958661692013"/>, 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid25" location="biblio" xyref="1958661692013"/>.</p>
        <p>This year we developed a new representation model for clustering XML documents. The standard vector model for classification or clustering of documents represents documents by weighted vectors of words contained in the documents. This model takes into account only the textual content of
        documents. With XML documents, we want a representation that takes into account either the structure of the documents or both the structure and the content. Since XML documents can be seen as trees, we represent documents by the set of their (node) paths of length L, 
        <hi rend="italic">n</hi>
        <span class="math" align="left">&lt; =</span>L 
        <span class="math" align="left">&lt; =</span>
        <hi rend="italic">m</hi>, n and m being two given values. Paths can be contrained to be root-beginning paths, or leaf-ending paths. For dealing with both the structure and the content, we define 
        <i>text paths</i>that extend the node paths with the word contained in the subtree of their final node. Then by regarding paths as words, we can cluster documents by applying standards clustering methods based on the vector model. There is one difficulty, though, since the vector model is
        based on the independance between the dimensions of the vectors. In our case, when two paths are embedded in each other they are obviously not independant. To deal with this problem of dependency, we partition the paths by their length and treat each set of paths as a different modality in
        the clustering algorithm.</p>
        <p>We evaluate our approach using four standard metrics, namely the F-measure, the Corrected-Rand, the entropy and the purity. That for a given clustering task, we compare the resulting clusters with a priori known classes. We made several experiments using the INEX IEEE collections and
        INRIA activity reports 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid52" location="biblio" xyref="1958661692013"/>. The results that will be published in the EGC 2006 conference show that our approach works both for
        structure-based clustering and Structure-and-content clustering. However, using leaf-ending paths may result in damaging the clustering time, as the number of paths increases dramatically. We need to find good ways to reduce the number of paths, especially for text paths.</p>
        <p>We also started to apply this approach to the collections proposed by the INEX XML Document Mining tracks 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid53" location="biblio" xyref="1958661692013"/>.</p>
      </subsection>
      <subsection level="2" id="uid133">
        <bodyTitle>Sequential Pattern Mining for Structure-based XML Document Classification</bodyTitle>
        <participants category="None">
          <person key="axis-2005-id18576">
            <firstname>Calin</firstname>
            <lastname>Garboni</lastname>
          </person>
          <person key="axis-2005-id18166">
            <firstname>Florent</firstname>
            <lastname>Masséglia</lastname>
          </person>
          <person key="axis-2005-id18078">
            <firstname>Brigitte</firstname>
            <lastname>Trousse</lastname>
          </person>
        </participants>
        <keyword>sequential pattern</keyword>
        <keyword>structure mining</keyword>
        <keyword>XML document</keyword>
        <keyword>classification</keyword>
        <p>The goal of this work is to provide a classification (``classification supervisée'' in french) over a collection of XML documents. For this purpose we consider that we are provided with a set of clusters coming from a previous clustering on an past collection. More formally: let us
        consider 
        <span class="math" align="left"><hi rend="it">S</hi><sub>1</sub></span>a first collection of XML documents and 
        <span class="math" align="left"><hi rend="it">C</hi>= {
        <hi rend="it">c</hi><sub>1</sub>, 
        <hi rend="it">c</hi><sub>2</sub>, ...
        <hi rend="it">c</hi><sub><hi rend="it">n</hi></sub>}</span>the set of clusters defined for the documents of 
        <span class="math" align="left"><hi rend="it">S</hi><sub>1</sub></span>. Let us now consider 
        <span class="math" align="left"><hi rend="it">S</hi><sub>2</sub></span>a new collection of XML documents. Our goal is to provide a classification on 
        <span class="math" align="left"><hi rend="it">S</hi><sub>2</sub></span>by taking into account the distribution of documents in 
        <hi rend="italic">C</hi>.</p>
        <object id="uid134">
          <table>
            <tr>
              <td>
                <ressource aux="image_9.png" xylemeAttach="9" media="WEB" xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="Images/2005-overviewCG" type="float" width="110mm" xyref="2169622809028"/>
              </td>
            </tr>
          </table>
          <caption>Overview of our structure-based classification method</caption>
        </object>
        <p>To this end, our method will perform as illustrated in figure 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid134" location="intern" xyref="1958661692013"/>. It is based on the following three steps:</p>
        <orderedlist>
          <li id="uid135">
            <p>Pre-processing: first of all, we extract the frequent tags embedded in the collection. This step corresponds to step ``1'' in figure 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid134" location="intern" xyref="1958661692013"/>. The main idea is to remove irrelevant tags for clustering operations. A tag which is very frequent in the
            whole collection may be considered as irrelevant since it will not help in separating a document from another (the tag is not discriminative).</p>
          </li>
          <li id="uid136">
            <p>Characterising existing clusters: then we perform a data mining step on each cluster from the previous collection (namely ``
            <hi rend="italic">C</hi>'' in the foreword of this section). This step corresponds to step ``2'' in figure 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid134" location="intern" xyref="1958661692013"/>. For each cluster, the goal is to transform each XML document into a sequence. Furthermore, during the
            mapping operation, the frequent tags extracted from step 1 are removed. Then on each set of sequences corresponding to the original clusters, we perform a data mining step intended to extract the sequential patterns. For each cluster 
            <span class="math" align="left"><hi rend="it">C</hi><sub><hi rend="it">i</hi></sub></span>we are thus provided with 
            <span class="math" align="left"><hi rend="it">S</hi><hi rend="it">P</hi><sub><hi rend="it">i</hi></sub></span>the set of frequent sequences that characterizes 
            <span class="math" align="left"><hi rend="it">C</hi><sub><hi rend="it">i</hi></sub></span>.</p>
          </li>
          <li id="uid137">
            <p>XML Document matching: finally the key step of our method relies on a matching between each document of the collection and the sequences extracted from the second step. This last step corresponds to step 3 in figure 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid134" location="intern" xyref="1958661692013"/>.</p>
          </li>
        </orderedlist>
        <p>The matching techniques developed in this work are described in 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid54" location="biblio" xyref="1958661692013"/>.</p>
      </subsection>
      <subsection level="2" id="uid138">
        <bodyTitle>Relevance in XML search</bodyTitle>
        <participants category="None">
          <person key="axis-2005-id18210">
            <firstname>Anne-Marie</firstname>
            <lastname>Vercoustre</lastname>
          </person>
        </participants>
        <keyword>XML Search</keyword>
        <keyword>User Relevance</keyword>
        <p>When searching information from structured documents collections such as XML collections, it is expected that the use of the structure will help in two ways:</p>
        <simplelist>
          <li id="uid139">
            <p>specifying more precise queries</p>
          </li>
          <li id="uid140">
            <p>identifying specific and relevant parts of documents instead of full documents.</p>
          </li>
        </simplelist>
        <p>In the context of INEX (an International Initiative for the Evaluation of XML search), we are interested in evaluating what granularity of elements the users find relevant. We first analysed the relevance assessments to identify the types of highly relevant elements and identified three
        retrieval scenarios: 
        <i>Original</i>, 
        <i>general</i>and 
        <i>specific</i>and compare the performance of three different systems - a native XML database, a full text retrieval engine and a hybrid system -, for those different scenarios 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid55" location="biblio" xyref="1958661692013"/>. We then developed a novel retrieval heuristics that dynamically determines the preferable units of retrieval
        called 
        <i>Coherent retrieval Element</i>
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid56" location="biblio" xyref="1958661692013"/>.</p>
        <p>In 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid57" location="biblio" xyref="1958661692013"/>, we analyse and compare the assessors'judgement on the relevance of returned document components with the users'
        behaviour when interacting with components of XML documents. By analysing the level of agreement between the assessor and the users, we show that the highest level of agreement is on highly relevant and on non-relevant document components, suggesting that only the end points of the INEX
        10-point relevance scale are perceived in the same way by both the assessor and the users.</p>
      </subsection>
    </subsection>
  </resultats>
  <contrats id="uid141">
    <bodyTitle>Contracts and Grants with Industry</bodyTitle>
    <subsection level="1" id="uid142">
      <bodyTitle>Industrial Contracts</bodyTitle>
      <subsection level="2" id="uid143">
        <bodyTitle>EPIA: a RNTL Project (2003-2005)</bodyTitle>
        <participants category="None">
          <person key="axis-2005-id18308">
            <firstname>Aicha</firstname>
            <lastname>El Golli</lastname>
          </person>
          <person key="axis-2005-id18293">
            <firstname>Mihai</firstname>
            <lastname>Jurca</lastname>
          </person>
          <person key="axis-2005-id18098">
            <firstname>Yves</firstname>
            <lastname>Lechevallier</lastname>
          </person>
          <person key="axis-2005-id18195">
            <firstname>Bernard</firstname>
            <lastname>Senach</lastname>
          </person>
          <person key="axis-2005-id18416">
            <firstname>Doru</firstname>
            <lastname>Tanasa</lastname>
          </person>
          <person key="axis-2005-id18078">
            <firstname>Brigitte</firstname>
            <lastname>Trousse</lastname>
            <moreinfo>resp</moreinfo>
          </person>
        </participants>
        <p>Inria Contract Reference: S04 AO485 00 SOPML00 1</p>
        <p>The EPIA project ``Evolution of an Adaptive Information Portal'' got labeled by RNTL 2002, and started on September 2003 until march 2006. Partners are Dalkia, Mediapps and Inria. This year, as Mediapps was bought by Ever (
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.ever-team.com/es/GetRecords?Template=ET/ET_HomePage" location="extern" xyref="1114963808009">
        http://www.ever-team.com/es/GetRecords?Template=ET/ET_HomePage</ref>expert in integrated ECM
        <footnote id="uid144" anchored="yes" place="foot">ECM: Enterprise Content Management</footnote>software), a change of project management was done in June 2005. The objectives of this project are the following:</p>
        <simplelist>
          <li id="uid145">
            <p>Supporting users of Mediapps.Net (tool for selecting canal information of an extranet) via clustering clients. This task started in 2004 and some generic algorithms and pre-processing tools were developed until the beginning of 2005. Some log analysis haven't been done because of the
            unavailability of real data.</p>
          </li>
          <li id="uid146">
            <p>After understanding the user needs for Net.Portal (construction tool for intranet portals), we finished the specification of the trace of the NetPortal engine (cf. the first version of the deliverable D3: ``Experimental context and trace engine in Net.Portal''.). The result of
            this work is the description of the Net.Portal relational database schema and the data organization. The specification of the Net.CanalRecommender was stopped and studied in the new context of the eversuite context.</p>
          </li>
        </simplelist>
        <p>We hold two project meetings in Paris with Ever (june and september) in order to re-orient the project according to Everteam wishes, taking into account the future integration of Mediapps.net and Net.portal in the eversuite software.</p>
      </subsection>
      <subsection level="2" id="uid147">
        <bodyTitle>MobiVIP: a PREDIT Project (2004-2006)</bodyTitle>
        <participants category="None">
          <person key="axis-2005-id18372">
            <firstname>Sergiu</firstname>
            <lastname>Chelcea</lastname>
          </person>
          <person key="axis-2005-id18293">
            <firstname>Mihai</firstname>
            <lastname>Jurca</lastname>
          </person>
          <person key="axis-2005-id18195">
            <firstname>Bernard</firstname>
            <lastname>Senach</lastname>
          </person>
          <person key="axis-2005-id18078">
            <firstname>Brigitte</firstname>
            <lastname>Trousse</lastname>
            <moreinfo>resp.</moreinfo>
          </person>
        </participants>
        <p>Inria Contract Reference: 2 03 A2005 00 00MP5 01 1</p>
        <p>MobiVIP, Individual Public Vehicles for Mobility in town centres, is a research project of Predit 3 (Integration of the Communication and Information systems Group). It involves five research laboratories and seven small business companies (SME), in order to experiment, show and evaluate
        the impact of the NTIC on a new service for mobility in town centres. This service is made up of small urban vehicles completing existing public transport. The MobiVIP project will develop key technological bricks for the integrated deployment of mobility services in urban environment.</p>
        <p>The strengths of the project are: 1) the integration between assisted and automatic control, telecommunications, transport modeling, evaluation of service and 2) the demonstrations on 5 complementary experimental sites and 3) the evaluation of possible technology transfer.</p>
        <p>URL: 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-sop.inria.fr/mobivip/" location="extern" xyref="848287942010">http://www-sop.inria.fr/mobivip/</ref></p>
        <p>In december 2004, we finalized in collaboration with B. Senach (Ergomatics Consultants) the delivrable 5.1 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid58" location="biblio" xyref="1958661692013"/>which we coordonate with Georges Gallais (Visa Action, Inria Sophia Antipolis). This deliverable aimed at defining
        a common generic evaluation scenario and proposed a framework to facilitate the identification of the main evaluation dimensions for each planned test or experimentation. This year we had two main tasks: the preparation of the deliverable 5.2 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid59" location="biblio" xyref="1958661692013"/>and the NancyCab event.</p>
        <simplelist>
          <li id="uid148">
            <p>The delivrable 5.2 addresses the definition of the main criteria of service quality from the user point of view: this evaluation takes into account the improvment of information access, information content, mobility and man-machine interaction.</p>
          </li>
          <li id="uid149">
            <p>We work on the preparation of the intermediate project evaluation at the NancyCab 2005 (17-18 juin, Stanislas Place, Nancy): participation at a preliminary meeting (18 may), preparation of a demo of our recommender systems published in 2004 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid60" location="biblio" xyref="1958661692013"/>, 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid61" location="biblio" xyref="1958661692013"/>, a poster and also a presentation on ``Scénario générique d'évaluation'' for the evaluation workshop. Indeed
            this intermediate evaluation review has given different articles in various medias (Le Figaro journal 19 june, TV5.org le 20 juin etc.).</p>
          </li>
        </simplelist>
        <p>More we continued our previous work 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid60" location="biblio" xyref="1958661692013"/>, 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid61" location="biblio" xyref="1958661692013"/>in the travel information retrieval research field related to mobility in the transport domain. This year we
        welcomed one internship on this project:</p>
        <simplelist>
          <li id="uid150">
            <p>R. Busseuil who proposed in 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid42" location="biblio" xyref="1958661692013"/>a new distance for clustering user itineraries (cf. section 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid85" location="intern" xyref="1958661692013"/>) and developed an interface for our researches related to urban iteneraries clustering based of Benomad
            software (cf. Figure 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid151" location="intern" xyref="1958661692013"/>).</p>
          </li>
        </simplelist>
        <object id="uid151">
          <table>
            <tr>
              <td>
                <ressource aux="image_10.png" xylemeAttach="10" media="WEB" xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="Images/2005-create_traject" type="float" width="120mm" xyref="878272205004"/>
              </td>
            </tr>
          </table>
          <caption>Interface of the urban transport support tool</caption>
        </object>
      </subsection>
      <subsection level="2" id="uid152">
        <bodyTitle>Industrial Contacts</bodyTitle>
        <p>Some contacts during this year:</p>
        <simplelist>
          <li id="uid153">
            <p>SAP, Sophia Antipolis related to data mining and data streams (security and environnement problems). Contact: B. Trousse and F. Masséglia</p>
          </li>
          <li id="uid154">
            <p>Mondeca and Antidot (leadership), in the context of a proposal to RNRT call for proposals. Our proposal called EIFFEL related to semantic web and e-Tourism was accepted. Academic partners are: LIRMM and University of Paris X (Nanterre). Contact: Y. Lechevallier.</p>
          </li>
        </simplelist>
      </subsection>
    </subsection>
  </contrats>
  <international id="uid155">
    <bodyTitle>Other Grants and Activities</bodyTitle>
    <subsection level="1" id="uid156">
      <bodyTitle>Regional Initiatives</bodyTitle>
      <p>Due to the bi-localization of the team, we are involved into two regions: PACA and Ile-de-France.</p>
      <subsection level="2" id="uid157">
        <bodyTitle>Color Action: ``e-Mimetic''</bodyTitle>
        <p>Our partners are: LePont laboratory (E. Boutin) of the University South Toulon and the IHMH team of LIRMM (M. Nanard, J. Nanard, J-Y. Delors), related to defining and evaluating new Web pages ranking criteria based on page presentation. The web server of this action is 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://axis.inria.fr/e-mimetic/" location="extern" xyref="827858677020">e-mimetic</ref>.</p>
        <p>During this action, we have two internships: Sofiane Sellah 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid62" location="biblio" xyref="1958661692013"/>located at Inria Sophia Antipolis on the use of generalized URLs for extracting sequential patterns according to
        different point of views (content or user access) and Patrick Chastellan, located at LIRMM (Montpellier) on the extraction of page presentation criteria.</p>
      </subsection>
      <subsection level="2" id="uid158">
        <bodyTitle>``Pôle de compétitivité SCS ``Solutions Communicantes Sécurisées''</bodyTitle>
        <p>AxIS (B. Senach and B. Trousse) is participating in the preparation of the ROSCOE project related to intelligent transport systems with different partners such: Hitachi Europe (leader), Vu Log, Nexo, Inria (Mascotte), CNRT Télius, etc.</p>
      </subsection>
      <subsection level="2" id="uid159">
        <bodyTitle>Other initiatives</bodyTitle>
        <simplelist>
          <li id="uid160">
            <p>Inria VISA Action: collaboration with G. Gallais and P. Rives (VISTA team, Inria Sophia Antipolis), M. Riveill (Rainbow team, I3S UNSA) on the topic ``adaptation and evaluation of services in the context of transports'' via the MobiVIP project, involving 22 partners (January 2004,
            December 2006).</p>
          </li>
          <li id="uid161">
            <p>Inria Rocquencourt: Gérard Huet for his expertise in Sanskrit.</p>
          </li>
          <li id="uid162">
            <p>Laboratoire des Usages, CNRT Télius, 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.telius.org/" location="extern" xyref="856974008026">http://www.telius.org</ref>Sophia Antipolis. B. Trousse is a member of the scientific
            committee and a substitute member of the management committee. B. SEnach participated to the meeting related to: ``Restitution de l'enquéte - Recherche SHS et Société de l'Information en région Provence-Alpes-Cote d'azur'', Marseille (november).</p>
          </li>
          <li id="uid163">
            <p>Supelec: research collaboration with Marie-Aude Aufaure in the context of Baldé's PhD thesis 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid26" location="biblio" xyref="1958661692013"/>.</p>
          </li>
        </simplelist>
      </subsection>
    </subsection>
    <subsection level="1" id="uid164">
      <bodyTitle>National Initiatives</bodyTitle>
      <p>AxIS is involved in several national working groups.</p>
      <subsection level="2" id="uid165">
        <bodyTitle>CNRS RTP 12: ``information et connaissance: découvrir et résumer''</bodyTitle>
        <p>In the context of the pluri-disciplinary thematic 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://rtp12.loria.fr/" location="extern" xyref="2512449951008">http://rtp12.loria.fr</ref>, we participated to the CNRS Specific Action (AS 120) ``Disco
        Challenge'' animated by J.F. Boulicaut and B. Crémilleux. We made a presentation to the Discovery challenge proposed at PKDD/ECML 05 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid46" location="biblio" xyref="1958661692013"/>.</p>
      </subsection>
      <subsection level="2" id="uid166">
        <bodyTitle>CNRS Action Concertée Incitative : ``Histoire des savoirs''</bodyTitle>
        <p>This initiative (ACI RNR TTT Grammaire et math matique dans le monde indien 17/01/03 - 17/01/06) associates several French research teams from various research fields, such as computer science, data analysis, and Sanskrit literature. The main goal of this action is to provide help for
        the construction of critical edition of Indian manuscripts in Sanskrit, and to provide pertinent information about the manuscripts classification (construction of cladistic trees). The expected tools will not be restricted to Sanskrit language. This action is completed according some
        different aspects by the European AAT project which allows us to collect more Sankrit manuscripts and to care about some interactive aspect that we where not able to take into account with the ACI dotation. The action will end in december 2006.</p>
      </subsection>
      <subsection level="2" id="uid167">
        <bodyTitle>EGC National Group on Mining Complex Data</bodyTitle>
        <p>URL: 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://eric.univ-lyon2.fr/projets.php" location="extern" xyref="2345245307026">http://eric.univ-lyon2.fr/projets.php</ref></p>
        <p>AxIS members participated actively this year to the Working Group ``Fouille de données complexes'' created by D.A Zighed in June 2003 in the context of the EGC association:</p>
        <simplelist>
          <li id="uid168">
            <p>F. Masséglia with P. Gancarski (LSIIT, Strasbourg) co-organised and co-chaired the second workshop ``Fouille de données complexes dans un processus d'extraction de connaissances'' (January 18, 2005) 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid63" location="biblio" xyref="1958661692013"/>. Y. Lechevallier and B. Trousse were members of the program committee.</p>
          </li>
          <li id="uid169">
            <p>F. Masséglia, B. Trousse participated to the meeting of the two national working groups of the national group on mining complex data in relation with the working group 3.4 ``Data Mining'' of the GDR I3 (May, Paris). F. Masséglia with O. Boussaïd co-animated one of
            these two working groups: ``organisation and structuration of complex data''.</p>
          </li>
          <li id="uid170">
            <p>H. Behja, F. Masséglia and B. Trousse participated in the main meeting of the working group held in Lyon (ERIC) on September 9, 2005. H. Behja made a presentation of his PhD thesis ``Vers une approche Web sémantique pour le processus ECD''.</p>
          </li>
        </simplelist>
      </subsection>
      <subsection level="2" id="uid171">
        <bodyTitle>GDR-I3</bodyTitle>
        <p>AxIS participated to three working groups of the 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://sis.univ-tln.fr/gdri3/" location="extern" xyref="2495655999011">GDR-PRC~I3</ref>National Research Group ``Information - Interaction - Intelligence'' of
        CNRS:</p>
        <simplelist>
          <li id="uid172">
            <p>Working Group 3.4 (GT) on Data Mining animated by P. Poncelet and J.M. Petit. H. Behja, F. Masséglia and B. Trousse participated to the Paris meeting (May) in collaboration with the working group FDC. F. Masséglia and A. Baldé participated to the second meeting at Lyon
            (November 21). A. Baldé made a presentation of his PhD thesis ``Utilisation de métadonnées pour l'aide à l'interprétation de classes et de partitions''.</p>
          </li>
          <li id="uid173">
            <p><span align="left" class="smallcap">Gracq</span>(
            <i>Groupe de Recherche en Acquisition des Connaissances</i>) (
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.irit.fr/GRACQ" location="extern" xyref="3498372435003">GRACQ</ref>): B. Trousse.</p>
          </li>
          <li id="uid174">
            <p>Working Group 3.1 ``Sécurité des Systèmes d'Information'' animated by D. Boulanger and A. Gabillon: F. Masséglia and B. Trousse.</p>
          </li>
        </simplelist>
      </subsection>
      <subsection level="2" id="uid175">
        <bodyTitle>Other Collaborations</bodyTitle>
        <simplelist>
          <li id="uid176">
            <p>LIRMM (Montpellier) and Ecole des mines d'Alès (LGI2P): F. Masséglia with M. Tesseire (LIRMM) and P. Poncelet (LGI2P) proposed 1) a survey related to sequential pattern mining method and issues 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid64" location="biblio" xyref="1958661692013"/>2) a method dedicated to the management of time constraints in the generalized sequential pattern extraction
            process 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid65" location="biblio" xyref="1958661692013"/>and 3) a distributed algorithm for mining users behaviours on a P2P network (a paper about this work has been
            accepted for the 6th French conference on knowledge extraction and management (EGC'06)).</p>
          </li>
          <li id="uid177">
            <p>ENST: Y. Lechevallier collaborated with Georges Hébrail (ENST).</p>
          </li>
          <li id="uid178">
            <p>Two ARC proposals: 1) ARC SéSur: ``Sécurité et Surveillance dans les data streams'' (resp: F. Masséglia) with M.O Cordier (DREAM, IRISA) P. Poncelet (LGI2P, Alès) and M. Teisseire (LIRMM, Montpellier); 2) ARC Valex: `` Vérification et exploitation de collections de documents
            scientifiques semi-structurés'' (resp: A.-M. Vercoustre) with Annie Morin (TEXMEX, IRISA Rennes), A. Napoli (Orpailleur, INRIA, Nancy), Nathalie Aussenac (IRIT, Toulouse)</p>
          </li>
          <li id="uid179">
            <p>GRIMM-SMASH team (Université Toulouse Le Mirail): F. Rossi works with Nathalie Villa on Support Vector Machines and functional data (cf section 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid108" location="intern" xyref="1958661692013"/>and 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid33" location="biblio" xyref="1958661692013"/>, 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid32" location="biblio" xyref="1958661692013"/>).</p>
          </li>
          <li id="uid180">
            <p>LITA EA3097 (Université de Metz): F. Rossi and A. El Golli work with Brieuc Conan-Guez on the Self Organizing Map for dissimilarity matrices (see section 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid107" location="intern" xyref="1958661692013"/>and 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid30" location="biblio" xyref="1958661692013"/>). F. Rossi works with Brieuc Conan-Guez on functional data analysis (cf section 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid108" location="intern" xyref="1958661692013"/>and 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid34" location="biblio" xyref="1958661692013"/>, 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid35" location="biblio" xyref="1958661692013"/>, 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid36" location="biblio" xyref="1958661692013"/>).</p>
          </li>
        </simplelist>
      </subsection>
    </subsection>
    <subsection level="1" id="uid181">
      <bodyTitle>European Initiatives</bodyTitle>
      <subsection level="2" id="uid182">
        <bodyTitle>EuropeAID Project: For Archaeology of Ancient Asian Texts (AAT)</bodyTitle>
        <participants category="None">
          <person key="axis-2005-id18244">
            <firstname>Marc</firstname>
            <lastname>Csernel</lastname>
          </person>
          <person key="axis-2005-id18372">
            <firstname>Sergiu</firstname>
            <lastname>Chelcea</lastname>
          </person>
          <person key="axis-2005-id18560">
            <firstname>Marina</firstname>
            <lastname>Dufresne</lastname>
          </person>
          <person key="axis-2005-id18098">
            <firstname>Yves</firstname>
            <lastname>Lechevallier</lastname>
          </person>
          <person key="axis-2005-id18678">
            <firstname>Sattisvar</firstname>
            <lastname>Tandabany</lastname>
          </person>
          <person key="axis-2005-id18078">
            <firstname>Brigitte</firstname>
            <lastname>Trousse</lastname>
          </person>
        </participants>
        <p>This year we started our project called ``AAT'' in the context of the EuropAid (DG1) projects and more precisely of the Asia Information Technology (I.T. Asia). We collaborated mainly with François Patte (UFR Maths-Informatique, UNiv Parie 5 René Descartes) and Pascale Haag (EHESS,
        Centre d'études de l'Inde et de l'Asie du Sud, Paris).</p>
        <subsection level="3" id="uid183">
          <bodyTitle>The objective of the AAT</bodyTitle>
          <p>Ancient texts, whether religious, scientific or philosophic are known to us due to the patient and vigilant work of scribes who, from centuries to centuries, have copied and copied again successive versions of an original text (usually lost for ever).</p>
          <p>So there is a chain of copies starting with the original text and continued by an immense tree of hundreds of copies that has grown more or less like a genealogical tree. They are never identical to each other, sometimes extremely different. Parts of the original are missing, fragments
          are not readable anymore, some have been miscopied, and some others have been voluntarily transformed. This is particularly true for the large Indian subcontinent where at least one third of the manuscript existing through the whole world are supposed to exist, mostly unpreserved ,
          unreferenced , and being at mercy of any accidental event. Even during the 20th century manuscripts were copied by hand by armies of scholars.</p>
          <p>Still a question remains unsolved as to how to compare hundreds of different copies of a same original ancient text, and to decide which fragments are original and which ones are not in order to re-build the original document.</p>
          <p>Specific software has recently been designed for Latin and Greek scripts which open new avenues to study ancient texts from Roman and Hellenistic periods. It is the aim of the present project to design a most advanced IT tool for ``archaeology of ancient Asian texts''. Such IT Tool
          will be based strictly on open source.</p>
        </subsection>
        <subsection level="3" id="uid184">
          <bodyTitle>Contributions to program</bodyTitle>
          <p>This project involves Axis as the applicant of the project and three others partners: University ``La Sapienza'' in Rome (Facoltà di Studi Orientali), the Bhandarkar Institute of Oriental Studies (BORI) in Poona (India) and the Mahendra Sanskrit University de Kathmandu (Népal).</p>
          <p>Our three partners will dedicate their force to the collection of manuscripts of a famous Indian grammatical text: The Kâçikâvritti or ``Benares glosses''. This text is the oldest comment (around the 7th century) of the Panini grammar, the world oldest example of generative grammar. It
          is well known trough hundreds of manuscripts disseminated all around the Indian subcontinent. These manuscripts are dated from the 12th century to the beginning of the 20th century. They are supposed to display the representation of the same text, but because of the time, their
          completeness is only partially assumed, and they can differ from each other.</p>
          <p noindent="true">Axis is providing the necessary software to reach two different goals which can be completed only one after the other:</p>
          <simplelist>
            <li id="uid185">
              <p>Providing the software tools necessary to help the creation of critical edition of the Sanskrit texts. As a secondary result, a distance between the texts should be established based on the presence/absence of the different words in each manuscript (cf. sections 
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid84" location="intern" xyref="1958661692013"/>, 
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid100" location="intern" xyref="1958661692013"/>).</p>
            </li>
            <li id="uid186">
              <p>Using the distance established by the first software sets, trying to establish which are the different cluster set of manuscript (for example via a 2-3 HAC clustering), try to establish more or less a phylogeny of the different manuscripts</p>
            </li>
          </simplelist>
          <p>One could wonder what is the need for a specific project to compare different Sanskrit texts, as tools such as the famous Unix DIFF exist since a long time. The response is given by some of the Sanskrit writing specificities:</p>
          <simplelist>
            <li id="uid187">
              <p>Sanskrit is written according to a 48 letter alphabet, but, on computer, is written using Latin alphabet using a transliteration such as the Velthuis one.</p>
            </li>
            <li id="uid188">
              <p>Sanskrit is written without blank and the blanks are not very significant</p>
            </li>
            <li id="uid189">
              <p>When two words are written without blank separation, the spelling becomes different, it is the sandhi problem.</p>
            </li>
          </simplelist>
          <p>Three internships were carried out on this project: S. Tandabany (cf. section 
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid84" location="intern" xyref="1958661692013"/>), M. Dufresne and S. Kebbache (cf. section 
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid100" location="intern" xyref="1958661692013"/>).</p>
        </subsection>
      </subsection>
      <subsection level="2" id="uid190">
        <bodyTitle>ERCIM</bodyTitle>
        <p>B. Trousse presented AxIS researches at the Kickoff meeting of the ERCIM Working group on ``Data and Information Mining'' organised by Christoph Schommer on january 14th at the Campus Kirchberg (University of Luxembourg).</p>
      </subsection>
      <subsection level="2" id="uid191">
        <bodyTitle>Other Collaborations</bodyTitle>
        <simplelist>
          <li id="uid192">
            <p>Portugal: B. Trousse collaborated with F. Amilcar Cardoso (amilcar@dei.uc.pt) in the context of the COST Action 282 (2001-2005): ``Knowledge Exploration in Science and Technology''.</p>
            <p noindent="true">URL:
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.mpa-garching.mpg.de/~opmolsrv/COST282/" location="extern" xyref="2784090054023">http://www.mpa-garching.mpg.de/~opmolsrv/COST282/</ref>.</p>
          </li>
          <li id="uid193">
            <p>Italy, University of Napoli II (Profs C. Lauro and R. Verde) : Y. Lechevallier, A. El Golli, D. Tanasa and B. Trousse</p>
          </li>
          <li id="uid194">
            <p>Italy, KDD Lab. Instituto ISTI, (Fosca Gianotti): some potential collaborations were identified after the ERCIM kickoff meeting.</p>
          </li>
          <li id="uid195">
            <p>Belgium, Facultés Universitaires Notre-Dame de la Paix à Namur (Profs A. Hardy, M. Noirhomme and J.-P. Rasson) 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid12" location="biblio" xyref="1958661692013"/>: Y.  Lechevallier.</p>
          </li>
          <li id="uid196">
            <p>Belgium, Université Catholique de Louvain, DICE Laboratory (Prof. Michel Verleysen, Prof. Vincent Wertz, Dr. Amaury Lendasse, Damien François): F. Rossi was invited professor for one month in 2005 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid66" location="biblio" xyref="1958661692013"/>, 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid67" location="biblio" xyref="1958661692013"/>.</p>
          </li>
        </simplelist>
      </subsection>
    </subsection>
    <subsection level="1" id="uid197">
      <bodyTitle>International Initiatives</bodyTitle>
      <subsection level="2" id="uid198">
        <bodyTitle>Australia</bodyTitle>
        <p>A-M. Vercoustre collaborates with RMIT, Computer Science department, Melbourne, Australia, on analysing and improving XML search from the point of view of the user 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid55" location="biblio" xyref="1958661692013"/>, 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid57" location="biblio" xyref="1958661692013"/>, 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid56" location="biblio" xyref="1958661692013"/>. This work is mostly done in the context of the Initiative for the Evaluation of XML Retrieval (
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://inex.is.informatik.uni-duisburg.de:2004/" location="extern" xyref="2251329905031">INEX-2004</ref>), DELOS network of Excellence.</p>
      </subsection>
      <subsection level="2" id="uid199">
        <bodyTitle>Brazil</bodyTitle>
        <p>We continue our collaboration on clustering and web usage mining with F.A.T. de Carvalho from Federal University of Pernambuco (Recife) and his team. We welcomed F.A.T. de Carvalho, during 3 months, September to November. During this year some analysis of Recife Log files are carried out
        by students from Recife University, Napoly University and by AxIS members. Common papers have been proposed at EGC and IFCS. Moreover, we have finished the submission of an article for Computational Statistics Journal (Springer). A poster was presented during the meeting (October 13 to 14)
        on information technologies of Brazil. We have proposed a joint research projet in the framework of the cooperation between INRIA and FACEPE. We also welcomed Thesera Ludemir, during 15 days which has worked with Fabrice Rossi on neural methods.</p>
        <p>Two internships were done on this project:</p>
        <simplelist>
          <li id="uid200">
            <p>A. Da Silva, Clustering in Web Usage Mining with Recife Log files and workbench of PKDD (cf. section 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid125" location="intern" xyref="1958661692013"/>) 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid46" location="biblio" xyref="1958661692013"/>, 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid47" location="biblio" xyref="1958661692013"/>.</p>
          </li>
          <li id="uid201">
            <p>N. Lopes Calvacanti Junior has started an internship in October 2005 (planned ending date: march 2006). He is working on the implementation of the Self Organizing Map on dissimilarity matrices (see section 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid107" location="intern" xyref="1958661692013"/>).</p>
          </li>
        </simplelist>
      </subsection>
      <subsection level="2" id="uid202">
        <bodyTitle>Canada</bodyTitle>
        <p>Y. Lechevallier pursued his collaboration with A. Ciampi (Univ of McGill, Montréal).</p>
        <p>Osmar Zaiane, Professor at the university of Alberta (Canada), visited us during five days at Inria Sophia Antipolis. He participated in Doru Tanasa's Ph.D. committee on 3rd June.</p>
      </subsection>
      <subsection level="2" id="uid203">
        <bodyTitle>India</bodyTitle>
        <p>Marc Csernel collaborated with the Bhandrakar Institute (India) and the Mahendra Sanskrit University (Nepal) via the CNRS action ``History of Knowledge'' (cf. section 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid166" location="intern" xyref="1958661692013"/>) and also via the consortium members of EuropeAid projet of Asia-Information Technology and
        Communications (
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid84" location="intern" xyref="1958661692013"/>, 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#uid182" location="intern" xyref="1958661692013"/>).</p>
      </subsection>
      <subsection level="2" id="uid204">
        <bodyTitle>Morocco</bodyTitle>
        <p>AxIS is involved in a France-Morocco thematic network in software engineering. In this context, B. Trousse co-supervises with Abdelaziz Marzark (University of Casablanca) a Ph.D. student: H. Behja (ENSAM, Meknès, Morocco). H. Behja visited us for his thesis work during the summer
        period and also for our annual AxIS workshop (october 24-26). Mr. Marzark visited us in November (10-13).</p>
      </subsection>
      <subsection level="2" id="uid205">
        <bodyTitle>Romania</bodyTitle>
        <p>We maintained our contacts with the Computer Science department of the West University of Timisoara (Prof Viorel Negru), in particular via the SYNASC conference every year.</p>
      </subsection>
      <subsection level="2" id="uid206">
        <bodyTitle>Tunisia</bodyTitle>
        <p>Y. Lechevallier was invited in January by ENIT (professor Ben Ahmed) at Tunis for a tutorial on ``Data Mining and Neural Methods''. Possible cooperations were studied via a co-supervision of future doctoral students.</p>
      </subsection>
    </subsection>
  </international>
  <diffusion id="uid207">
    <bodyTitle>Dissemination</bodyTitle>
    <subsection level="1" id="uid208">
      <bodyTitle>Promotion of the Scientific Community</bodyTitle>
      <subsection level="2" id="uid209">
        <bodyTitle>Journals</bodyTitle>
        <p>AxIS members belongs to editorial boards of two international journals and three national journals:</p>
        <simplelist>
          <li id="uid210">
            <p>the Co-Design Journal (Editor: S. Scrivener, Coventry University, UK - Publisher: Swets &amp; Zeitlinger): B.Trousse</p>
          </li>
          <li id="uid211">
            <p>the Journal of Symbolic Data Analysis (JSDA) (Editor: E. Diday, electronic journal 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.jsda.unina2.it" location="extern" xyref="278549418019">http://www.jsda.unina2.it</ref>): Y. Lechevallier, F. Rossi and B. Trousse.</p>
          </li>
          <li id="uid212">
            <p>the RIA journal (&lt;&lt; Revue d'Intelligence Artificielle &gt;&gt;) (Hermès publisher; editor in chief: M. Pomerol): B. Trousse.</p>
          </li>
          <li id="uid213">
            <p>the I3 electronic journal of the GDR-I3 (editor-in-chief: C. Garbay et H. Prade) 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.Revue-I3.org/" location="extern" xyref="1957798662018">http://www.Revue-I3.org/</ref>: B. Trousse.</p>
          </li>
          <li id="uid214">
            <p>La revue MODULAD (electronic journal, 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.modulad.fr/" location="extern" xyref="1368920875004">http://www.modulad.fr/</ref>): Y. Lechevallier is one of the main editors and F. Rossi
            is a member of the editorial board</p>
          </li>
        </simplelist>
        <p>F. Masséglia and B. Trousse were invited editors (with O. Boussaid and P. Gancarski) of a Special issue of the RNTI (Revue des Nouvelles Technologies de l'Information) on ``Complex Data Mining'' 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid68" location="biblio" xyref="1958661692013"/>. Y. Lechevallier was a member of the editorial board and A-M. Vercoustre was an additional reviewer.</p>
        <p>AxIS members were reviewers for sixteen international and national journals and for one international book</p>
        <simplelist>
          <li id="uid215">
            <p>the IEEE Journal of Transactions on Data and Knowledge Engineering (TDKE): F. Masséglia, B. Trousse (
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.computer.org/tkde" location="extern" xyref="2730187461021">http://www.computer.org/tkde/</ref>)</p>
          </li>
          <li id="uid216">
            <p>the International Journal 'Behaviour &amp; Information Technology' (BIT: Taylor &amp; Francis Publisher)</p>
          </li>
          <li id="uid217">
            <p>the Information Systems (IS) Journal: F. Masséglia. (
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://ees.elsevier.com/is/" location="extern" xyref="1809251950019">http://ees.elsevier.com/is/</ref>)</p>
          </li>
          <li id="uid218">
            <p>the Data Mining and Knowledge Discovery (DMKD) Journal (twice): F. Masséglia (
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="https://www.editorialmanager.com/dami/" location="extern">https://www.editorialmanager.com/dami/</ref>)</p>
          </li>
          <li id="uid219">
            <p>the Journal of Systems and Software (JSS): F. Masséglia. (
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://ees.elsevier.com/jss/" location="extern" xyref="3946825542009">http://ees.elsevier.com/jss/</ref>)</p>
          </li>
          <li id="uid220">
            <p>the Data and Knowledge Engineering Journal (DKE): F. Masséglia. (
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.sciencedirect.com/science/journal/0169023X" location="extern" xyref="4294246138023">http://www.sciencedirect.com/science/journal/0169023X</ref>)</p>
          </li>
          <li id="uid221">
            <p>La revue Modulad: F. Rossi (
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.modulad.fr/" location="extern" xyref="1368920875004">http://www.modulad.fr/</ref>)</p>
          </li>
          <li id="uid222">
            <p>Computational Statistics: F. Rossi (
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://comst.wiwi.hu-berlin.de/" location="extern" xyref="554549228027">http://comst.wiwi.hu-berlin.de/</ref>)</p>
          </li>
          <li id="uid223">
            <p>Scandinavian Journal of Statistics: F. Rossi (
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.blackwellpublishing.com/journal.asp?ref=0303-6898" location="extern" xyref="2402882575001">
            http://www.blackwellpublishing.com/journal.asp?ref=0303-6898</ref>)</p>
          </li>
          <li id="uid224">
            <p>Computational Statistics and Data Analysis: F. Rossi (
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.elsevier.com/locate/csda" location="extern" xyref="1901695244023">http://www.elsevier.com/locate/csda</ref>)</p>
          </li>
          <li id="uid225">
            <p>Neural Processing Letters: F. Rossi</p>
            <p noindent="true">(
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.springerlink.com/openurl.asp?genre=journal&amp;issn=1370-4621" location="extern" xyref="3924716557008">
            http://www.springerlink.com/openurl.asp?genre=journal&amp;issn=1370-4621</ref>)</p>
          </li>
          <li id="uid226">
            <p>Revue de Statistique Appliquée: F. Rossi (
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.sfds.asso.fr/publicat/rsa.htm" location="extern" xyref="550110558030">http://www.sfds.asso.fr/publicat/rsa.htm</ref>)</p>
          </li>
          <li id="uid227">
            <p>Neurocomputing (twice): F. Rossi (
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.elsevier.com/locate/issn/09252312" location="extern" xyref="1498269453000">http://www.elsevier.com/locate/issn/09252312</ref>)</p>
          </li>
          <li id="uid228">
            <p>Computational Geosciences: F. Rossi (
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.springeronline.com/journal/10596/about" location="extern" xyref="1892160293016">http://www.springeronline.com/journal/10596/about</ref>)</p>
          </li>
          <li id="uid229">
            <p>Control and Intelligent Systems Journal: F. Rossi (
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href=" http://www.actapress.com/Content_of_Journal.aspx?journalID=58" location="extern" xyref="1860799827020">
            http://www.actapress.com/Content_of_Journal.aspx?journalID=58</ref>)</p>
          </li>
          <li id="uid230">
            <p>AI Communications: F. Rossi (
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://aicom.web.cse.unsw.edu.au/" location="extern" xyref="3381966838022">http://aicom.web.cse.unsw.edu.au/</ref>)</p>
          </li>
          <li id="uid231">
            <p>Book on ``Processing and Managing Complex Data for Decision Support'': F. Masséglia, B. Trousse. (
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://chirouble.univ-lyon2.fr/bderic/publications/index.php" location="extern" xyref="1299921038016">
            http://chirouble.univ-lyon2.fr/bderic/publications/index.php</ref>)</p>
          </li>
        </simplelist>
      </subsection>
      <subsection level="2" id="uid232">
        <bodyTitle>Program Committees</bodyTitle>
        <p>Several AxIS members were involved at national or international conferences/worhshops as member of Program Committee or as additional reviewer. Let us note that we organized this year two workshops this year (FDC at EGC05 and MDM/KDD'05).</p>
        <subsection level="3" id="uid233">
          <bodyTitle>National Conferences/Workshops</bodyTitle>
          <simplelist>
            <li id="uid234">
              <p>Atelier FDC Fouille de Données Complexes (at EGC'05): F. Masséglia (co-chair), B. Trousse, F. Rossi (additional reviewer) (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-sop.inria.fr/axis/fdc-egc05/FDC05_CFP.htm" location="extern" xyref="471387673029">http://www-sop.inria.fr/axis/fdc-egc05/FDC05_CFP.htm</ref>)</p>
            </li>
            <li id="uid235">
              <p>EGC'05 (Paris, January) Extraction et Gestion des Connaissances: Y. Lechevallier, F. Rossi (additional reviewer) and B. Trousse. (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.math-info.univ-paris5.fr/egc2005/index.php" location="extern" xyref="447845164014">http://www.math-info.univ-paris5.fr/egc2005/index.php</ref>)</p>
            </li>
            <li id="uid236">
              <p>Atelier sur la modélisation utilisateurs et personnalisation de l'interaction homme-machine (at EGC'2005): B. Trousse (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-connex.lip6.fr/~artieres/EGC/Atelier_MU_EGC.html" location="extern" xyref="2651474602009">
              http://www-connex.lip6.fr/~artieres/EGC/Atelier_MU_EGC.html</ref>)</p>
            </li>
            <li id="uid237">
              <p>Plateforme AFIA 2005, atelier RàPC Raisonnement à Partir de Cas (Nice, May): B. Trousse (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-sop.inria.fr/acacia/afia2005/rapc/" location="extern" xyref="4287531767019">http://www-sop.inria.fr/acacia/afia2005/rapc/</ref>)</p>
            </li>
            <li id="uid238">
              <p>CORIA 2005 (Grenoble, March) Conférence en Recherche d'Informations et Applications: B. Trousse (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-clips.imag.fr/mrim/coria05/main_coria.html" location="extern" xyref="3023635605020">
              http://www-clips.imag.fr/mrim/coria05/main_coria.html</ref>)</p>
            </li>
            <li id="uid239">
              <p>UBIMOB 2005 Mobilité et Ubiquité (Grenoble, France, June): B. Trousse (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-lsr.imag.fr/UbiMob05/index.html" location="extern" xyref="1451039459008">http://www-lsr.imag.fr/UbiMob05/index.html</ref>)</p>
            </li>
            <li id="uid240">
              <p>SSTIC 2005 (Rennes, June) Symposium sur la Sécurité des Technologies de l'Information et des Communications: F. Rossi (additional reviewer) (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.sstic.org/SSTIC05/info.do" location="extern" xyref="3911104544018">http://www.sstic.org/SSTIC05/info.do</ref>)</p>
            </li>
            <li id="uid241">
              <p>BDA 2005 (Saint-Malo, October) Conférence Bases de Données Avancées: F. Masséglia (additional reviewer).</p>
            </li>
          </simplelist>
        </subsection>
        <subsection level="3" id="uid242">
          <bodyTitle>International Conferences/Workshops</bodyTitle>
          <simplelist>
            <li id="uid243">
              <p>MDM/KDD'05 the sixth International Workshop on Multimedia Data Mining 
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid69" location="biblio" xyref="1958661692013"/>held in conjunction with KDD'05, Chicago, USA): F. Masséglia was co–chair with Fatma Bouali (Univ.
              Lille) and Latifur Khan (Univ. Texas at Dallas). (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-sop.inria.fr/axis/mdm-kdd05/MDM05.htm" location="extern" xyref="885968027025">http://www-sop.inria.fr/axis/mdm-kdd05/MDM05.htm</ref></p>
            </li>
            <li id="uid244">
              <p>GfKI 2005 (Magdeburg, Germany, March) 29th annual conference of the German Classification Societe - From Date and Information Analysis to Knowledge Engineering: F. Rossi (additional reviewer) (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://omen.cs.uni-magdeburg.de/itikmd/gfkl2005/" location="extern" xyref="2791459872022">http://omen.cs.uni-magdeburg.de/itikmd/gfkl2005</ref>)</p>
            </li>
            <li id="uid245">
              <p>WWW 2005 (Valencia, Spain, March) 1st Int'l Workshop on Automated Specification and Verification of Web Sites: T. Despeyroux (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.dsic.upv.es/workshops/wwv05/" location="extern" xyref="1438745794026">http://www.dsic.upv.es/workshops/wwv05/</ref>)</p>
            </li>
            <li id="uid246">
              <p>ESANN 2005 (Bruges, Belgium, April) 13th European Symposium on Artificial Neural Network: F. Rossi (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.dice.ucl.ac.be/esann/" location="extern" xyref="360472534016">http://www.dice.ucl.ac.be/esann/</ref>)</p>
            </li>
            <li id="uid247">
              <p>CSCW 2005 (Coventry, UK, May) 9th International Conference on CSCW in Design: B. Trousse (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://2005.cscwid.org/" location="extern" xyref="2897834382012">http://2005.cscwid.org/</ref>)</p>
            </li>
            <li id="uid248">
              <p>CIR 2005 (Paris, July)International Workshop on Context-Based Information Retrieval: A-M. Vercoustre (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://wwwsi.supelec.fr/bld/CIR-2005/" location="extern" xyref="3684192361025">http://wwwsi.supelec.fr/bld/CIR-2005/</ref>)</p>
            </li>
            <li id="uid249">
              <p>IJCAI 2005 (Edinburg, Scotland, Aug.) 19th International Joint Conference on Artificial Intelligence: B. Trousse (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://ijcai05.csd.abdn.ac.uk/" location="extern" xyref="997844372016">http://ijcai05.csd.abdn.ac.uk/</ref>)</p>
            </li>
            <li id="uid250">
              <p>ACM SIGIR 2005 (Salvador, Brazil, August)Conference on Research and Development in Information Retrieval, posters: A-M. Veroustre (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.dcc.ufmg.br/eventos/sigir2005/" location="extern" xyref="3452304342015">http://www.dcc.ufmg.br/eventos/sigir2005/</ref>)</p>
            </li>
            <li id="uid251">
              <p>6th International Workshop on Multimedia Data Mining, in conjunction with KDD-2005 (Chicago, USA, August): F. Masséglia, B. Trousse (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-sop.inria.fr/axis/mdm-test/content.htm" location="extern" xyref="3955096940027">http://www-sop.inria.fr/axis/mdm-test/content.htm</ref>)</p>
            </li>
            <li id="uid252">
              <p>ICCBR 2005 (Chicago, USA, August) 6th International Conference on Case-Based Reasoning: B. Trousse (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.iccbr.org:8080/iccbr05/index.jsp" location="extern" xyref="3491870093010">http://www.iccbr.org:8080/iccbr05/index.jsp</ref>)</p>
            </li>
            <li id="uid253">
              <p>ICANN 2005 (Warsaw, Poland, September) International Conference on Artificial Neural Networks: F. Rossi (additionnal reviewer) (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.ibspan.waw.pl/ICANN-2005/" location="extern" xyref="3065585202006">http://www.ibspan.waw.pl/ICANN-2005/</ref>)</p>
            </li>
            <li id="uid254">
              <p>Intellicom 2005 (Montreal, Canada, October) IFIP International Conference on Intelligence in Communication Systems: A-M. Vercoustre (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.congresbcu.com/intellcomm2005/" location="extern" xyref="3285957120021">http://www.congresbcu.com/intellcomm2005/</ref>)</p>
            </li>
            <li id="uid255">
              <p>ACM DocEng 2005 (Bristol, UK, November) Symposium on Document Engineering: A-M. Vercoustre (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.documentengineering.org/" location="extern" xyref="2866817910003">http://www.documentengineering.org/</ref>)</p>
            </li>
            <li id="uid256">
              <p>ADCS 2005 (Sidney, Australia, December) 10th Australasian Document Computing Symposium: A-M. Vercoustre (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://goanna.cs.rmit.edu.au/~aht/adcs2005/" location="extern" xyref="3869029670014">http://goanna.cs.rmit.edu.au/~aht/adcs2005/</ref>)</p>
            </li>
            <li id="uid257">
              <p>ICPReMI'05 (Kolkata, India, December) Technical session on Symbolic Data Analysis: M. Csernel (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.isical.ac.in/~premi05/" location="extern" xyref="2112732845023">http://www.isical.ac.in/~premi05/</ref>)</p>
            </li>
            <li id="uid258">
              <p>MSTD 2005 (Porto, Portugal) the first international workshop on Mining Spatio-Temporal Data (held in conjunction with PKDD'05): F. Masséglia. (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.di.uniba.it/~malerba/activities/mstd/" location="extern" xyref="1312152829002">http://www.di.uniba.it/~malerba/activities/mstd/</ref>)</p>
            </li>
            <li id="uid259">
              <p>IDEAS 2005 (Montreal, Canada) the 9th International Database Engineering &amp; Application Symposium: F. Masséglia (additional reviewer). (
              <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://ideas.concordia.ca/ideas2005/" location="extern" xyref="471127949011">http://ideas.concordia.ca/ideas2005/</ref>)</p>
            </li>
          </simplelist>
        </subsection>
      </subsection>
      <subsection level="2" id="uid260">
        <bodyTitle>Invited Seminars</bodyTitle>
        <simplelist>
          <li id="uid261">
            <p>ENIT Tunisia, Séminaire RAIDI: Y. Lechevallier (``Classification automatique dans le Web Usage Mining''), january.</p>
          </li>
          <li id="uid262">
            <p>Project Team CORTEX (LORIA), March 2005: F. Rossi (``Une implémentation efficace du SOM sur tableau de dissimilarités'')</p>
          </li>
          <li id="uid263">
            <p>Common day between the following scientific associations SFDS, EGC, SFC, INFORSID and AFIA, March 21, organised by the French Society of Statistics (SFdS): Y. Lechevallier (``Le tableau de données, une structure unique, des réalités multiples'').</p>
          </li>
          <li id="uid264">
            <p>Machine Learning Group (DICE Laboratory), Université Catholique de Louvain (Belgium), June 2005: F. Rossi (``Classification in Functional Spaces with Support Vector Machines'')</p>
          </li>
          <li id="uid265">
            <p>National Group on ``Mining Complexe data'', H. Behja, september 9, Uiversity of Lyon II. ``Vers une approche web sémantique du processus d'ECD''.</p>
          </li>
          <li id="uid266">
            <p>Seminar ``Logiciels libres en Data Mining'', October 13, organised by the French Society of Statistics (SFdS), InfoStat group , Data Mining et Logiciels: Y. Lechevallier (``WEKA, un logiciel libre en Data Mining'').</p>
          </li>
          <li id="uid267">
            <p>E.N.S. ``Ecole Normale Supérieure''(Ulm, Paris): M. Csernel presented a conference entitled ``Grammaire et mathématiques dans le monde indien: histoire des savoirs, histoire des textes et nouvelles technologies au service de la philologie'' in december.</p>
          </li>
        </simplelist>
      </subsection>
      <subsection level="2" id="uid268">
        <bodyTitle>Organization of Conferences or Workshops</bodyTitle>
        <p>Besides the organization of the workshops FDC/EGC'05) and MDM/KDD'05, we are involved in others organization tasks:</p>
        <simplelist>
          <li id="uid269">
            <p>Member of the organizing committee of the first IEEE international workshop on ``Mining Complex Data'' (held in conjunction with ICDM, Houston, November): F. Masséglia.</p>
          </li>
          <li id="uid270">
            <p>Organisation of our annual AxIS workshop at Inria Rocquencourt (24-26 october): S. Aubin, S. Honnorat, Y. Lechevallier and B. Trousse. Monthly team meetings were organised by videoconferecne between AxIS Sophia Antipolis and AxIS Rocquencourt.</p>
          </li>
        </simplelist>
      </subsection>
      <subsection level="2" id="uid271">
        <bodyTitle>AxIS Web Server</bodyTitle>
        <p>AxIS maintains an external and an internal Web site allowing the access to lots of information, including software developed in the team, our publications, relevant events (conferences, workshops) and information related to the conferences and seminar we organise. URL:
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-sop.inria.fr/axis/" location="extern" xyref="835040938007">http://www-sop.inria.fr/axis/</ref>.</p>
        <p noindent="true">S. Chelcea delevoped our publication management tool called ``BibAdmin''. BibAdmin is a collection of PHP/MySQL scripts for bibliographic (Bibtex) management over the Web. Publications are stored in a MySQL database and can be added/edited/modified via a Web
        interface. It is specially designed for research teams to easily manage their publications or references and to make their results more visible. Users can build different private/public bibliographies which can be then used to compile LaTeX documents. BibAdmin is made available under the
        GNU GPL license on INRIA's GForge server at: 
        <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://gforge.inria.fr/projects/bibadmin/" location="extern" xyref="957534047010">http://gforge.inria.fr/projects/bibadmin/</ref></p>
      </subsection>
      <subsection level="2" id="uid272">
        <bodyTitle>Activities of General Interest</bodyTitle>
        <simplelist>
          <li id="uid273">
            <p>T. Despeyroux is president of AGOS (Inria Works Council), a permanent member of the ``commission technique paritaire (CTP)'' and a member of the Inria Board of Directors (Conseil d'Administration) as a scientific staff representative.</p>
          </li>
          <li id="uid274">
            <p>T. Despeyroux is participating in the project for redesigning the intranet Web site of Inria-Rocquencourt.</p>
          </li>
          <li id="uid275">
            <p>B. Senach is involved in the Inria Sophia Antipolis support committee of the world-wide competitivity pole ``Solutions Communicantes Sécurisées''</p>
          </li>
          <li id="uid276">
            <p>B. Trousse is a member of the scientific committee and also a substitute member of the decision committee of the ``Laboratoire des Usages des NTIC'' of Sophia Antipolis.</p>
          </li>
          <li id="uid277">
            <p>B. Trousse is a member of the RSTI scientific committee related to the &lt;&lt; ISI, L'OBJET, RIA, TSI &gt;&gt; journals (Hermès publisher).</p>
          </li>
          <li id="uid278">
            <p>A-M Vercoustre is involved (25%) in the Department for Scientific Information and Communication (DISC), working on Inria policy and tools for scientific publications, in particular the development of an Open Archive in cooperation with CNRS.</p>
          </li>
        </simplelist>
      </subsection>
    </subsection>
    <subsection level="1" id="uid279">
      <bodyTitle>Formation</bodyTitle>
      <subsection level="2" id="uid280">
        <bodyTitle>University Teaching</bodyTitle>
        <p>AxIS is an associated team for the ``STIC Doctoral school'' at the University of Nice Sophie Antipolis (UNSA) and the team members are teaching in various university curriculums:</p>
        <simplelist>
          <li id="uid281">
            <p>``DEA Informatique'' (resp. Mr Kounalis) at UNSA Sophia Antipolis: Optional tutorial on ``Web usage Mining'' (F. Masséglia, B. Trousse).</p>
          </li>
          <li id="uid282">
            <p>``Licence professionnelle franco-italienne: Statistiques et Traitement Informatique de Données (STID)'' (resp. J. Lemaire) at UNSA, Menton: Supervision of a student project (60h by students, 10 students, 30h supervised) on 
            <i>Mining HTTP Logs From Inria's Web Sites</i>: S. Chelcea, B. Trousse.</p>
          </li>
          <li id="uid283">
            <p>International University of Monaco, three courses (D. Tanasa): Programming Techniques (90h), Business Analysis and Systems Design (45h), Management of Information Systems (25h).</p>
          </li>
          <li id="uid284">
            <p>``DEA Modélisation et traitement des données et des connaissances'' (resp: S. Pinson) of the University Paris IX-Dauphine (4h): Tutorial on 
            <i>``Analyse des connaissances numériques et Symboliques''</i>: Y. Lechevallier.</p>
          </li>
          <li id="uid285">
            <p>``DESS Mathématiques appliquées et sciences économiques (MASE)'' of the University Paris IX-Dauphine: Tutorial (18h) on 
            <i>``Méthodes neuronales en classification''</i>: Y. Lechevallier.</p>
          </li>
          <li id="uid286">
            <p>``ENSAE'': Tutorial on 
            <i>``Data Mining''</i>(12h): Y. Lechevallier.</p>
          </li>
          <li id="uid287">
            <p>``ENIT /Tunis'': Tutorial on 
            <i>``Data Mining et méthodes neuronales''</i>(12h): Y. Lechevallier.</p>
          </li>
        </simplelist>
      </subsection>
      <subsection level="2" id="uid288">
        <bodyTitle>Ph.D. Thesis</bodyTitle>
        <p>Ph.D. defence in 2005:</p>
        <orderedlist>
          <li id="uid289">
            <p><b>D. Tanasa</b>, (start: end of 2001), ``Web Usage Mining: Contributions to Intersites Logs Preprocessing and Sequential Pattern Extraction with Low Support'' 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid48" location="biblio" xyref="1958661692013"/>), University of Nice-Sophia Antipolis (director: B. Trousse), june 3rd.</p>
          </li>
        </orderedlist>
        <p noindent="true">Ph.D. in progress:</p>
        <orderedlist>
          <li id="uid290">
            <p><b>S. Chelcea</b>, (start: end of 2002), ``Agglomerative 2-3 Hierarchical Clustering: theoretical and applicative study'', Université de Nice-Sophia Antipolis (directors: J. Lemaire and B. Trousse with the support of P. Bertrand on 2-3 AHC).</p>
          </li>
          <li id="uid291">
            <p><b>H. Behja</b>, (start: end of 2002), ``Gestion de points de vues multiples dans l'analyse d'un observatoire sur le Web'', University of Casablanca, (directors: A. Marzark and B. Trousse). This thesis is done in the context of the STIC Software engineering network of
            France-Morocco cooperation (2002-2005).</p>
          </li>
          <li id="uid292">
            <p><b>A. Baldé</b>, (start: end of 2003), ''Extraction de méta-données à partir de prototypes issus d'une classification'' (Metadata Extraction from classification prototypes), University of Paris IX Dauphine, (directors: E. Diday and Y. Lechevallier) with the participation of B. Trousse
            and M.-A. Aufaure (Supelec).</p>
          </li>
          <li id="uid293">
            <p><b>A Da Silva</b>, (start: October 2005), "Modélisation de données agrégées ou complexes par l'approche symbolique, application au Web Usage Mining", University of Paris IX Dauphine (directors: Edwin Diday and Yves Lechevallier).</p>
          </li>
          <li id="uid294">
            <p><b>A. Marascu</b>, (start: October 2005), ``Extraction de Motifs Séquentiels dans les Data Streams'', Université de Nice-Sophia Antipolis (director: Yves Lechevallier) with the participation of B. Trousse and F. Masseglia).</p>
          </li>
        </orderedlist>
        <p>F. Rossi is a member of the thesis committee of 
        <b>N. Delannay</b>(start: October 2003) on ``Méthodes neuronales pour les données structurées'', Université Catholique de Louvain, Belgium (director: Michel Verleysen).</p>
        <p spacebefore="12.0pt">AxIS researchers were members of Ph.D. committees in 2005:</p>
        <simplelist>
          <li id="uid295">
            <p>Doru Tanasa, ``Web Usage Mining: Contributions to Intersites Logs Preprocessing and Sequential Pattern Extraction with Low Support'', defended on 3rd. June 2005: B. Trousse, F. Masséglia</p>
          </li>
          <li id="uid296">
            <p>Cherif Mballo, `` Ordre, codage et extension du critère de Kolomogorov-Smirnov pour la segmentation de données symboliques'', December 12, Y. Lechevallier</p>
          </li>
          <li id="uid297">
            <p>Hani Hamdan, ``Developpement de méthodes de classification pour le contrôle d'émission accoustique d'appareils sous pression'', November 22, Y. Lechevallier</p>
          </li>
          <li id="uid298">
            <p>Nathalie Villa ``Éléments d'apprentissage en statistique fonctionnelle - Classification et régression fonctionnelles par réseaux de neurones et Support Vector Machine'', defended on October 21th, 2005: F. Rossi</p>
          </li>
          <li id="uid299">
            <p>Jonathan Mamou, ``XSEarch, un moteur de recherche pour XML combinant structure et contenu'', Univ. Paris 11, defended on 30th September 2005, Orsay: A.-M. Vercoustre</p>
          </li>
        </simplelist>
      </subsection>
      <subsection level="2" id="uid300">
        <bodyTitle>Internships</bodyTitle>
        <p>We welcomed eleven students in AXIS this year:</p>
        <orderedlist>
          <li id="uid301">
            <p><b>R. Busseuil</b>(supervisors S. Chelcea and B. Trousse), ENS Cachan and Inria Sophia-Antipolis, ``Classification des itinéraires pour l'aide á la navigation assistée par GPS'' 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid42" location="biblio" xyref="1958661692013"/>.</p>
          </li>
          <li id="uid302">
            <p><b>M. Fegas</b>(supervisor A.-M. Vercoustre), University of Orsay Paris-11 and Inria Rocquencourt, ``Classification de documents XML'' 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid52" location="biblio" xyref="1958661692013"/>.</p>
          </li>
          <li id="uid303">
            <p><b>M. Dufresne</b>(supervisors Marc Csernel, Yves lechevallier, Francois Patte), Univ. Paris XIII Institut galilée, Inria Rocquencourt, Interactive presentation of Critical edition of Sankrit texts.</p>
          </li>
          <li id="uid304">
            <p><b>S. Kebbache</b>(supervisors Marc Csernel, Yves lechevallier), Univ. Paris I Panthéon-Sorbonne, Inria Rocquencourt, Comparison of Sanskrit texts, aligment procedures.</p>
          </li>
          <li id="uid305">
            <p><b>A. Marascu</b>(supervisor F. Masséglia), University of Nice and Inria Sophia-Antipolis, ``Extraction de motifs séquentiels dans les data streams'' 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid70" location="biblio" xyref="1958661692013"/>.</p>
          </li>
          <li id="uid306">
            <p><b>S. Sellah</b>(supervisors F. Masséglia and B. Trousse), University of Lyon 2 and Inria Sophia Antipolis, 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid62" location="biblio" xyref="1958661692013"/>.</p>
          </li>
          <li id="uid307">
            <p><b>S. Tandabany</b>(supervisors S. Chelcea and B. Trousse), University of Orsay Paris-11, ENS Lyon and Inria Sophia Antipolis, ``Elaborating a Distance for Clusterig Homogeneous Sanskrit Documents'' 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid22" location="biblio" xyref="1958661692013"/>.</p>
          </li>
        </orderedlist>
        <p>Four of which were in the context of the Inria international internship program:</p>
        <orderedlist>
          <li id="uid308">
            <p><b>A. Da Silva</b>(supervisors Y. Lechevallier and B. Trousse), Recife University of Permenbouc (Brazil), Inria Rocquencourt, Inria International Internship Program.</p>
          </li>
          <li id="uid309">
            <p><b>C. Garboni</b>, West University of Timisoara (Romania) and Inria Sophia Antipolis, Inria International Internship Program 
            <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="#bid54" location="biblio" xyref="1958661692013"/>.</p>
          </li>
          <li id="uid310">
            <p><b>S. Gul</b>(supervisor A.-M. Vercoustre), MIT and Inria Rocquencourt, XML Document mining (in progress), Inria Internship Program.</p>
          </li>
          <li id="uid311">
            <p><b>N. Lopes Calvacanti Junior</b>(supervisor F. Rossi), Federal Univ. of Pernambuco, Brazil and Inria Rocquencourt, Implementation of a fast Dissimilarity Self-Organizing Map (in progress), Inria Internship Program.</p>
          </li>
        </orderedlist>
      </subsection>
    </subsection>
    <subsection level="1" id="uid312">
      <bodyTitle>Participation to Workshops, Conferences, Seminars, Invitations</bodyTitle>
      <p>Readers are kindly asked to report to the publication references for the participation to conferences with a submission process. Furthermore we attended the following conferences or workshops:</p>
      <simplelist>
        <li id="uid313">
          <p>EDA'05 (Entrepôts de Donnes et Analyse en ligne), Lyon, June 10: F. Masséglia.</p>
        </li>
        <li id="uid314">
          <p>Creating the information Commons for e-Science: Towards Institutional Policies and Guidelines for Action, UNESCO Headquarters, Paris, France, September 2005.</p>
        </li>
      </simplelist>
      <p>F. Rossi was invited professor for one month at the Université Catholique de Louvain (Belgium).</p>
      <p noindent="true">M. Csernel was invited in August in the framework ot the AAT project in two different EFEO branches in India: the Poonah branch and the Pondichery branch.</p>
    </subsection>
  </diffusion>
  <biblio id="bibliography" html="bibliography" numero="10" titre="Bibliography">
    <biblStruct rend="refer" n="cite:patrice5" type="article" id="bid82">
      <analytic>
        <title level="a">The 
        <hi rend="italic">k</hi>-weak hierarchical representations: an extension of the indexed closed weak hierarchies</title>
        <author>
          <persName>
            <foreName>Patrice</foreName>
            <surname>Bertrand</surname>
            <initial>P.</initial>
          </persName>
          <persName>
            <foreName>Melvin F.</foreName>
            <surname>Janowitz</surname>
            <initial>M. F.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">Discrete Applied Mathemathics</title>
        <imprint>
          <biblScope type="volume">127</biblScope>
          <biblScope type="number">2</biblScope>
          <dateStruct>
            <month>April</month>
            <year>2003</year>
          </dateStruct>
          <biblScope type="pages">199–220</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="refer" n="cite:Cha1" type="article" id="bid16">
      <analytic>
        <title level="a">A monothetic clustering method</title>
        <author>
          <persName>
            <foreName>Marie</foreName>
            <surname>Chavent</surname>
            <initial>M.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">Pattern Recognition Letters</title>
        <imprint>
          <biblScope type="volume">19</biblScope>
          <biblScope type="number">11</biblScope>
          <dateStruct>
            <month>September</month>
            <year>1998</year>
          </dateStruct>
          <biblScope type="pages">989-996</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="refer" n="cite:CHELCEA:2004:RFIA" type="inproceedings" id="bid17">
      <analytic>
        <title level="a">Un Nouvel Algorithme de Classification Ascendante 2-3 Hiérarchique</title>
        <author>
          <persName key="axis-2005-id18372">
            <foreName>Sergiu</foreName>
            <surname>Chelcea</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Patrice</foreName>
            <surname>Bertrand</surname>
            <initial>P.</initial>
          </persName>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Actes de 14ème Congrès Francophone AFRIF-AFIA de Reconnaissance des Formes et Intelligence Artificielle (RFIA 2004), Centre de Congrès Pierre BAUDIS, Toulouse, France</title>
        <imprint>
          <biblScope type="volume">3</biblScope>
          <dateStruct>
            <month>28-30 Janvier</month>
            <year>2004</year>
          </dateStruct>
          <biblScope type="pages">1471-1480</biblScope>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.laas.fr/rfia2004/actes/ARTICLES/388.pdf" location="extern" xyref="69049185012">http://www.laas.fr/rfia2004/actes/ARTICLES/388.pdf</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="refer" n="cite:marc2" type="article" id="bid81">
      <analytic>
        <title level="a">Usual Operations With Symbolic Data Under Normal Symbolic Form</title>
        <author>
          <persName key="axis-2005-id18244">
            <foreName>Marc</foreName>
            <surname>Csernel</surname>
            <initial>M.</initial>
          </persName>
          <persName key="axis-2005-id18451">
            <foreName>Francisco A. T.</foreName>
            <surname>De Carvalho</surname>
            <initial>F. A. T.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">Applied Stochastic Models in Business and Industry</title>
        <imprint>
          <biblScope type="volume">15</biblScope>
          <dateStruct>
            <year>1999</year>
          </dateStruct>
          <biblScope type="pages">241–257</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="refer" n="cite:Despeyroux:WWW2004" type="inproceedings" id="bid23">
      <analytic>
        <title level="a">Practical Semantic Analysis of Web Sites and Documents</title>
        <author>
          <persName key="axis-2005-id18152">
            <foreName>Thierry</foreName>
            <surname>Despeyroux</surname>
            <initial>T.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">The 13th World Wide Web Conference, WWW2004, New York City, USA</title>
        <imprint>
          <dateStruct>
            <month>17-22 May</month>
            <year>2004</year>
          </dateStruct>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-sop.inria.fr/axis/papers/04www/despeyroux-www2004.pdf" location="extern" xyref="3595020992030">
          http://www-sop.inria.fr/axis/papers/04www/despeyroux-www2004.pdf</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="refer" n="cite:ElGolliEtAlSFC2004SomWeb" type="inproceedings" id="bid87">
      <analytic>
        <title level="a">Une application des cartes topologiques auto-organisatrices à l'analyse des fichiers Logs</title>
        <author>
          <persName key="axis-2005-id18308">
            <foreName>Aïcha</foreName>
            <surname>El Golli</surname>
            <initial>A.</initial>
          </persName>
          <persName key="axis-2005-id18273">
            <foreName>Brieuc</foreName>
            <surname>Conan-Guez</surname>
            <initial>B.</initial>
          </persName>
          <persName key="axis-2005-id18259">
            <foreName>Fabrice</foreName>
            <surname>Rossi</surname>
            <initial>F.</initial>
          </persName>
          <persName key="axis-2005-id18416">
            <foreName>Doru</foreName>
            <surname>Tanasa</surname>
            <initial>D.</initial>
          </persName>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
          <persName key="axis-2005-id18098">
            <foreName>Yves</foreName>
            <surname>Lechevallier</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Actes des onzièmes journées de la Société Francophone de Classification, Bordeaux, France</title>
        <imprint>
          <dateStruct>
            <month>Septembre</month>
            <year>2004</year>
          </dateStruct>
          <biblScope type="pages">181–184</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="refer" n="cite:Guichard2004a" type="book" id="bid84">
      <monogr>
        <title level="m">Mesures de l'internet</title>
        <editor role="editor">
          <persName>
            <foreName>Eric</foreName>
            <surname>Guichard</surname>
            <initial>E.</initial>
          </persName>
        </editor>
        <note anchored="yes" place="unspecified" type="bnote">ouvrage collectif suite au Colloque Mesures de l'internet, Nice, France, 12-14 Mai, 2003</note>
        <imprint>
          <publisher>
            <orgName>Les Canadiens en Europe</orgName>
          </publisher>
          <dateStruct>
            <year>2004</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="refer" n="cite:chap11" type="incollection" id="bid80">
      <analytic>
        <title level="a">Data mining et analyse des données</title>
        <author>
          <persName>
            <foreName>Georges</foreName>
            <surname>Hébrail</surname>
            <initial>G.</initial>
          </persName>
          <persName key="axis-2005-id18098">
            <foreName>Yves</foreName>
            <surname>Lechevallier</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Analyse des données</title>
        <imprint>
          <publisher>
            <orgName>Hermes</orgName>
          </publisher>
          <dateStruct>
            <month>June</month>
            <year>2003</year>
          </dateStruct>
          <biblScope type="pages">340-360</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="refer" n="cite:Jaczynski:1999" type="article" id="bid83">
      <analytic>
        <title level="a">Patrons de conception dans la modélisation d'une plateforme à objets pour le raisonnement à partir de cas. Design patterns for modelling a case-based reasoning tool</title>
        <author>
          <persName>
            <foreName>Michel</foreName>
            <surname>Jaczynski</surname>
            <initial>M.</initial>
          </persName>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">Revue L'objet - logiciel, bases de données, réseaux</title>
        <imprint>
          <biblScope type="volume">5</biblScope>
          <biblScope type="number">2</biblScope>
          <dateStruct>
            <year>1999</year>
          </dateStruct>
          <biblScope type="pages">203-232</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="refer" n="cite:Masseglia:2004:APWEB" type="inproceedings" id="bid85">
      <analytic>
        <title level="a">Web Usage Mining: Sequential Pattern Extraction with a Very Low Support</title>
        <author>
          <persName key="axis-2005-id18166">
            <foreName>Florent</foreName>
            <surname>Masseglia</surname>
            <initial>F.</initial>
          </persName>
          <persName key="axis-2005-id18416">
            <foreName>Doru</foreName>
            <surname>Tanasa</surname>
            <initial>D.</initial>
          </persName>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Advanced Web Technologies and Applications: 6th Asia-Pacific Web Conference, APWeb 2004, Hangzhou, China. Proceedings</title>
        <title level="s">LNCS</title>
        <imprint>
          <biblScope type="volume">3007</biblScope>
          <publisher>
            <orgName>Springer-Verlag</orgName>
          </publisher>
          <dateStruct>
            <month>14-17 April</month>
            <year>2004</year>
          </dateStruct>
          <biblScope type="pages">513–522</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="refer" n="cite:Tanasa:2004:IEEE-I" type="article" id="bid86">
      <analytic>
        <title level="a">Advanced Data Preprocessing for Intersites Web Usage Mining</title>
        <author>
          <persName key="axis-2005-id18416">
            <foreName>Doru</foreName>
            <surname>Tanasa</surname>
            <initial>D.</initial>
          </persName>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">IEEE Intelligent Systems</title>
        <imprint>
          <biblScope type="volume">19</biblScope>
          <biblScope type="number">2</biblScope>
          <dateStruct>
            <month>March-April</month>
            <year>2004</year>
          </dateStruct>
          <biblScope type="pages">59–65</biblScope>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://csdl.computer.org/comp/mags/ex/2004/02/x2toc.htm" location="extern" xyref="3178030122025">http://csdl.computer.org/comp/mags/ex/2004/02/x2toc.htm</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="refer" n="cite:Trousse98b" type="inproceedings" id="bid27">
      <analytic>
        <title level="a">Viewpoint Management for Cooperative Design</title>
        <author>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <editor role="editor">
          <persName>
            <foreName>P.</foreName>
            <surname>Borne</surname>
            <initial>P.</initial>
          </persName>
          <persName>
            <foreName>M.</foreName>
            <surname>Ksouri</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>A. El</foreName>
            <surname>Kamel</surname>
            <initial>A. E.</initial>
          </persName>
        </editor>
        <title level="m">Proceedings of the IEEE Computationnal Engineering in Systems Applications (CESA'98)</title>
        <imprint>
          <publisher>
            <orgName>UCIS - Ecole Centrale de Lille - CD-Rom</orgName>
          </publisher>
          <dateStruct>
            <month>april</month>
            <year>1998</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="4285" rend="year" n="cite:MDM05" type="proceedings" id="bid69">
      <monogr>
        <title level="m">Proceedings of MDM'05, the sixth international workshop on « Multimedia Data Mining »</title>
        <editor role="editor">
          <persName>
            <foreName>Fatma</foreName>
            <surname>Bouali</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Latifur</foreName>
            <surname>Kahn</surname>
            <initial>L.</initial>
          </persName>
          <persName key="axis-2005-id18166">
            <foreName>Florent</foreName>
            <surname>Masseglia</surname>
            <initial>F.</initial>
          </persName>
        </editor>
        <note anchored="yes" place="unspecified" type="bnote">(held in conjunction with KDD'05)</note>
        <imprint>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-sop.inria.fr/axis/mdm-kdd05/" location="extern" xyref="542678711019">http://www-sop.inria.fr/axis/mdm-kdd05/</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="1251" rend="year" n="cite:RNTI_FDC_05" type="book" id="bid68">
      <monogr>
        <title level="m">Numéro spécial « Fouille de données complexes »</title>
        <title level="s">Revue des Nouvelles Technologies de l'Information (RNTI)</title>
        <editor role="editor">
          <persName>
            <foreName>Omar</foreName>
            <surname>Boussaid</surname>
            <initial>O.</initial>
          </persName>
          <persName>
            <foreName>Pierre</foreName>
            <surname>Gançarski</surname>
            <initial>P.</initial>
          </persName>
          <persName key="axis-2005-id18166">
            <foreName>Florent</foreName>
            <surname>Masseglia</surname>
            <initial>F.</initial>
          </persName>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
        </editor>
        <imprint>
          <biblScope type="volume">7</biblScope>
          <publisher>
            <orgName>Cépaduès</orgName>
          </publisher>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="4271" rend="year" n="cite:FDC05" type="proceedings" id="bid63">
      <monogr>
        <title level="m">Actes de FDC'05, le second atelier sur la « Fouille de données complexes dans un processus d'extraction de connaissances »</title>
        <editor role="editor">
          <persName>
            <foreName>Pierre</foreName>
            <surname>Gançarski</surname>
            <initial>P.</initial>
          </persName>
          <persName key="axis-2005-id18166">
            <foreName>Florent</foreName>
            <surname>Masseglia</surname>
            <initial>F.</initial>
          </persName>
        </editor>
        <note anchored="yes" place="unspecified" type="bnote">(Atelier de la conférence EGC'05)</note>
        <imprint>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-sop.inria.fr/axis/fdc-egc05/FDC05_CFP.htm" location="extern" xyref="471387673029">http://www-sop.inria.fr/axis/fdc-egc05/FDC05_CFP.htm</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="4269" rend="year" n="cite:Tanasa_PhD_2005" type="phdthesis" id="bid48">
      <monogr>
        <title level="m">Web Usage Mining: Contributions to Intersites Logs Preprocessing and Sequential Pattern Extraction with Low Support</title>
        <author>
          <persName key="axis-2005-id18416">
            <foreName>Doru</foreName>
            <surname>Tanasa</surname>
            <initial>D.</initial>
          </persName>
        </author>
        <note anchored="yes" place="unspecified" type="typdoc">Ph. D. Thesis</note>
        <imprint>
          <publisher>
            <orgName type="school">University of Nice Sophia Antipolis</orgName>
          </publisher>
          <dateStruct>
            <month>3 June</month>
            <year>2005</year>
          </dateStruct>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-sop.inria.fr/axis/personnel/Doru.Tanasa/these_TANASA.pdf" location="extern" xyref="2056788184026">
          http://www-sop.inria.fr/axis/personnel/Doru.Tanasa/these_TANASA.pdf</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="0584" rend="year" n="cite:baldeetall:2005:JSDA" type="article" id="bid26">
      <analytic>
        <title level="a">How can metadata contribute to add semantic information to clusters?</title>
        <author>
          <persName key="axis-2005-id18343">
            <foreName>Abdourahamane</foreName>
            <surname>Baldé</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>Marie-Aude</foreName>
            <surname>Aufaure</surname>
            <initial>M.-A.</initial>
          </persName>
        </author>
      </analytic>
      <monogr id="rid01362">
        <idno type="issn">1723-5081</idno>
        <title level="j">Journal of Symbolic Data Analysis</title>
        <imprint>
          <biblScope type="volume">3</biblScope>
          <biblScope type="number">1</biblScope>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">32-44</biblScope>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-sop.inria.fr/axis/Publications/uploads/pdf/Article.pdf" location="extern" xyref="1069388306003">
          http://www-sop.inria.fr/axis/Publications/uploads/pdf/Article.pdf</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="0297" rend="year" n="cite:marc" type="article" id="bid78">
      <analytic>
        <title level="a">Comparaison de manuscrits sanskrits, édition critique et classification</title>
        <author>
          <persName key="axis-2005-id18244">
            <foreName>Marc</foreName>
            <surname>Csernel</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>Patrice</foreName>
            <surname>Bertrand</surname>
            <initial>P.</initial>
          </persName>
        </author>
      </analytic>
      <monogr id="rid01793">
        <idno type="issn">1145-895X</idno>
        <title level="j">La Revue Modulad</title>
        <imprint>
          <biblScope type="number">23</biblScope>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">1-20</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="0022" rend="year" n="cite:DeCarvalho2005" type="article" subtype="nonparu" id="bid37">
      <analytic>
        <title level="a">Adaptive Hausdorff distances and dynamic clustering of symbolic interval data</title>
        <author>
          <persName>
            <foreName>Francisco de A. T.</foreName>
            <surname>de Carvalho</surname>
            <initial>F. d. A. T.</initial>
          </persName>
          <persName>
            <foreName>Renata M. C. R.</foreName>
            <surname>de Souza</surname>
            <initial>R. M. C. R.</initial>
          </persName>
          <persName>
            <foreName>Marie</foreName>
            <surname>Chavent</surname>
            <initial>M.</initial>
          </persName>
          <persName key="axis-2005-id18098">
            <foreName>Yves</foreName>
            <surname>Lechevallier</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr id="rid01653">
        <idno type="issn">0167-8655</idno>
        <title level="j">Pattern Recognition Letters</title>
        <note anchored="yes" place="unspecified" type="bnote">article in press</note>
        <imprint>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="1465" rend="year" n="cite:MaTePo05a" type="inbook" id="bid64">
      <analytic>
        <title level="a">Sequential Pattern Mining: A Survey on Issues and Approaches</title>
        <author>
          <persName key="axis-2005-id18166">
            <foreName>Florent</foreName>
            <surname>Masseglia</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Maguelonne</foreName>
            <surname>Teisseire</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>Pascal</foreName>
            <surname>Poncelet</surname>
            <initial>P.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <imprint>
          <publisher>
            <orgName>Information Science Publishing</orgName>
          </publisher>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="0592" rend="year" n="cite:PEHCEVSKI:2005:34589" type="article" id="bid56">
      <analytic>
        <title level="a">Hybrid XML Retrieval: Combining Information Retrieval and a Native XML Database</title>
        <author>
          <persName>
            <foreName>Jovan</foreName>
            <surname>Pehcevski</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>James</foreName>
            <surname>Thom</surname>
            <initial>J.</initial>
          </persName>
          <persName key="axis-2005-id18210">
            <foreName>Anne-Marie</foreName>
            <surname>Vercoustre</surname>
            <initial>A.-M.</initial>
          </persName>
        </author>
      </analytic>
      <monogr id="rid00900">
        <idno type="issn">1386-4564</idno>
        <title level="j">Journal of Information Retrieval, Special Issue on INEX</title>
        <note anchored="yes" place="unspecified" type="bnote">Postprint version. The editor version can be accessed through the DOI.</note>
        <imprint>
          <biblScope type="volume">8</biblScope>
          <biblScope type="number">4</biblScope>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://hal.inria.fr/inria-00000183" location="extern" xyref="4030947808026">http://hal.inria.fr/inria-00000183</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="0457" rend="year" n="cite:RossiConanGuez05CRASConsistance" type="article" id="bid34">
      <analytic>
        <title level="a">Estimation consistante des paramètres d'un modèle non linéaire pour des données fonctionnelles discrétisées aléatoirement</title>
        <author>
          <persName key="axis-2005-id18259">
            <foreName>Fabrice</foreName>
            <surname>Rossi</surname>
            <initial>F.</initial>
          </persName>
          <persName key="axis-2005-id18273">
            <foreName>Brieuc</foreName>
            <surname>Conan-Guez</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr id="rid00408">
        <idno type="issn">1631-073X</idno>
        <title level="j">Comptes rendus de l'Académie des Sciences - Série I</title>
        <imprint>
          <biblScope type="volume">340</biblScope>
          <biblScope type="number">2</biblScope>
          <dateStruct>
            <month>January</month>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">167–170</biblScope>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://hal.inria.fr/inria-00000223" location="extern" xyref="2666670289009">http://hal.inria.fr/inria-00000223</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="0543" rend="year" n="cite:RossiConanGuez05NeuralNetworks" type="article" id="bid35">
      <analytic>
        <title level="a">Functional Multi-Layer Perceptron: a Nonlinear Tool for Functional Data Analysis</title>
        <author>
          <persName key="axis-2005-id18259">
            <foreName>Fabrice</foreName>
            <surname>Rossi</surname>
            <initial>F.</initial>
          </persName>
          <persName key="axis-2005-id18273">
            <foreName>Brieuc</foreName>
            <surname>Conan-Guez</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr id="rid01575">
        <idno type="issn">0893-6080</idno>
        <title level="j">Neural Networks</title>
        <imprint>
          <biblScope type="volume">18</biblScope>
          <biblScope type="number">1</biblScope>
          <dateStruct>
            <month>January</month>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">45–60</biblScope>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://hal.inria.fr/inria-00000599" location="extern" xyref="4035025701025">http://hal.inria.fr/inria-00000599</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="0969" rend="year" n="cite:RossiEtAl05Neurocomputing" type="article" id="bid36">
      <analytic>
        <title level="a">Representation of Functional Data in Neural Networks</title>
        <author>
          <persName key="axis-2005-id18259">
            <foreName>Fabrice</foreName>
            <surname>Rossi</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Nicolas</foreName>
            <surname>Delannay</surname>
            <initial>N.</initial>
          </persName>
          <persName key="axis-2005-id18273">
            <foreName>Brieuc</foreName>
            <surname>Conan-Guez</surname>
            <initial>B.</initial>
          </persName>
          <persName>
            <foreName>Michel</foreName>
            <surname>Verleysen</surname>
            <initial>M.</initial>
          </persName>
        </author>
      </analytic>
      <monogr id="rid01581">
        <idno type="issn">0925-2312</idno>
        <title level="j">Neurocomputing</title>
        <imprint>
          <biblScope type="volume">64</biblScope>
          <dateStruct>
            <month>March</month>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">183–210</biblScope>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://hal.inria.fr/inria-00000666" location="extern" xyref="3874582691030">http://hal.inria.fr/inria-00000666</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="3185" rend="year" n="cite:BehjaEtAl:EGC:2005" type="inproceedings" id="bid28">
      <analytic>
        <title level="a">Prise en compte des Points de Vue pour l'annotation d'un processus d'Extraction de Connaissances à partir de Données</title>
        <author>
          <persName key="axis-2005-id18357">
            <foreName>Hicham</foreName>
            <surname>Behja</surname>
            <initial>H.</initial>
          </persName>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
          <persName>
            <foreName>A.</foreName>
            <surname>Marzak</surname>
            <initial>A.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <editor role="editor">
          <persName>
            <foreName>Suzanne</foreName>
            <surname>Pinson</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Nicole</foreName>
            <surname>Vincent</surname>
            <initial>N.</initial>
          </persName>
        </editor>
        <title level="m">Actes des 5ème journées Extraction et Gestion des Connaissances (EGC 2005), Revue des Nouvelles Technologies de l'Information (RNTI-E-3)</title>
        <imprint>
          <biblScope type="volume">1</biblScope>
          <publisher>
            <orgName>Cépaduès-Editions, ISBN 2.85428.677.4</orgName>
          </publisher>
          <dateStruct>
            <month>January</month>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">245-256</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="2045" rend="year" n="cite:ChelceaEtAll:PKDD:2005" type="inproceedings" id="bid46">
      <analytic>
        <title level="a">Benefits of InterSite Pre-Processing and Clustering Methods in E-Commerce Domain</title>
        <author>
          <persName key="axis-2005-id18372">
            <foreName>Sergiu</foreName>
            <surname>Chelcea</surname>
            <initial>S.</initial>
          </persName>
          <persName key="axis-2005-id18387">
            <foreName>Alzennyr</foreName>
            <surname>Da Silva</surname>
            <initial>A.</initial>
          </persName>
          <persName key="axis-2005-id18098">
            <foreName>Yves</foreName>
            <surname>Lechevallier</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="axis-2005-id18416">
            <foreName>Doru</foreName>
            <surname>Tanasa</surname>
            <initial>D.</initial>
          </persName>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <editor role="editor">
          <persName>
            <foreName>Petr</foreName>
            <surname>Berka</surname>
            <initial>P.</initial>
          </persName>
          <persName>
            <foreName>Bruno</foreName>
            <surname>Crémilleux</surname>
            <initial>B.</initial>
          </persName>
        </editor>
        <title level="m">Proceedings of the ECML/PKDD2005 Discovery Challenge, A Collaborative Effort in Knowledge Discovery from Databases, Porto, Portugal</title>
        <imprint>
          <dateStruct>
            <month>3-7 October</month>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">15-21</biblScope>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://hal.inria.fr/inria-00000880" location="extern" xyref="2717101913015">http://hal.inria.fr/inria-00000880</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="3176" rend="year" n="cite:ChelceaEtAll:MDM:2005" type="inproceedings" id="bid47">
      <analytic>
        <title level="a">Pre-Processing and Clustering Complex Data in E-Commerce Domain</title>
        <author>
          <persName key="axis-2005-id18372">
            <foreName>Sergiu</foreName>
            <surname>Chelcea</surname>
            <initial>S.</initial>
          </persName>
          <persName key="axis-2005-id18387">
            <foreName>Alzennyr</foreName>
            <surname>Da Silva</surname>
            <initial>A.</initial>
          </persName>
          <persName key="axis-2005-id18098">
            <foreName>Yves</foreName>
            <surname>Lechevallier</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="axis-2005-id18416">
            <foreName>Doru</foreName>
            <surname>Tanasa</surname>
            <initial>D.</initial>
          </persName>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of the First International Workshop on Mining Complex Data 2005 (IEEE MCD'2005), held in conjunction with the Fifth IEEE International Conference on Data Mining (ICDM'05), Houston, Texas</title>
        <imprint>
          <dateStruct>
            <month>27 November</month>
            <year>2005</year>
          </dateStruct>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://hal.inria.fr/inria-00000881" location="extern" xyref="136333823025">http://hal.inria.fr/inria-00000881</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="2100" rend="year" n="cite:ChelceaTrousse:EGC:2005" type="inproceedings" id="bid38">
      <analytic>
        <title level="a">Classification 2-3 hiérarchique de données du Web</title>
        <author>
          <persName key="axis-2005-id18372">
            <foreName>Sergiu</foreName>
            <surname>Chelcea</surname>
            <initial>S.</initial>
          </persName>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <editor role="editor">
          <persName>
            <foreName>Suzanne</foreName>
            <surname>Pinson</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Nicole</foreName>
            <surname>Vincent</surname>
            <initial>N.</initial>
          </persName>
        </editor>
        <title level="m">Actes des 5ème journées Extraction et Gestion des Connaissances (EGC 2005), Revue des Nouvelles Technologies de l'Information (RNTI-E-3)</title>
        <imprint>
          <biblScope type="volume">1</biblScope>
          <publisher>
            <orgName>Cépaudès-Editions, ISBN 2.85428.677.4</orgName>
          </publisher>
          <dateStruct>
            <month>January</month>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">219</biblScope>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://hal.inria.fr/inria-00000864" location="extern" xyref="2278685581024">http://hal.inria.fr/inria-00000864</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="1676" rend="year" n="cite:ConanGuezEtAlWSOM2005" type="inproceedings" id="bid30">
      <analytic>
        <title level="a">A Fast Algorithm for the Self-Organizing Map on Dissimilarity Data</title>
        <author>
          <persName key="axis-2005-id18273">
            <foreName>Brieuc</foreName>
            <surname>Conan-Guez</surname>
            <initial>B.</initial>
          </persName>
          <persName key="axis-2005-id18259">
            <foreName>Fabrice</foreName>
            <surname>Rossi</surname>
            <initial>F.</initial>
          </persName>
          <persName key="axis-2005-id18308">
            <foreName>Aïcha</foreName>
            <surname>El Golli</surname>
            <initial>A.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of the 5th Workshop on Self-Organizing Maps (WSOM 05), Paris (France)</title>
        <imprint>
          <dateStruct>
            <month>September</month>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">561–568</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="2140" rend="year" n="cite:ll" type="inproceedings" id="bid79">
      <analytic>
        <title level="a">Comparaison de textes sanskrits en vue d'une édition critique</title>
        <author>
          <persName key="axis-2005-id18244">
            <foreName>Marc</foreName>
            <surname>Csernel</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>Patrice</foreName>
            <surname>Bertrand</surname>
            <initial>P.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <editor role="editor">
          <persName>
            <foreName>V.</foreName>
            <surname>Makarenkov</surname>
            <initial>V.</initial>
          </persName>
          <persName>
            <foreName>G.</foreName>
            <surname>Cucumel</surname>
            <initial>G.</initial>
          </persName>
          <persName>
            <foreName>J-F</foreName>
            <surname>Lapointe</surname>
            <initial>J.-F.</initial>
          </persName>
        </editor>
        <title level="m">Compte rendu des 12-emes Rencontres de la Socitété Francophone de classification, Montreal</title>
        <imprint>
          <publisher>
            <orgName>SFC</orgName>
          </publisher>
          <dateStruct>
            <month>29 May - 1 June</month>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">108-111</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="3656" rend="year" n="cite:DMBiz2005" type="inproceedings" id="bid77">
      <analytic>
        <title level="a">Uma Abordagem para Descoberta do Perfil da Clientela em Web Sites Institucionais</title>
        <author>
          <persName key="axis-2005-id18387">
            <foreName>Alzennyr</foreName>
            <surname>Da Silva</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>Francisco de A. T.</foreName>
            <surname>de Carvalho</surname>
            <initial>F. d. A. T.</initial>
          </persName>
          <persName key="axis-2005-id18098">
            <foreName>Yves</foreName>
            <surname>Lechevallier</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of the first ECML/PKDD Workshop on Data Mining for Business (DMBiz'05), held in conjunction with the 16th European Conference on Machine Learning (ECML'05) and the 9th European Conference on Principles and Practice of Knowledge Discovery in
        Databases (PKDD'05), Porto, Portugal</title>
        <note anchored="yes" place="unspecified" type="bnote">Poster</note>
        <imprint>
          <dateStruct>
            <month>3 October</month>
            <year>2005</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="2441" rend="year" n="cite:dltv05b" type="inproceedings" id="bid25">
      <analytic>
        <title level="a">Experiments in Clustering Homogeneous XML Documents to Validate an Existing Typology</title>
        <author>
          <persName key="axis-2005-id18152">
            <foreName>Thierry</foreName>
            <surname>Despeyroux</surname>
            <initial>T.</initial>
          </persName>
          <persName key="axis-2005-id18098">
            <foreName>Yves</foreName>
            <surname>Lechevallier</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
          <persName key="axis-2005-id18210">
            <foreName>Anne-Marie</foreName>
            <surname>Vercoustre</surname>
            <initial>A.-M.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of the 5th International Conference on Knowledge Management (I-Know), Vienne, Autriche</title>
        <note anchored="yes" place="unspecified" type="bnote">(postprint)</note>
        <imprint>
          <biblScope type="number">1</biblScope>
          <publisher>
            <orgName>Journal of Universal Computer Science</orgName>
          </publisher>
          <dateStruct>
            <month>July</month>
            <year>2005</year>
          </dateStruct>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://hal.inria.fr/inria-00000002" location="extern" xyref="145703398019">http://hal.inria.fr/inria-00000002</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="2439" rend="year" n="cite:dltv05a" type="inproceedings" id="bid24">
      <analytic>
        <title level="a">Expériences de classification de documents XML homogènes</title>
        <author>
          <persName key="axis-2005-id18152">
            <foreName>Thierry</foreName>
            <surname>Despeyroux</surname>
            <initial>T.</initial>
          </persName>
          <persName key="axis-2005-id18098">
            <foreName>Yves</foreName>
            <surname>Lechevallier</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
          <persName key="axis-2005-id18210">
            <foreName>Anne-Marie</foreName>
            <surname>Vercoustre</surname>
            <initial>A.-M.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <editor role="editor">
          <persName>
            <foreName>Nicole</foreName>
            <surname>Vincent</surname>
            <initial>N.</initial>
          </persName>
          <persName>
            <foreName>Suzanne</foreName>
            <surname>Pinson</surname>
            <initial>S.</initial>
          </persName>
        </editor>
        <title level="m">Actes des 5ème journées Extraction et Gestion des Connaissances (EGC 2005), Revue des Nouvelles Technologies de l'Information (RNTI-E-3), Paris, France</title>
        <imprint>
          <biblScope type="volume">1</biblScope>
          <publisher>
            <orgName>Cépaduès-Editions</orgName>
          </publisher>
          <dateStruct>
            <month>January</month>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">183-188</biblScope>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://hal.inria.fr/docs/00/03/49/10/PDF/raclass.pdf" location="extern" xyref="2839385440019">http://hal.inria.fr/docs/00/03/49/10/PDF/raclass.pdf</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="2235" rend="year" n="cite:ElGolliASMDA2005" type="inproceedings" id="bid73">
      <analytic>
        <title level="a">Criterion-based divisive clustering: application to symbolic objects generation</title>
        <author>
          <persName key="axis-2005-id18308">
            <foreName>Aïcha</foreName>
            <surname>El Golli</surname>
            <initial>A.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of XIth International Symposium on Applied Stochastic Models and Data Analysis (ASMDA 2005), Brest, France</title>
        <imprint>
          <dateStruct>
            <month>17-20 May</month>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">709–713</biblScope>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-sop.inria.fr/axis/Publications/uploads/pdf/ASMDAsectionSymbolic.pdf" location="extern" xyref="3390629942031">
          http://www-sop.inria.fr/axis/Publications/uploads/pdf/ASMDAsectionSymbolic.pdf</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="2111" rend="year" n="cite:LechevallierVerseISI2005" type="inproceedings" id="bid76">
      <analytic>
        <title level="a">Clustering Methods in Symbolic Data Analysis</title>
        <author>
          <persName key="axis-2005-id18098">
            <foreName>Yves</foreName>
            <surname>Lechevallier</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="axis-2005-id18481">
            <foreName>Rosanna</foreName>
            <surname>Verde</surname>
            <initial>R.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of the 55th session of the International of Statictics Society (ISI 2005), Sydney</title>
        <imprint>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="2851" rend="year" n="cite:AMFM_MCD05" type="inproceedings" id="bid44">
      <analytic>
        <title level="a">Mining Data Streams for Frequent Sequences Extraction</title>
        <author>
          <persName key="axis-2005-id18635">
            <foreName>Alice</foreName>
            <surname>Marascu</surname>
            <initial>A.</initial>
          </persName>
          <persName key="axis-2005-id18166">
            <foreName>Florent</foreName>
            <surname>Masseglia</surname>
            <initial>F.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of the First International Workshop on Mining Complex Data 2005 (IEEE MCD'2005),held in conjunction with the Fifth IEEE International Conference on Data Mining (ICDM'05), Houston, USA</title>
        <imprint>
          <dateStruct>
            <month>27 November</month>
            <year>2005</year>
          </dateStruct>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-sop.inria.fr/axis/Publications/uploads/pdf/MCD_05.pdf" location="extern" xyref="3266234572016">
          http://www-sop.inria.fr/axis/Publications/uploads/pdf/MCD_05.pdf</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="2853" rend="year" n="cite:AMFM_MSTD05" type="inproceedings" id="bid43">
      <analytic>
        <title level="a">Mining Sequential Patterns from Temporal Streaming Data</title>
        <author>
          <persName key="axis-2005-id18635">
            <foreName>Alice</foreName>
            <surname>Marascu</surname>
            <initial>A.</initial>
          </persName>
          <persName key="axis-2005-id18166">
            <foreName>Florent</foreName>
            <surname>Masseglia</surname>
            <initial>F.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of the first ECML/PKDD Workshop on Mining Spatio-Temporal Data (MSTD'05), held in conjunction with the 9th European Conference on Principles and Practice of Knowledge Discovery in Databases (PKDD'05), Porto, Portugal</title>
        <imprint>
          <dateStruct>
            <month>3 October</month>
            <year>2005</year>
          </dateStruct>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-sop.inria.fr/axis/Publications/uploads/pdf/MSTD_05.pdf" location="extern" xyref="2938228796015">
          http://www-sop.inria.fr/axis/Publications/uploads/pdf/MSTD_05.pdf</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="3779" rend="year" n="cite:MaPoTeMa05" type="inproceedings" id="bid51">
      <analytic>
        <title level="a">Web Usage Mining: Extracting Unexpected Periods from Web Logs</title>
        <author>
          <persName key="axis-2005-id18166">
            <foreName>Florent</foreName>
            <surname>Masseglia</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Pascal</foreName>
            <surname>Poncelet</surname>
            <initial>P.</initial>
          </persName>
          <persName>
            <foreName>Maguelonne</foreName>
            <surname>Teisseire</surname>
            <initial>M.</initial>
          </persName>
          <persName key="axis-2005-id18635">
            <foreName>Alice</foreName>
            <surname>Marascu</surname>
            <initial>A.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of the 2nd Workshop on Temporal Data Mining (TDM 2005), held in conjunction with the Fifth IEEE International Conference on Data Mining (ICDM'05), Houston, USA</title>
        <imprint>
          <dateStruct>
            <month>27 November</month>
            <year>2005</year>
          </dateStruct>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-sop.inria.fr/axis/Publications/uploads/pdf/tdm_icdm_period2.pdf" location="extern" xyref="3768123919028">
          http://www-sop.inria.fr/axis/Publications/uploads/pdf/tdm_icdm_period2.pdf</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="2632" rend="year" n="cite:PEHCEVSKI:2005:30394" type="inproceedings" id="bid55">
      <analytic>
        <title level="a">Hybrid XML Retrieval Revisited</title>
        <author>
          <persName>
            <foreName>Jovan</foreName>
            <surname>Pehcevski</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>James</foreName>
            <surname>Thom</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Saied</foreName>
            <surname>Tahaghoghi</surname>
            <initial>S.</initial>
          </persName>
          <persName key="axis-2005-id18210">
            <foreName>Anne-Marie</foreName>
            <surname>Vercoustre</surname>
            <initial>A.-M.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <editor role="editor">
          <persName>
            <foreName>Norbert</foreName>
            <surname>Fuhr</surname>
            <initial>N.</initial>
          </persName>
          <persName>
            <foreName>Mounia</foreName>
            <surname>Lalmas</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>Saadia</foreName>
            <surname>Malik</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Zoltán</foreName>
            <surname>Szlávik</surname>
            <initial>Z.</initial>
          </persName>
        </editor>
        <title level="m">Advances in XML Information Retrieval, Proceedings of the Third International Workshop of the Initiative for the Evaluation of XML Retrieval (INEX 2004), Schloss Dagstuhl, Germany</title>
        <title level="s">LNCS</title>
        <note anchored="yes" place="unspecified" type="bnote">Postprint</note>
        <imprint>
          <biblScope type="volume">3493</biblScope>
          <publisher>
            <orgName>Springer</orgName>
          </publisher>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://hal.inria.fr/inria-00000003" location="extern" xyref="2709301056005">http://hal.inria.fr/inria-00000003</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="3700" rend="year" n="cite:PEHCEVSKI:2005:34588" type="inproceedings" id="bid57">
      <analytic>
        <title level="a">Users and Assessors in the Context of INEX: Are Relevance Dimensions Relevant?</title>
        <author>
          <persName>
            <foreName>Jovan</foreName>
            <surname>Pehcevski</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>James</foreName>
            <surname>Thom</surname>
            <initial>J.</initial>
          </persName>
          <persName key="axis-2005-id18210">
            <foreName>Anne-Marie</foreName>
            <surname>Vercoustre</surname>
            <initial>A.-M.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <editor role="editor">
          <persName>
            <foreName>Andrew</foreName>
            <surname>Trotman</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>Mounia</foreName>
            <surname>Lalmas</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>Norbert</foreName>
            <surname>Fuhr</surname>
            <initial>N.</initial>
          </persName>
        </editor>
        <title level="m">Proceedings of the INEX 2005 Workshop on Element Retrieval Methodology, Glasgow, Scotland</title>
        <imprint>
          <dateStruct>
            <month>30 July</month>
            <year>2005</year>
          </dateStruct>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://hal.inria.fr/inria-00000182" location="extern" xyref="1502644038012">http://hal.inria.fr/inria-00000182</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="3098" rend="year" n="cite:RassonLechevallierISI2005" type="inproceedings" id="bid71">
      <analytic>
        <title level="a">Parsimoious representation of symbolic objects : the case of multidimensional intervals</title>
        <author>
          <persName>
            <foreName>Jean-Paul</foreName>
            <surname>Rasson</surname>
            <initial>J.-P.</initial>
          </persName>
          <persName key="axis-2005-id18098">
            <foreName>Yves</foreName>
            <surname>Lechevallier</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of the 55th session of the International of Statictics Society (ISI)</title>
        <imprint>
          <publisher>
            <orgName>ISI</orgName>
          </publisher>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="3695" rend="year" n="cite:RossiEtAlESANN2005WUMSOM" type="inproceedings" id="bid31">
      <analytic>
        <title level="a">Usage Guided Clustering of Web Pages with the Median Self Organizing Map</title>
        <author>
          <persName key="axis-2005-id18259">
            <foreName>Fabrice</foreName>
            <surname>Rossi</surname>
            <initial>F.</initial>
          </persName>
          <persName key="axis-2005-id18308">
            <foreName>Aïcha</foreName>
            <surname>El Golli</surname>
            <initial>A.</initial>
          </persName>
          <persName key="axis-2005-id18098">
            <foreName>Yves</foreName>
            <surname>Lechevallier</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of the 13th European Symposium On Artificial Neural Networks (ESANN 2005), Bruges, Belgium</title>
        <imprint>
          <dateStruct>
            <month>April</month>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">351–356</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="3762" rend="year" n="cite:RossiEtAlEGC2005" type="inproceedings" id="bid45">
      <analytic>
        <title level="a">Visualisation de la perception d'un site web par ses utilisateurs</title>
        <author>
          <persName key="axis-2005-id18259">
            <foreName>Fabrice</foreName>
            <surname>Rossi</surname>
            <initial>F.</initial>
          </persName>
          <persName key="axis-2005-id18098">
            <foreName>Yves</foreName>
            <surname>Lechevallier</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="axis-2005-id18308">
            <foreName>Aïcha</foreName>
            <surname>El Golli</surname>
            <initial>A.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <editor role="editor">
          <persName>
            <foreName>Suzanne</foreName>
            <surname>Pinson</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Nicole</foreName>
            <surname>Vincent</surname>
            <initial>N.</initial>
          </persName>
        </editor>
        <title level="m">Actes des 5ème journées Extraction et Gestion des Connaissances (EGC 2005), Revue des Nouvelles Technologies de l'Information (RNTI-E-3), Paris, France</title>
        <imprint>
          <biblScope type="volume">II</biblScope>
          <publisher>
            <orgName>Cépaduès-Editions</orgName>
          </publisher>
          <dateStruct>
            <month>January</month>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">563–574</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="2103" rend="year" n="cite:RossiVillaASMDA2005SVM" type="inproceedings" id="bid32">
      <analytic>
        <title level="a">Classification in Hilbert Spaces with Support Vector Machines</title>
        <author>
          <persName key="axis-2005-id18259">
            <foreName>Fabrice</foreName>
            <surname>Rossi</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Nathalie</foreName>
            <surname>Villa</surname>
            <initial>N.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of XIth International Symposium on Applied Stochastic Models and Data Analysis (ASMDA 2005), Brest, France</title>
        <imprint>
          <dateStruct>
            <month>May</month>
            <year>2005</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="2101" rend="year" n="cite:VerdeLechevallierSFC2005" type="inproceedings" id="bid74">
      <analytic>
        <title level="a">Classification croisée d'un tableau de données de type intervalle</title>
        <author>
          <persName key="axis-2005-id18481">
            <foreName>Rosanna</foreName>
            <surname>Verde</surname>
            <initial>R.</initial>
          </persName>
          <persName key="axis-2005-id18098">
            <foreName>Yves</foreName>
            <surname>Lechevallier</surname>
            <initial>Y.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Actes des 12èmes Rencontres de la Société Francophone de Classification (SFC 2005), Montréal</title>
        <imprint>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="3481" rend="year" n="cite:VillaRossiESANN2005SVM" type="inproceedings" id="bid33">
      <analytic>
        <title level="a">Support Vector Machine For Functional Data Classification</title>
        <author>
          <persName>
            <foreName>Nathalie</foreName>
            <surname>Villa</surname>
            <initial>N.</initial>
          </persName>
          <persName key="axis-2005-id18259">
            <foreName>Fabrice</foreName>
            <surname>Rossi</surname>
            <initial>F.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of the 13th European Symposium On Artificial Neural Networks (ESANN 2005), Bruges, Belgium</title>
        <imprint>
          <dateStruct>
            <month>April</month>
            <year>2005</year>
          </dateStruct>
          <biblScope type="pages">467–472</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="3859" rend="year" n="cite:Busseuil" type="misc" id="bid42">
      <monogr>
        <title level="m">Classification des itinéraires pour l'aide à la navigation assistée par GPS</title>
        <author>
          <persName key="axis-2005-id18516">
            <foreName>Rémi</foreName>
            <surname>Busseuil</surname>
            <initial>R.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-sop.inria.fr/axis/Publications/uploads/pdf/rapportREMY.pdf" location="extern" xyref="47587217023">
          http://www-sop.inria.fr/axis/Publications/uploads/pdf/rapportREMY.pdf</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="3858" rend="year" n="cite:fegmoun05" type="misc" id="bid52">
      <monogr>
        <title level="m">Classification de documents XML, Application au corpus d'INEX et aux rapports d'activité INRIA</title>
        <author>
          <persName key="axis-2005-id18650">
            <foreName>Mounir</foreName>
            <surname>Fegas</surname>
            <initial>M.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-sop.inria.fr/axis/Publications/uploads/pdf/Rapport-Mounir.pdf" location="extern" xyref="1416698293012">
          http://www-sop.inria.fr/axis/Publications/uploads/pdf/Rapport-Mounir.pdf</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="3994" rend="year" n="cite:garboni:2005" type="misc" id="bid54">
      <monogr>
        <title level="m">Sequential Pattern Mining for Structure-based XML Document Classification</title>
        <author>
          <persName key="axis-2005-id18576">
            <foreName>Calin</foreName>
            <surname>Garboni</surname>
            <initial>C.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="3932" rend="year" n="cite:Lechevallier:RDC:2005" type="misc" id="bid72">
      <monogr>
        <title level="m">Le tableau de données, une structure unique, des réalités multiples</title>
        <author>
          <persName key="axis-2005-id18098">
            <foreName>Yves</foreName>
            <surname>Lechevallier</surname>
            <initial>Y.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <month>21 March</month>
            <year>2005</year>
          </dateStruct>
        </imprint>
      </monogr>
      <note anchored="yes" place="unspecified" type="howpublished">RDC'2005 ENST Paris</note>
    </biblStruct>
    <biblStruct titlekey="4040" rend="year" n="cite:YL:2005:Weka" type="misc" id="bid75">
      <monogr>
        <title level="m">WEKA, un logiciel libre d'apprentissage et de Data Mining</title>
        <author>
          <persName key="axis-2005-id18098">
            <foreName>Yves</foreName>
            <surname>Lechevallier</surname>
            <initial>Y.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <month>13 October</month>
            <year>2005</year>
          </dateStruct>
        </imprint>
      </monogr>
      <note anchored="yes" place="unspecified" type="howpublished">Après-midi d'INFOSTAT, Paris</note>
    </biblStruct>
    <biblStruct titlekey="3894" rend="year" n="cite:Marascu:2005:stage" type="misc" id="bid70">
      <monogr>
        <title level="m">Extraction de motifs séquentiels dans les data streams</title>
        <author>
          <persName key="axis-2005-id18635">
            <foreName>Alice</foreName>
            <surname>Marascu</surname>
            <initial>A.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-sop.inria.fr/axis/Publications/show.php?author=Alice_Marascu" location="extern" xyref="3478520275019">
          http://www-sop.inria.fr/axis/Publications/show.php?author=Alice_Marascu</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="4039" rend="year" n="cite:Sellah:2005" type="misc" id="bid62">
      <monogr>
        <title level="m">Web Usage Mining : Extraction de motifs séquentiels selon plusieurs points de vue</title>
        <author>
          <persName key="axis-2005-id18664">
            <foreName>Sofiane</foreName>
            <surname>Sellah</surname>
            <initial>S.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="4005" rend="year" n="cite:MOBIVIP-D5.2" type="misc" id="bid59">
      <monogr>
        <title level="m">Spécifications des critères d'évaluation et des données d'usage à tracer</title>
        <author>
          <persName key="axis-2005-id18195">
            <foreName>Bernard</foreName>
            <surname>Senach</surname>
            <initial>B.</initial>
          </persName>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
        </author>
        <note anchored="yes" place="unspecified" type="bnote">INRIA Sophia Antipolis, Delivrable D5.2. du Contrat PREDIT MOBIVIP</note>
        <imprint>
          <dateStruct>
            <month>December</month>
            <year>2005</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="3885" rend="year" n="cite:tandab05" type="misc" id="bid22">
      <monogr>
        <title level="m">Elaborating a Distance for Clustering Homogeneous Sanskrit Documents</title>
        <author>
          <persName key="axis-2005-id18678">
            <foreName>Sattisvar</foreName>
            <surname>Tandabany</surname>
            <initial>S.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www-sop.inria.fr/axis/Publications/uploads/pdf/ReportSatti.pdf" location="extern" xyref="4054029346005">
          http://www-sop.inria.fr/axis/Publications/uploads/pdf/ReportSatti.pdf</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct titlekey="" rend="year" n="cite:vfgl05a" type="misc" id="bid53">
      <monogr>
        <title level="m">A Flexible Structured-based Representation for XML Document Mining</title>
        <title level="m">Pre-Proceedings of the Fourth International Workshop of the Initiative for the Evaluation of XML Retrieval (INEX 2005), Schloss Dagstuhl, Germany</title>
        <author>
          <persName key="axis-2005-id18210">
            <foreName>Anne-Marie</foreName>
            <surname>Vercoustre</surname>
            <initial>A.-M.</initial>
          </persName>
          <persName key="axis-2005-id18650">
            <foreName>Mounir</foreName>
            <surname>Fegas</surname>
            <initial>M.</initial>
          </persName>
          <persName key="axis-2005-id18591">
            <foreName>Saba</foreName>
            <surname>Gul</surname>
            <initial>S.</initial>
          </persName>
          <persName key="axis-2005-id18098">
            <foreName>Yves</foreName>
            <surname>Lechevallier</surname>
            <initial>Y.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <month>November</month>
            <year>2005</year>
          </dateStruct>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://hal.inria.fr/inria-00000839" location="extern" xyref="2826340801000">http://hal.inria.fr/inria-00000839</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:BockDiday2000" type="book" id="bid13">
      <monogr>
        <title level="m">Analysis of Symbolic Data. Exploratory methods for extracting statistical information from complex data</title>
        <editor role="editor">
          <persName>
            <foreName>Hans-Hermann</foreName>
            <surname>Bock</surname>
            <initial>H.-H.</initial>
          </persName>
          <persName>
            <foreName>Edwin</foreName>
            <surname>Diday</surname>
            <initial>E.</initial>
          </persName>
        </editor>
        <imprint>
          <publisher>
            <orgName>Springer Verlag</orgName>
          </publisher>
          <dateStruct>
            <year>2000</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:CBT02" type="inproceedings" id="bid41">
      <analytic>
        <title level="a">Theoretical study of a new 2-3 Hierarchical Clustering Algorithm</title>
        <author>
          <persName key="axis-2005-id18372">
            <foreName>Sergiu</foreName>
            <surname>Chelcea</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Patrice</foreName>
            <surname>Bertrand</surname>
            <initial>P.</initial>
          </persName>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of the 4th International Workshop on Symbolic and Numeric Algorithms for Scientific Computing, SYNASC 2002, Timisoara, Romania</title>
        <imprint>
          <dateStruct>
            <month>8-12 October</month>
            <year>2002</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:ChelceaEtAl:GFKL:2003" type="inproceedings" id="bid40">
      <analytic>
        <title level="a">A New Agglomerative 2-3 Hierarchical Clustering Algorithm</title>
        <author>
          <persName key="axis-2005-id18372">
            <foreName>Sergiu</foreName>
            <surname>Chelcea</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Patrice</foreName>
            <surname>Bertrand</surname>
            <initial>P.</initial>
          </persName>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <editor role="editor">
          <persName>
            <foreName>Daniel</foreName>
            <surname>Baier</surname>
            <initial>D.</initial>
          </persName>
          <persName>
            <foreName>Klaus-Dieter</foreName>
            <surname>Wernecke</surname>
            <initial>K.-D.</initial>
          </persName>
        </editor>
        <title level="m">Innovations in Classification, Data Science, and Information Systems. Proc. 27th Annual GfKl Conference, University of Cottbus, March 12 - 14, 2003, Heidelberg-Berlin, Germany</title>
        <title level="s">Studies in Classification, Data Analysis, and Knowledge Organization</title>
        <imprint>
          <publisher>
            <orgName>Springer-Verlag, ISBN 3-540-23221-4</orgName>
          </publisher>
          <dateStruct>
            <year>2004</year>
          </dateStruct>
          <biblScope type="pages">3-10</biblScope>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.springeronline.com/sgw/cda/frontpage/0,11855,5-10129-22-36021200-0,00.html" location="extern" xyref="3985737531008">
          http://www.springeronline.com/sgw/cda/frontpage/0,11855,5-10129-22-36021200-0,00.html</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:CHELCEA:2004:RFIA" type="inproceedings" id="bid39">
      <analytic>
        <title level="a">Un Nouvel Algorithme de Classification Ascendante 2-3 Hiérarchique</title>
        <author>
          <persName key="axis-2005-id18372">
            <foreName>Sergiu</foreName>
            <surname>Chelcea</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Patrice</foreName>
            <surname>Bertrand</surname>
            <initial>P.</initial>
          </persName>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Actes de 14ème Congrès Francophone AFRIF-AFIA de Reconnaissance des Formes et Intelligence Artificielle (RFIA 2004), Centre de Congrès Pierre BAUDIS, Toulouse, France</title>
        <imprint>
          <biblScope type="volume">3</biblScope>
          <dateStruct>
            <month>28-30 January</month>
            <year>2004</year>
          </dateStruct>
          <biblScope type="pages">1471-1480</biblScope>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://www.laas.fr/rfia2004/actes/ARTICLES/388.pdf" location="extern" xyref="69049185012">http://www.laas.fr/rfia2004/actes/ARTICLES/388.pdf</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:ChelceaGallaisTrousse:MOBUBI:2004" type="inproceedings" id="bid60">
      <analytic>
        <title level="a">Recommandations personnalisées pour la recherche d'information facilitant les déplacements</title>
        <author>
          <persName key="axis-2005-id18372">
            <foreName>Sergiu</foreName>
            <surname>Chelcea</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Georges</foreName>
            <surname>Gallais</surname>
            <initial>G.</initial>
          </persName>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Premières Journées Francophones : Mobilité et Ubiquité 2004, ESSI, Nice, Sophia-Antipolis, France</title>
        <imprint>
          <publisher>
            <orgName>Cepadues - ISBN : 2-85428-653-7 / ACM Digital Library - ISBN : 1-58113-915-2</orgName>
          </publisher>
          <dateStruct>
            <month>1-3 June</month>
            <year>2004</year>
          </dateStruct>
          <biblScope type="pages">143 - 150</biblScope>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://portal.acm.org/citation.cfm?id=1050873.1050905" location="extern" xyref="1910212774002">http://portal.acm.org/citation.cfm?id=1050873.1050905</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:MC97" type="misc" id="bid14">
      <monogr>
        <title level="m">Software Requirements Specification for the S.O.M. (Symbolic Object Manipulation)</title>
        <author>
          <persName key="axis-2005-id18244">
            <foreName>Marc</foreName>
            <surname>Csernel</surname>
            <initial>M.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <month>November</month>
            <year>1997</year>
          </dateStruct>
        </imprint>
      </monogr>
      <note anchored="yes" place="unspecified" type="howpublished">Deliverable of the WP1 of the Sodas Project</note>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:dachwise04" type="misc" id="bid2">
      <monogr>
        <title level="m">Clustering XML Documents using Structural Summarie</title>
        <author>
          <persName>
            <foreName>Theodore</foreName>
            <surname>Dalamagas</surname>
            <initial>T.</initial>
          </persName>
          <persName>
            <foreName>Tao</foreName>
            <surname>Cheng</surname>
            <initial>T.</initial>
          </persName>
          <persName>
            <foreName>Klaas-Jan</foreName>
            <surname>Winkel</surname>
            <initial>K.-J.</initial>
          </persName>
          <persName>
            <foreName>Timos</foreName>
            <surname>Sellis</surname>
            <initial>T.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <year>2004</year>
          </dateStruct>
        </imprint>
      </monogr>
      <note anchored="yes" place="unspecified" type="howpublished">In Proc. of ClustWeb - International Workshop on Clustering Information over the Web in conjunction with EDBT 04, Crete, Greece</note>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:ElGolliConanGuezRossiIFCS2004SomDiss" type="inproceedings" id="bid29">
      <analytic>
        <title level="a">A Self Organizing Map for dissimilarity data</title>
        <author>
          <persName key="axis-2005-id18308">
            <foreName>Aïcha</foreName>
            <surname>El Golli</surname>
            <initial>A.</initial>
          </persName>
          <persName key="axis-2005-id18273">
            <foreName>Brieuc</foreName>
            <surname>Conan-Guez</surname>
            <initial>B.</initial>
          </persName>
          <persName key="axis-2005-id18259">
            <foreName>Fabrice</foreName>
            <surname>Rossi</surname>
            <initial>F.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <editor role="editor">
          <persName>
            <foreName>D.</foreName>
            <surname>Banks</surname>
            <initial>D.</initial>
          </persName>
          <persName>
            <foreName>L.</foreName>
            <surname>House</surname>
            <initial>L.</initial>
          </persName>
          <persName>
            <foreName>F. R.</foreName>
            <surname>McMorris</surname>
            <initial>F. R.</initial>
          </persName>
          <persName>
            <foreName>P.</foreName>
            <surname>Arabie</surname>
            <initial>P.</initial>
          </persName>
          <persName>
            <foreName>W.</foreName>
            <surname>Gaul</surname>
            <initial>W.</initial>
          </persName>
        </editor>
        <title level="m">Classification, Clustering, and Data Mining Applications (Proceedings of IFCS 2004), Chicago, Illinois (USA)</title>
        <imprint>
          <publisher>
            <orgName>Springer</orgName>
          </publisher>
          <publisher>
            <orgName type="organisation">IFCS
            <address/></orgName>
          </publisher>
          <dateStruct>
            <month>July</month>
            <year>2004</year>
          </dateStruct>
          <biblScope type="pages">61–68</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:ElGolliConanGuezRossi04JSDA" type="article" id="bid15">
      <analytic>
        <title level="a">Self Organizing Map and Symbolic Data</title>
        <author>
          <persName key="axis-2005-id18308">
            <foreName>Aïcha</foreName>
            <surname>El Golli</surname>
            <initial>A.</initial>
          </persName>
          <persName key="axis-2005-id18273">
            <foreName>Brieuc</foreName>
            <surname>Conan-Guez</surname>
            <initial>B.</initial>
          </persName>
          <persName key="axis-2005-id18259">
            <foreName>Fabrice</foreName>
            <surname>Rossi</surname>
            <initial>F.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">Journal of Symbolic Data Analysis</title>
        <imprint>
          <biblScope type="volume">2</biblScope>
          <biblScope type="number">1</biblScope>
          <dateStruct>
            <month>November</month>
            <year>2004</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:FS97" type="article" id="bid19">
      <analytic>
        <title level="a">Object-Oriented Application Frameworks</title>
        <author>
          <persName>
            <foreName>Mohamed E.</foreName>
            <surname>Fayad</surname>
            <initial>M. E.</initial>
          </persName>
          <persName>
            <foreName>Douglas C.</foreName>
            <surname>Schmidt</surname>
            <initial>D. C.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">Communication of the ACM</title>
        <imprint>
          <biblScope type="volume">40</biblScope>
          <biblScope type="number">10</biblScope>
          <dateStruct>
            <year>1997</year>
          </dateStruct>
          <biblScope type="pages">32-38</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:flesca02detecting" type="inproceedings" id="bid5">
      <analytic>
        <title level="a">Detecting Structural Similarities between XML Documents</title>
        <author>
          <persName>
            <foreName>Sergio</foreName>
            <surname>Flesca</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Giuseppe</foreName>
            <surname>Manco</surname>
            <initial>G.</initial>
          </persName>
          <persName>
            <foreName>Elio</foreName>
            <surname>Masciari</surname>
            <initial>E.</initial>
          </persName>
          <persName>
            <foreName>Luigi</foreName>
            <surname>Pontieri</surname>
            <initial>L.</initial>
          </persName>
          <persName>
            <foreName>Andrea</foreName>
            <surname>Pugliese</surname>
            <initial>A.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">WebDB</title>
        <imprint>
          <dateStruct>
            <year>2002</year>
          </dateStruct>
          <biblScope type="pages">55-60</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:gagi00" type="inproceedings" id="bid0">
      <analytic>
        <title level="a">XTRACT: a system for extracting document type descriptors from XML documents</title>
        <author>
          <persName>
            <foreName>Minos</foreName>
            <surname>Garofalakis</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>Aristides</foreName>
            <surname>Gionis</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>Rajeev</foreName>
            <surname>Rastogi</surname>
            <initial>R.</initial>
          </persName>
          <persName>
            <foreName>S.</foreName>
            <surname>Seshadri</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Kyuseok</foreName>
            <surname>Shim</surname>
            <initial>K.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <imprint>
          <dateStruct>
            <year>2000</year>
          </dateStruct>
          <biblScope type="pages">165–176</biblScope>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://citeseer.ist.psu.edu/garofalakis00xtract.html" location="extern" xyref="1228450255017">http://citeseer.ist.psu.edu/garofalakis00xtract.html</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:Jac94" type="inproceedings" id="bid21">
      <analytic>
        <title level="a">Fuzzy Logic for the Retrieval Step of a Case-Based Reasoner</title>
        <author>
          <persName>
            <foreName>Michel</foreName>
            <surname>Jaczynski</surname>
            <initial>M.</initial>
          </persName>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Second European Workshop on Case-Based Reasoning (EWCBR'94), Chantilly</title>
        <imprint>
          <dateStruct>
            <year>1994</year>
          </dateStruct>
          <biblScope type="pages">313-320</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:Johnson88" type="article" id="bid18">
      <analytic>
        <title level="a">Designing Reusable Classes</title>
        <author>
          <persName>
            <foreName>Ralph E.</foreName>
            <surname>Johnson</surname>
            <initial>R. E.</initial>
          </persName>
          <persName>
            <foreName>Brian</foreName>
            <surname>Foote</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">Journal of Object-oriented programming</title>
        <imprint>
          <biblScope type="volume">1</biblScope>
          <biblScope type="number">2</biblScope>
          <dateStruct>
            <year>1988</year>
          </dateStruct>
          <biblScope type="pages">22–35</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:Konstan97" type="article" id="bid8">
      <analytic>
        <title level="a">GroupLens: Applying collaborative filtering to usenet news</title>
        <author>
          <persName>
            <foreName>Joseph A.</foreName>
            <surname>Konstan</surname>
            <initial>J. A.</initial>
          </persName>
          <persName>
            <foreName>Bradley N.</foreName>
            <surname>Miller</surname>
            <initial>B. N.</initial>
          </persName>
          <persName>
            <foreName>David</foreName>
            <surname>Maltz</surname>
            <initial>D.</initial>
          </persName>
          <persName>
            <foreName>J. L.</foreName>
            <surname>Herlocker</surname>
            <initial>J. L.</initial>
          </persName>
          <persName>
            <foreName>L. R.</foreName>
            <surname>Gordon</surname>
            <initial>L. R.</initial>
          </persName>
          <persName>
            <foreName>J.</foreName>
            <surname>Riedl</surname>
            <initial>J.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">Communications of the ACM</title>
        <imprint>
          <biblScope type="volume">40</biblScope>
          <biblScope type="number">3</biblScope>
          <dateStruct>
            <year>1997</year>
          </dateStruct>
          <biblScope type="pages">77-87</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:YL2003b" type="inproceedings" id="bid49">
      <analytic>
        <title level="a">General dynamic clustering methods on symbolic data tables</title>
        <author>
          <persName key="axis-2005-id18098">
            <foreName>Yves</foreName>
            <surname>Lechevallier</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="axis-2005-id18481">
            <foreName>Rosanna</foreName>
            <surname>Verde</surname>
            <initial>R.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Classification and Data Analysis Group, Bologne,Italie</title>
        <imprint>
          <publisher>
            <orgName>CLADAG2003</orgName>
          </publisher>
          <dateStruct>
            <month>September</month>
            <year>2003</year>
          </dateStruct>
          <biblScope type="pages">245-248</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:YL2004e" type="inproceedings" id="bid50">
      <analytic>
        <title level="a">Crossed Clustering method: An efficient Clustering Method for Web Usage Mining</title>
        <author>
          <persName key="axis-2005-id18098">
            <foreName>Yves</foreName>
            <surname>Lechevallier</surname>
            <initial>Y.</initial>
          </persName>
          <persName key="axis-2005-id18481">
            <foreName>Rosanna</foreName>
            <surname>Verde</surname>
            <initial>R.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Complex Data Analysis, Pekin, Chine</title>
        <imprint>
          <publisher>
            <orgName>CDA'2004</orgName>
          </publisher>
          <dateStruct>
            <month>october</month>
            <year>2004</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:lichmayi04" type="article" id="bid3">
      <analytic>
        <title level="a">An Efficient and Scalable Algorithm for Clustering XML Documents by Structure</title>
        <author>
          <persName>
            <foreName>Wang</foreName>
            <surname>Lian</surname>
            <initial>W.</initial>
          </persName>
          <persName>
            <foreName>David Wai-Lok</foreName>
            <surname>Cheung</surname>
            <initial>D. W.-L.</initial>
          </persName>
          <persName>
            <foreName>Nikos</foreName>
            <surname>Mamoulis</surname>
            <initial>N.</initial>
          </persName>
          <persName>
            <foreName>Siu-Ming</foreName>
            <surname>Yiu</surname>
            <initial>S.-M.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">IEEE Trans. Knowl. Data Eng</title>
        <imprint>
          <biblScope type="volume">16</biblScope>
          <biblScope type="number">1</biblScope>
          <dateStruct>
            <month>January</month>
            <year>2004</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:MaTePo04b" type="inproceedings" id="bid65">
      <analytic>
        <title level="a">Pre-Processing Time Constraints for Efficiently Mining Generalized Sequential Patterns</title>
        <author>
          <persName key="axis-2005-id18166">
            <foreName>Florent</foreName>
            <surname>Masseglia</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Maguelone</foreName>
            <surname>Teisseire</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>Pascal</foreName>
            <surname>Poncelet</surname>
            <initial>P.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">11th International Symposium on Temporal Representation and Reasoning (TIME'04), Tatihou, France</title>
        <imprint>
          <dateStruct>
            <month>1-3 July</month>
            <year>2004</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:JT97" type="inproceedings" id="bid11">
      <analytic>
        <title level="a">Aspects du raisonnement à partir de cas</title>
        <author>
          <persName>
            <foreName>Amédéo</foreName>
            <surname>Napoli</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName/>
            <surname>et al.</surname>
            <initial/>
          </persName>
        </author>
      </analytic>
      <monogr>
        <editor role="editor">
          <persName>
            <foreName>S.</foreName>
            <surname>Pesty</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>P.</foreName>
            <surname>Siegel</surname>
            <initial>P.</initial>
          </persName>
        </editor>
        <title level="m">Actes des 6 èmes journées nationales PRC-GDR Intelligence Artificielle</title>
        <imprint>
          <publisher>
            <orgName>Hermes, Paris</orgName>
          </publisher>
          <dateStruct>
            <month>mars</month>
            <year>1997</year>
          </dateStruct>
          <biblScope type="pages">261-288</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:nija02" type="inproceedings" id="bid1">
      <analytic>
        <title level="a">Evaluating Structural Similarity in XML Documents</title>
        <author>
          <persName>
            <foreName>Andrew</foreName>
            <surname>Nierman</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>H. V.</foreName>
            <surname>Jagadish</surname>
            <initial>H. V.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of the Fifth International Workshop on the Web and Databases (WebDB 2002), Madison, Wisconsin, USA</title>
        <imprint>
          <dateStruct>
            <month>June</month>
            <year>2002</year>
          </dateStruct>
          <ref xlink:actuate="onRequest" xlink:show="replace" xlink:type="simple" xlink:href="http://citeseer.ist.psu.edu/nierman02evaluating.html" location="extern" xyref="4229699122010">http://citeseer.ist.psu.edu/nierman02evaluating.html</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:Sodas2" type="misc" id="bid12">
      <monogr>
        <title level="m">User manual for SODAS 2 Software</title>
        <author>
          <persName>
            <foreName>Monique</foreName>
            <surname>Noirhomme-Fraiture</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName/>
            <surname>et al.</surname>
            <initial/>
          </persName>
        </author>
        <note anchored="yes" place="unspecified" type="bnote">version 1.0</note>
        <imprint>
          <publisher>
            <orgName>FUNDP, Belgique</orgName>
          </publisher>
          <dateStruct>
            <month>april</month>
            <year>2004</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:Resnick97" type="article" id="bid7">
      <analytic>
        <title level="a">Recommender systems</title>
        <author>
          <persName>
            <foreName>Paul</foreName>
            <surname>Resnick</surname>
            <initial>P.</initial>
          </persName>
          <persName>
            <foreName>Hal R.</foreName>
            <surname>Varian</surname>
            <initial>H. R.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">Communications of the ACM</title>
        <imprint>
          <biblScope type="volume">40</biblScope>
          <biblScope type="number">3</biblScope>
          <dateStruct>
            <year>1997</year>
          </dateStruct>
          <biblScope type="pages">56-58</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:RossiEtAlChimio2005" type="inproceedings" id="bid67">
      <analytic>
        <title level="a">Sélection de groupes de variables spectrales par information mutuelle grâce à une représentation spline</title>
        <author>
          <persName key="axis-2005-id18259">
            <foreName>Fabrice</foreName>
            <surname>Rossi</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Damien</foreName>
            <surname>François</surname>
            <initial>D.</initial>
          </persName>
          <persName>
            <foreName>Vincent</foreName>
            <surname>Wertz</surname>
            <initial>V.</initial>
          </persName>
          <persName>
            <foreName>Michel</foreName>
            <surname>Verleysen</surname>
            <initial>M.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Actes de la conférence Chimiométrie 2005, Villeneuve d'Ascq (France)</title>
        <imprint>
          <dateStruct>
            <month>November–December</month>
            <year>2005</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:RossiEtAl05Chemometrics" type="article" id="bid66">
      <analytic>
        <title level="a">Mutual information for the selection of relevant variables in spectrometric nonlinear modelling</title>
        <author>
          <persName key="axis-2005-id18259">
            <foreName>Fabrice</foreName>
            <surname>Rossi</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Amaury</foreName>
            <surname>Lendasse</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>Damien</foreName>
            <surname>François</surname>
            <initial>D.</initial>
          </persName>
          <persName>
            <foreName>Vincent</foreName>
            <surname>Wertz</surname>
            <initial>V.</initial>
          </persName>
          <persName>
            <foreName>Michel</foreName>
            <surname>Verleysen</surname>
            <initial>M.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">Chemometrics and Intelligent Laboratory Systems</title>
        <note anchored="yes" place="unspecified" type="bnote">In press</note>
        <imprint>
          <dateStruct>
            <year>2005</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:mobivip-D5.1" type="misc" id="bid58">
      <monogr>
        <title level="m">Définition du scénario générique guidant l'évalaution du service VIP</title>
        <author>
          <persName key="axis-2005-id18195">
            <foreName>Bernard</foreName>
            <surname>Senach</surname>
            <initial>B.</initial>
          </persName>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
        </author>
        <note anchored="yes" place="unspecified" type="bnote">INRIA Sophia Antipolis, Delivrable D5.2. du Projet PREDIT MOBIVIP</note>
        <imprint>
          <dateStruct>
            <month>December</month>
            <year>2004</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:Shardanand95" type="inproceedings" id="bid6">
      <analytic>
        <title level="a">Social Information Filtering: Algorithms for Automating Word of mouth</title>
        <author>
          <persName>
            <foreName>Upendra</foreName>
            <surname>Shardanand</surname>
            <initial>U.</initial>
          </persName>
          <persName>
            <foreName>Pattie</foreName>
            <surname>Maes</surname>
            <initial>P.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">CHI'95: Mosaic of creativity, Denver, Colorado</title>
        <imprint>
          <publisher>
            <orgName>ACM</orgName>
          </publisher>
          <dateStruct>
            <month>May</month>
            <year>1995</year>
          </dateStruct>
          <biblScope type="pages">210-217</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:TrChGa:Genie:2004" type="article" id="bid61">
      <analytic>
        <title level="a">Faciliter les déplacements par des recommandations personnalisées à la recherche d'information</title>
        <author>
          <persName key="axis-2005-id18078">
            <foreName>Brigitte</foreName>
            <surname>Trousse</surname>
            <initial>B.</initial>
          </persName>
          <persName key="axis-2005-id18372">
            <foreName>Sergiu</foreName>
            <surname>Chelcea</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Georges</foreName>
            <surname>Gallais</surname>
            <initial>G.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">Revue Génie Logiciel, rubrique Systèmes d'informations et transports</title>
        <imprint>
          <biblScope type="number">70</biblScope>
          <dateStruct>
            <month>September</month>
            <year>2004</year>
          </dateStruct>
          <biblScope type="pages">48 - 57</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:Wess94" type="inproceedings" id="bid20">
      <analytic>
        <title level="a">Using K-d Trees to Improve the Retrieval Step in Case-Based Reasoning</title>
        <author>
          <persName>
            <foreName>Stefan</foreName>
            <surname>Wess</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Klaus-Dieter</foreName>
            <surname>Althoff</surname>
            <initial>K.-D.</initial>
          </persName>
          <persName>
            <foreName>Guido</foreName>
            <surname>Derwand</surname>
            <initial>G.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <editor role="editor">
          <persName>
            <foreName>S.</foreName>
            <surname>Wess</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>K.D.</foreName>
            <surname>Althoff</surname>
            <initial>K.</initial>
          </persName>
          <persName>
            <foreName>M. M.</foreName>
            <surname>Richter</surname>
            <initial>M. M.</initial>
          </persName>
        </editor>
        <title level="m">Lecture Notes in Artificial Intelligence, Topics in Case-Based Reasoning</title>
        <imprint>
          <publisher>
            <orgName>Springer-Verlag</orgName>
          </publisher>
          <dateStruct>
            <year>1994</year>
          </dateStruct>
          <biblScope type="pages">167-181</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:footprints97" type="inproceedings" id="bid9">
      <analytic>
        <title level="a">Using History to Assist Information Browsing</title>
        <author>
          <persName>
            <foreName>Alan</foreName>
            <surname>Wexelblat</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>Pattie</foreName>
            <surname>Maes</surname>
            <initial>P.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">Proceedings of the RIAO'97 Symposioum: Computer-Assisted Information Retrieval on the Internet, Montreal, Canada</title>
        <imprint>
          <dateStruct>
            <month>June</month>
            <year>1997</year>
          </dateStruct>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:Yan96" type="article" id="bid10">
      <analytic>
        <title level="a">From user access patterns to dynamic hypertext linking</title>
        <author>
          <persName>
            <foreName>Tak Woon</foreName>
            <surname>Yan</surname>
            <initial>T. W.</initial>
          </persName>
          <persName>
            <foreName>Matthew</foreName>
            <surname>Jacobsen</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>Hector</foreName>
            <surname>Garcia-Molina</surname>
            <initial>H.</initial>
          </persName>
          <persName>
            <foreName>Umeshwar</foreName>
            <surname>Dayal</surname>
            <initial>U.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="j">Computer Network and ISDN systems</title>
        <note anchored="yes" place="unspecified" type="bnote">(proceedings of the 5th international WWW conference)</note>
        <imprint>
          <biblScope type="volume">28</biblScope>
          <dateStruct>
            <month>mai</month>
            <year>1996</year>
          </dateStruct>
          <biblScope type="pages">1007-1014</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct rend="foot" n="footcite:yi00classifier" type="inproceedings" id="bid4">
      <analytic>
        <title level="a">A classifier for semi-structured documents</title>
        <author>
          <persName>
            <foreName>Jeonghee</foreName>
            <surname>Yi</surname>
            <initial>J.</initial>
          </persName>
          <persName>
            <foreName>Neel</foreName>
            <surname>Sundaresan</surname>
            <initial>N.</initial>
          </persName>
        </author>
      </analytic>
      <monogr>
        <title level="m">KDD '00: Proceedings of the sixth ACM SIGKDD international conference on Knowledge discovery and data mining, New York, NY, USA</title>
        <imprint>
          <publisher>
            <orgName>ACM Press</orgName>
          </publisher>
          <dateStruct>
            <year>2000</year>
          </dateStruct>
          <biblScope type="pages">340–344</biblScope>
        </imprint>
      </monogr>
    </biblStruct>
  </biblio>
</raweb>
