<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE raweb PUBLIC "-//INRIA//DTD " "raweb2.dtd">
<raweb xmlns:xlink="http://www.w3.org/1999/xlink" xml:lang="en" year="2012">
  <identification id="sierra" isproject="true">
    <shortname>SIERRA</shortname>
    <projectName>Statistical Machine Learning and Parsimony</projectName>
    <theme-de-recherche>Optimization, Learning and Statistical Methods</theme-de-recherche>
    <domaine-de-recherche>Applied Mathematics, Computation and Simulation</domaine-de-recherche>
    <urlTeam>http://www.di.ens.fr/sierra/</urlTeam>
    <datecreation type="Team">January 01, 2011 </datecreation>
    <structure_exterieure type="Labs">
      <libelle>Département d'Informatique de l'Ecole Normale Supérieure</libelle>
    </structure_exterieure>
    <structure_exterieure type="Organism">
      <libelle>CNRS</libelle>
    </structure_exterieure>
    <structure_exterieure type="Organism">
      <libelle>Ecole normale supérieure de Paris</libelle>
    </structure_exterieure>
    <UR name="Rocquencourt"/>
    <keywords>
      <term>Machine Learning</term>
      <term>Statistics</term>
      <term>Convex Optimization</term>
      <term>Data Mining</term>
    </keywords>
    <moreinfo/>
  </identification>
  <team id="uid1">
    <person key="select-2006-idm193321381344">
      <firstname>Sylvain</firstname>
      <lastname>Arlot</lastname>
      <affiliation>CNRS</affiliation>
      <categoryPro>Chercheur</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>Junior Researcher CNRS</moreinfo>
    </person>
    <person key="willow-2007-idm119098005552">
      <firstname>Francis</firstname>
      <lastname>Bach</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>Chercheur</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>Team leader, Senior researcher “détaché” at Inria from Corps des Mines</moreinfo>
      <hdr>oui</hdr>
    </person>
    <person key="willow-2009-idm241890428288">
      <firstname>Guillaume</firstname>
      <lastname>Obozinski</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>Chercheur</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>Ingénieur Expert de Recherche</moreinfo>
    </person>
    <person key="willow-2009-idm241890420336">
      <firstname>Louise</firstname>
      <lastname>Benoît</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
    </person>
    <person key="willow-2009-idm241890415088">
      <firstname>Florent</firstname>
      <lastname>Couzinié-Devy</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
    </person>
    <person key="sierra-2012-idm442940210896">
      <firstname>Fajwel</firstname>
      <lastname>Fogel</lastname>
      <affiliation>CNRS</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
    </person>
    <person key="willow-2010-idm1079616768">
      <firstname>Edouard</firstname>
      <lastname>Grave</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
    </person>
    <person key="willow-2009-idm241890407184">
      <firstname>Toby</firstname>
      <lastname>Hocking</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>graduated on November 20, 2012</moreinfo>
    </person>
    <person key="willow-2009-idm241890401936">
      <firstname>Armand</firstname>
      <lastname>Joulin</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>graduated on December 17, 2012</moreinfo>
    </person>
    <person key="sierra-2012-idm442940199568">
      <firstname>Rémi</firstname>
      <lastname>Lajugie</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
    </person>
    <person key="sierra-2012-idm442940196944">
      <firstname>Loic</firstname>
      <lastname>Landrieu</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
    </person>
    <person key="willow-2009-idm241890399312">
      <firstname>Augustin</firstname>
      <lastname>Lefèvre</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>graduated on October 3, 2012</moreinfo>
    </person>
    <person key="sierra-2012-idm442940191264">
      <firstname>Alex</firstname>
      <lastname>Mesnil</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
    </person>
    <person key="sierra-2011-idm457989345136">
      <firstname>Anil</firstname>
      <lastname>Nelakanti</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>Cifre Ph.D. with Xerox</moreinfo>
    </person>
    <person key="parietal-2009-idm302557838896">
      <firstname>Fabian</firstname>
      <lastname>Pedregosa</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
    </person>
    <person key="flowers-2008-idm186862164224">
      <firstname>Thomas</firstname>
      <lastname>Schatz</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
    </person>
    <person key="willow-2010-idm1079619392">
      <firstname>Matthieu</firstname>
      <lastname>Solnon</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>PhD</categoryPro>
      <research-centre>Rocquencourt</research-centre>
    </person>
    <person key="classic-2012-idm487366258672">
      <firstname>Lindsay</firstname>
      <lastname>Polienor</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>Assistant</categoryPro>
      <research-centre>Rocquencourt</research-centre>
    </person>
    <person key="imedia-2006-idm544971845104">
      <firstname>Jean-Paul</firstname>
      <lastname>Chieze</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>Technique</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>Ingénieur SED</moreinfo>
    </person>
    <person key="sierra-2011-idm457989376096">
      <firstname>Simon</firstname>
      <lastname>Lacoste-Julien</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>PostDoc</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>financed by Mairie de Paris and ERC grant</moreinfo>
    </person>
    <person key="cafe-2006-idm360414076672">
      <firstname>Nicolas</firstname>
      <lastname>Le Roux</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>PostDoc</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>financed by ERC grant, until September 20, 2012</moreinfo>
    </person>
    <person key="sierra-2011-idm457989373152">
      <firstname>Ronny</firstname>
      <lastname>Luss</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>PostDoc</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>financed by associated team STATWEB, until September 1, 2012</moreinfo>
    </person>
    <person key="sierra-2011-idm457989367008">
      <firstname>Mark</firstname>
      <lastname>Schmidt</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>PostDoc</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>financed by ERC grant</moreinfo>
    </person>
    <person key="sierra-2012-idm442940159744">
      <firstname>Nino</firstname>
      <lastname>Shervashidze</lastname>
      <affiliation>INRIA</affiliation>
      <categoryPro>PostDoc</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>since December 1, 2012</moreinfo>
    </person>
    <person key="sierra-2012-idm442940156688">
      <firstname>Michael</firstname>
      <lastname>Jordan</lastname>
      <affiliation>UnivFr</affiliation>
      <categoryPro>Visiteur</categoryPro>
      <research-centre>Rocquencourt</research-centre>
      <moreinfo>financed by Fondation de Sciences Mathématiques de Paris</moreinfo>
    </person>
  </team>
  <presentation id="uid2">
    <bodyTitle>Overall Objectives</bodyTitle>
    <subsection id="uid3" level="1">
      <bodyTitle>Statement</bodyTitle>
      <p>Machine learning is a recent scientific domain, positioned between
applied mathematics, statistics and computer science. Its goals are
the optimization, control, and modelisation of complex systems from
examples. It applies to data from numerous engineering and scientific
fields (e.g., vision, bioinformatics, neuroscience, audio processing,
text processing, economy, finance, etc.), the ultimate goal being to
derive general theories and algorithms allowing advances in each of
these domains. Machine learning is characterized by the high quality
and quantity of the exchanges between theory, algorithms and
applications: interesting theoretical problems almost always emerge
from applications, while theoretical analysis allows the understanding
of why and when popular or successful algorithms do or do not work,
and leads to proposing significant improvements.</p>
      <p>Our academic positioning is exactly at the intersection between these
three aspects—algorithms, theory and applications—and our main
research goal is to make the link between theory and algorithms, and
between algorithms and high-impact applications in various engineering
and scientific fields, in particular computer vision, bioinformatics,
audio processing, text processing and neuro-imaging.</p>
      <p>Machine learning is now a vast field of research and the team focuses
on the following aspects: supervised learning (kernel methods,
calibration), unsupervised learning (matrix factorization, statistical
tests), parsimony (structured sparsity, theory and algorithms), and
optimization (convex optimization, bandit learning). These four
research axes are strongly interdependent, and the interplay between
them is key to successful practical applications.</p>
    </subsection>
    <subsection id="uid4" level="1">
      <bodyTitle>Highlights of the Year</bodyTitle>
      <simplelist>
        <li id="uid5">
          <p noindent="true">Rodolphe Jenatton (former PhD student, graduated in 2011) received two thesis prizes (Fondation Hadamard and AFIA).</p>
        </li>
        <li id="uid6">
          <p noindent="true">Francis Bach received the Inria young researcher prize.</p>
        </li>
        <li id="uid7">
          <p noindent="true">Monograph published in the collection <i>Foundations and Trends in Machine Learning</i>: “Optimization with sparsity-inducing penalties”.</p>
        </li>
      </simplelist>
    </subsection>
  </presentation>
  <fondements id="uid8">
    <bodyTitle>Scientific Foundations</bodyTitle>
    <subsection id="uid9" level="1">
      <bodyTitle>Supervised Learning</bodyTitle>
      <p>This part of our research focuses on methods where, given a set of
examples of input/output pairs, the goal is to predict the output
for a new input, with research on kernel methods, calibration methods,
and multi-task learning.
</p>
    </subsection>
    <subsection id="uid10" level="1">
      <bodyTitle>Unsupervised Learning</bodyTitle>
      <p>We focus here on methods where no output is given and the goal is to
find structure of certain known types (e.g., discrete or
low-dimensional) in the data, with a focus on matrix factorization,
statistical tests, dimension reduction, and semi-supervised learning.
</p>
    </subsection>
    <subsection id="uid11" level="1">
      <bodyTitle>Parsimony</bodyTitle>
      <p>The concept of parsimony is central to many areas of science. In the
context of statistical machine learning, this takes the form of
variable or feature selection. The team focuses primarily on
structured sparsity, with theoretical and algorithmic contributions
(this is the main topic of the ERC starting investigator grant awarded
to F. Bach).
</p>
    </subsection>
    <subsection id="uid12" level="1">
      <bodyTitle>Optimization</bodyTitle>
      <p>Optimization in all its forms is central to machine learning, as many
of its theoretical frameworks are based at least in part on
empirical risk minimization. The team focuses primarily on convex and
bandit optimization, with a particular focus on large-scale optimization.
</p>
    </subsection>
  </fondements>
  <domaine id="uid13">
    <bodyTitle>Application Domains</bodyTitle>
    <subsection id="uid14" level="1">
      <bodyTitle>Application Domains</bodyTitle>
      <p>Machine learning research can be conducted from two main perspectives: the first one, which has been dominant in the last 30 years, is to design learning algorithms and theories which are as generic as possible, the goal being to make as few assumptions as possible regarding the problems to be solved and to let data speak for themselves. This has led to many interesting methodological developments and successful applications. However, we believe that this strategy has reached its limit for many application domains, such as computer vision, bioinformatics, neuro-imaging, text and audio processing, which leads to the second perspective our team is built on: Research in machine learning theory and algorithms should be driven by interdisciplinary collaborations, so that specific prior knowledge may be properly introduced into the learning process, in particular with the following fields:</p>
      <simplelist>
        <li id="uid15">
          <p noindent="true">Computer vision: objet recognition, object detection, image segmentation, image/video processing, computational photography. In collaboration with the Willow project-team.</p>
        </li>
        <li id="uid16">
          <p noindent="true">Bioinformatics: cancer diagnosis, protein function prediction, virtual screening. In collaboration with Institut Curie.</p>
        </li>
        <li id="uid17">
          <p noindent="true">Text processing: document collection modeling, language models.</p>
        </li>
        <li id="uid18">
          <p noindent="true">Audio processing: source separation, speech/music processing. In collaboration with Telecom Paristech.</p>
        </li>
        <li id="uid19">
          <p noindent="true">Neuro-imaging: brain-computer interface (fMRI, EEG, MEG). In collaboration with the Parietal project-team.</p>
        </li>
      </simplelist>
    </subsection>
  </domaine>
  <logiciels id="uid20">
    <bodyTitle>Software</bodyTitle>
    <subsection id="uid21" level="1">
      <bodyTitle>
        <ref xlink:href="http://spams-devel.gforge.inria.fr/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">SPAMS (SPArse Modeling Software)</ref>
      </bodyTitle>
      <participants>
        <person key="imedia-2006-idm544971845104">
          <firstname>Jean-Paul</firstname>
          <lastname>Chieze</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
        <person key="willow-2009-idm241890428288">
          <firstname>Guillaume</firstname>
          <lastname>Obozinski</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
      </participants>
      <p>SPAMS (SPArse Modeling Software) is an optimization toolbox for solving various
sparse estimation problems: dictionary learning and matrix factorization, solving sparse decomposition prob-
lems, solving structured sparse decomposition problems. It is developped by Julien Mairal (former Willow PhD student, co-advised by F. Bach and J. Ponce), with the collaboration of Francis Bach (Inria), Jean
Ponce (Ecole Normale Supérieure), Guillermo Sapiro (University of Minnesota), Rodolphe Jenatton (Inria)
and Guillaume Obozinski (Inria). It is coded in C++ with a Matlab interface. Recently, interfaces for R
and Python have been developed by Jean-Paul Chieze (Inria). Currently 650 downloads and between 1500
and 2000 page visits per month. See <ref xlink:href="http://spams-devel.gforge.inria.fr/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>spams-devel.<allowbreak/>gforge.<allowbreak/>inria.<allowbreak/>fr/</ref>.</p>
    </subsection>
    <subsection id="uid22" level="1">
      <bodyTitle>
        <ref xlink:href="http://mlg.eng.cam.ac.uk/slacoste/sigma/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">SiGMa - Simple Greedy Matching: a tool for aligning large knowledge-bases</ref>
      </bodyTitle>
      <participants>
        <person key="sierra-2011-idm457989376096">
          <firstname>Simon</firstname>
          <lastname>Lacoste-Julien</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
      </participants>
      <p>SiGMa - Simple Greedy Matching: a tool for aligning large knowledge-bases</p>
      <p>Version 1. Webpage: <ref xlink:href="http://mlg.eng.cam.ac.uk/slacoste/sigma/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>mlg.<allowbreak/>eng.<allowbreak/>cam.<allowbreak/>ac.<allowbreak/>uk/<allowbreak/>slacoste/<allowbreak/>sigma/</ref>.</p>
      <p>The tool SiGMa (Simple Greedy Matching) is a knowledge base alignment
tool implemented in Python. It takes as input two knowledge bases,
each represented as a list of triples of (entity, relationship,
entity), in addition to a partial alignment between the relationships
from one knowledge base to the other, and gives as output an ordered
list of proposed entity matches between the two knowledge base (where
the order corresponds heuristically to a notion of certainty about
these matches). The matching decisions are made in a greedy fashion,
combining information about the relationship graph as well as a
pairwise similarity scores defined between the entities. The code
handles various sources of information to be used for this score, such
as a similarity defined on strings, dates, and other entity properties
– and gives a few options to the user.</p>
      <p>We also provide two large-scale knowledge base alignment benchmark
datasets with tens of thousands of ground truth pairs: YAGO aligned to
IMDb as well as Freebase aligned to IMDb.</p>
      <p>Participants outside of Sierra: Konstantina Palla, Alex Davies, Zoubin
Ghahramani (Machine Learning Group, Department of Engineering,
University of Cambridge); Gjergji Kasneci, Thore Graepel (Microsoft
Research Cambridge)</p>
      <p>See <ref xlink:href="http://mlg.eng.cam.ac.uk/slacoste/sigma/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>mlg.<allowbreak/>eng.<allowbreak/>cam.<allowbreak/>ac.<allowbreak/>uk/<allowbreak/>slacoste/<allowbreak/>sigma/</ref>.</p>
    </subsection>
    <subsection id="uid23" level="1">
      <bodyTitle>
        <ref xlink:href="http://www.di.ens.fr/~mschmidt/Software/minFunc.html" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">minFunc (2012 version)</ref>
      </bodyTitle>
      <participants>
        <person key="sierra-2011-idm457989367008">
          <firstname>Mark</firstname>
          <lastname>Schmidt</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
      </participants>
      <p>minFunc is a Matlab function for unconstrained optimization of differentiable real-valued multivariate functions using line-search methods. It uses an interface very similar to the Matlab Optimization Toolbox function fminunc, and can be called as a replacement for this function. On many problems, minFunc requires fewer function evaluations to converge than fminunc (or minimize.m). Further it can optimize problems with a much larger number of variables (fminunc is restricted to several thousand variables), and uses a line search that is robust to several common function pathologies.</p>
      <p>The default parameters of minFunc call a quasi-Newton strategy, where limited-memory BFGS updates with Shanno-Phua scaling are used in computing the step direction, and a bracketing line-search for a point satisfying the strong Wolfe conditions is used to compute the step direction. In the line search, (safeguarded) cubic interpolation is used to generate trial values, and the method switches to an Armijo back-tracking line search on iterations where the objective function enters a region where the parameters do not produce a real valued output (i.e. complex, NaN, or Inf).
See <ref xlink:href="http://www.di.ens.fr/~mschmidt/Software/minFunc.html" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>www.<allowbreak/>di.<allowbreak/>ens.<allowbreak/>fr/<allowbreak/>~mschmidt/<allowbreak/>Software/<allowbreak/>minFunc.<allowbreak/>html</ref>.</p>
    </subsection>
    <subsection id="uid24" level="1">
      <bodyTitle>
        <ref xlink:href="http://www.di.ens.fr/~mschmidt/Software/minFunc.html" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">prettyPlot</ref>
      </bodyTitle>
      <participants>
        <person key="sierra-2011-idm457989367008">
          <firstname>Mark</firstname>
          <lastname>Schmidt</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
      </participants>
      <p>The prettyPlot function is a simple wrapper to Matlab's plot function for quickly making nicer-looking plots. Here are the features:
Made the default line styles bigger, and the default fonts nicer.
Options are passed as a structure, instead of through plot's large number of different functions.
You can pass in cell arrays to have lines of different lengths.
You can pass an <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mi>n</mi><mo>×</mo><mn>3</mn></mrow></math></formula> matrix of colors, and cell arrays of line-styles and/or markers. It will cycle through the given choices.
All markers are placed on top of (all) lines, you do not have to put a marker on every data point, and you can use different spacing between markers for different lines.
You can change only the upper or lower x-limit (y-limit), rather than having to specify both.
There is some support for making nicer-looking error lines.
See <ref xlink:href="http://www.di.ens.fr/~mschmidt/Software/prettyPlot.html" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>www.<allowbreak/>di.<allowbreak/>ens.<allowbreak/>fr/<allowbreak/>~mschmidt/<allowbreak/>Software/<allowbreak/>prettyPlot.<allowbreak/>html</ref>.</p>
    </subsection>
    <subsection id="uid25" level="1">
      <bodyTitle>
        <ref xlink:href="http://segannot.r-forge.r-project.org/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">SegAnnot</ref>
      </bodyTitle>
      <participants>
        <person key="willow-2009-idm241890407184">
          <firstname>Toby</firstname>
          <lastname>Hocking</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
      </participants>
      <p>SegAnnot: an R package for fast segmentation of annotated piecewise constant signals. Tech report and R package. Standard segmentation models for piecewise constant signals do not always agree with an expert's visual interpretation of the signal, as encoded using a set of annotations. This R package implements a dynamic programming algorithm which can be used to quickly find a segmentation model in agreement with expert annotations.
Collaboration with Guillem Rigaill (Inria - AgroParisTech). See <ref xlink:href="http://hal.inria.fr/hal-00759129" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00759129</ref> and <ref xlink:href="http://segannot.r-forge.r-project.org/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>segannot.<allowbreak/>r-forge.<allowbreak/>r-project.<allowbreak/>org/</ref>.</p>
    </subsection>
  </logiciels>
  <resultats id="uid26">
    <bodyTitle>New Results</bodyTitle>
    <subsection id="uid27" level="1">
      <bodyTitle>A Stochastic Gradient Method with an Exponential Convergence Rate for Strongly-Convex Optimization with Finite Training Sets</bodyTitle>
      <participants>
        <person key="willow-2007-idm119098005552">
          <firstname>Francis</firstname>
          <lastname>Bach</lastname>
        </person>
        <person key="sierra-2011-idm457989367008">
          <firstname>Mark</firstname>
          <lastname>Schmidt</lastname>
        </person>
        <person key="cafe-2006-idm360414076672">
          <firstname>Nicolas</firstname>
          <lastname>Le Roux</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
      </participants>
      <p>In <ref xlink:href="#sierra-2012-bid0" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we propose a new stochastic gradient method for optimizing the sum of a finite set of smooth functions, where the sum is strongly convex. While standard stochastic gradient methods converge at sublinear rates for this problem, the proposed method incorporates a memory of previous gradient values in order to achieve a linear convergence rate. In a machine learning context, numerical experiments indicate that the new algorithm can dramatically outperform standard algorithms, both in terms of optimizing the training objective and reducing the testing objective quickly.
</p>
    </subsection>
    <subsection id="uid28" level="1">
      <bodyTitle>Convex Relaxation for Combinatorial Penalties</bodyTitle>
      <participants>
        <person key="willow-2007-idm119098005552">
          <firstname>Francis</firstname>
          <lastname>Bach</lastname>
        </person>
        <person key="willow-2009-idm241890428288">
          <firstname>Guillaume</firstname>
          <lastname>Obozinski</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
      </participants>
      <p>In <ref xlink:href="#sierra-2012-bid1" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we propose an unifying view of several recently proposed structured sparsity-inducing norms. We consider the situation of a model simultaneously (a) penalized by a set- function de ned on the support of the unknown parameter vector which represents prior knowledge on supports, and (b) regularized in Lp-norm. We show that the natural combinatorial optimization problems obtained may be relaxed into convex optimization problems and introduce a notion, the lower combinatorial envelope of a set-function, that characterizes the tightness of our relaxations. We moreover establish links with norms based on latent representations including the latent group Lasso and block-coding, and with norms obtained from submodular functions.</p>
    </subsection>
    <subsection id="uid29" level="1">
      <bodyTitle>Kernel change-point detection</bodyTitle>
      <participants>
        <person key="select-2006-idm193321381344">
          <firstname>Sylvain</firstname>
          <lastname>Arlot</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
      </participants>
      <p>In <ref xlink:href="#sierra-2012-bid2" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we tackle the change-point problem with data belonging to a general set. We propose a penalty for choosing the number of change-points in the kernel-based method of Harchaoui and Cappé (2007). This penalty generalizes the one proposed for one dimensional signals by Lebarbier (2005). We prove it satisfies a non-asymptotic oracle inequality by showing a new concentration result in Hilbert spaces. Experiments on synthetic and real data illustrate the accuracy of our method, showing it can detect changes in the whole distribution of data, even when the mean and variance are constant. Our algorithm can also deal with data of complex nature, such as the GIST descriptors which are commonly used for video temporal segmentation.</p>
      <p>Collaboration with Alain Celisse (University Lille 1; Inria Lille, MODAL team) and Zaïd Harchaoui (Inria Grenoble, LEAR team).</p>
    </subsection>
    <subsection id="uid30" level="1">
      <bodyTitle>On the Equivalence between Herding and Conditional Gradient Algorithms</bodyTitle>
      <participants>
        <person key="willow-2007-idm119098005552">
          <firstname>Francis</firstname>
          <lastname>Bach</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
        <person key="sierra-2011-idm457989376096">
          <firstname>Simon</firstname>
          <lastname>Lacoste-Julien</lastname>
        </person>
        <person key="willow-2009-idm241890428288">
          <firstname>Guillaume</firstname>
          <lastname>Obozinski</lastname>
        </person>
      </participants>
      <p>In <ref xlink:href="#sierra-2012-bid3" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we show that the herding procedure of Welling (2009) takes exactly the form of a standard convex optimization algorithm–namely a conditional gradient algorithm minimizing a quadratic moment discrepancy. This link enables us to invoke convergence results from convex optimization and to consider faster alternatives for the task of approximating integrals in a reproducing kernel Hilbert space. We study the behavior of the different variants through numerical simulations. The experiments indicate that while we can improve over herding on the task of approximating integrals, the original herding algorithm tends to approach more often the maximum entropy distribution, shedding more light on the learning bias behind herding.</p>
    </subsection>
    <subsection id="uid31" level="1">
      <bodyTitle><formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>V</mi></math></formula>-fold cross-validation and <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>V</mi></math></formula>-fold penalization in least-squares density estimation</bodyTitle>
      <participants>
        <person key="select-2006-idm193321381344">
          <firstname>Sylvain</firstname>
          <lastname>Arlot</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
      </participants>
      <p>In <ref xlink:href="#sierra-2012-bid4" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we study <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>V</mi></math></formula>-fold cross-validation for model selection in least-squares density estimation. The goal is to provide theoretical grounds for choosing <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>V</mi></math></formula> in order to minimize the least-squares risk of the selected estimator.
We first prove a non asymptotic oracle inequality for <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>V</mi></math></formula>-fold cross-validation and its bias-corrected version (<formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>V</mi></math></formula>-fold penalization), with an upper bound decreasing as a function of <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>V</mi></math></formula>. In particular, this result implies <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>V</mi></math></formula>-fold penalization is asymptotically optimal. Then, we compute the variance of <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>V</mi></math></formula>-fold cross-validation and related criteria, as well as the variance of key quantities for model selection performances. We show these variances depend on <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>V</mi></math></formula> like <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mn>1</mn><mo>+</mo><mn>1</mn><mo>/</mo><mo>(</mo><mi>V</mi><mo>-</mo><mn>1</mn><mo>)</mo></mrow></math></formula> (at least in some particular cases), suggesting the performances increase much from <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mi>V</mi><mo>=</mo><mn>2</mn></mrow></math></formula> to <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mi>V</mi><mo>=</mo><mn>5</mn></mrow></math></formula> or 10, and then is almost constant. Overall, this explains the common advice to take <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mrow><mi>V</mi><mo>=</mo><mn>10</mn><mspace width="0.166667em"/></mrow></math></formula>—at least in our setting and when the computational power is limited—, as confirmed by some simulation experiments.</p>
      <p>Collaboration with Matthieu Lerasle (CNRS, University Nice Sophia Antipolis).</p>
    </subsection>
    <subsection id="uid32" level="1">
      <bodyTitle>Machine learning for Neuro-imaging</bodyTitle>
      <participants>
        <person key="parietal-2009-idm302557838896">
          <firstname>Fabian</firstname>
          <lastname>Pedregosa</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
        <person key="willow-2007-idm119098005552">
          <firstname>Francis</firstname>
          <lastname>Bach</lastname>
        </person>
        <person key="willow-2009-idm241890428288">
          <firstname>Guillaume</firstname>
          <lastname>Obozinski</lastname>
        </person>
      </participants>
      <p>In the course of the year 2011-2012 two articles where submitted and accepted in international workshops. The first published article, <b>Improved brain pattern recovery through ranking approaches</b> (<ref xlink:href="#sierra-2012-bid5" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>) was presented at the 2nd International Workshop on Pattern Recognition in NeuroImaging in London, July 2012 and proposes a new approach for the problem of estimating the coefficients of a generalized linear model with monotonicity constraint. For this, we explore the use of ranking techniques, which are popular in the context of information retrieval but novel for medical imaging applications.</p>
      <p>The second published article, <b>Learning to rank from medical imaging data</b> (<ref xlink:href="#sierra-2012-bid6" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>) uses the same techniques as the previous article to solve a more fundamental problem, that is, to predict a quantitative (and potentially non-linear) variable from a set of noisy measurements. We show on simulations and two fMRI datasets
that this approach is able to predict the correct ordering on pairs of images, yielding higher prediction accuracy than standard regression and
multiclass classification techniques.</p>
      <p>Collaboration with the Parietal project-team (A. Gramfort, B. Thirion, G. Varoquaux)</p>
    </subsection>
    <subsection id="uid33" level="1">
      <bodyTitle>SiGMa: Simple Greedy Matching for Aligning Large Knowledge Bases</bodyTitle>
      <participants>
        <person key="sierra-2011-idm457989376096">
          <firstname>Simon</firstname>
          <lastname>Lacoste-Julien</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
      </participants>
      <p>The Internet has enabled the creation of a growing number of
large-scale knowledge bases in a variety of domains containing
complementary information. Tools for automatically aligning these
knowledge bases would make it possible to unify many sources of
structured knowledge and answer complex queries. However, the
efficient alignment of large-scale knowledge bases still poses a
considerable challenge. In <ref xlink:href="#sierra-2012-bid7" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we present Simple Greedy Matching
(SiGMa), a simple algorithm for aligning knowledge bases with millions
of entities and facts. SiGMa is an iterative propagation algorithm
which leverages both the structural information from the relationship
graph as well as flexible similarity measures between entity
properties in a greedy local search, thus making it scalable. Despite
its greedy nature, our experiments indicate that SiGMa can efficiently
match some of the world's largest knowledge bases with high precision.
We provide additional experiments on benchmark datasets which
demonstrate that SiGMa can outperform state-of-the-art approaches both
in accuracy and efficiency.</p>
      <p>Collaboration with Konstantina Palla, Alex Davies, Zoubin Ghahramani
(Machine Learning Group, Department of Engineering, University of
Cambridge); Gjergji Kasneci (Max Planck Institut fur Informatik);
Thore Graepel (Microsoft Research Cambridge).</p>
    </subsection>
    <subsection id="uid34" level="1">
      <bodyTitle>Block-Coordinate Frank-Wolfe Optimization for Structural SVMs</bodyTitle>
      <participants>
        <person key="sierra-2011-idm457989376096">
          <firstname>Simon</firstname>
          <lastname>Lacoste-Julien</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
        <person key="sierra-2011-idm457989367008">
          <firstname>Mark</firstname>
          <lastname>Schmidt</lastname>
        </person>
      </participants>
      <p>In <ref xlink:href="#sierra-2012-bid8" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we propose a randomized block-coordinate variant of the classic
Frank-Wolfe algorithm for convex optimization with block-separable
constraints. Despite its lower iteration cost, we show that it
achieves the same convergence rate in duality gap as the full
Frank-Wolfe algorithm. We also show that, when applied to the dual
structural support vector machine (SVM) objective, this yields an
online algorithm that has the same low iteration complexity as primal
stochastic subgradient methods. However, unlike stochastic subgradient
methods, the stochastic Frank-Wolfe algorithm allows us to compute the
optimal step-size and yields a computable duality gap guarantee. Our
experiments indicate that this simple algorithm outperforms competing
structural SVM solvers.</p>
      <p>Collaboration with Martin Jaggi (Centre de Mathématiques Appliquées,
Ecole Polytechnique); Patrick Pletscher (Machine Learning Laboratory,
ETH Zurich).</p>
    </subsection>
    <subsection id="uid35" level="1">
      <bodyTitle>A convex relaxation for weakly supervised classifiers</bodyTitle>
      <participants>
        <person key="willow-2009-idm241890401936">
          <firstname>Armand</firstname>
          <lastname>Joulin</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
        <person key="willow-2007-idm119098005552">
          <firstname>Francis</firstname>
          <lastname>Bach</lastname>
        </person>
      </participants>
      <p>In <ref xlink:href="#sierra-2012-bid9" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we introduce a general multi-class approach to weakly
supervised classification. Inferring the labels and learning the
parameters of the model is usually done jointly through a
block-coordinate descent algorithm such as expectation-maximization
(EM), which may lead to local minima. To avoid this problem, we
propose a cost function based on a convex relaxation of the soft-max
loss. We then propose an algorithm specifically designed to
efficiently solve the corresponding semidefinite program (SDP).
Empirically, our method compares favorably to standard ones on
different datasets for multiple instance learning and semi-supervised
learning, as well as on clustering tasks.</p>
    </subsection>
    <subsection id="uid36" level="1">
      <bodyTitle>Multi-Class Cosegmentation</bodyTitle>
      <participants>
        <person key="willow-2009-idm241890401936">
          <firstname>Armand</firstname>
          <lastname>Joulin</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
        <person key="willow-2007-idm119098005552">
          <firstname>Francis</firstname>
          <lastname>Bach</lastname>
        </person>
      </participants>
      <p>Bottom-up, fully unsupervised segmentation remains a daunting
challenge for computer vision. In the cosegmentation context, on the
other hand, the availability of multiple images assumed to contain
instances of the same object classes provides a weak form of
supervision that can be exploited by discriminative approaches.
Unfortunately, most existing algorithms are limited to a very small
number of images and/or object classes (typically two of each). In <ref xlink:href="#sierra-2012-bid10" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we propose a novel energy-minimization approach to cosegmentation
that can handle multiple classes and a significantly larger number of
images. The proposed cost function combines spectral- and
discriminative-clustering terms, and it admits a probabilistic
interpretation. It is optimized using an efficient EM method,
initialized using a convex quadratic approximation of the energy.
Comparative experiments show that the proposed approach matches or
improves the state of the art on several standard datasets.</p>
      <p>Collaboration with the Willow project-team (J. Ponce).</p>
    </subsection>
    <subsection id="uid37" level="1">
      <bodyTitle>A latent factor model for highly multi-relational data
</bodyTitle>
      <participants>
        <person key="cafe-2006-idm360414076672">
          <firstname>Nicolas</firstname>
          <lastname>Le Roux</lastname>
        </person>
        <person key="willow-2009-idm241890428288">
          <firstname>Guillaume</firstname>
          <lastname>Obozinski</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
      </participants>
      <p>Many data such as social networks, movie preferences or knowledge bases are multi-relational, in that they describe multiple relations between entities. While there is a large body of work focused on modeling these data, modeling these multiple types of relations jointly remains challenging. Further, existing approaches tend to breakdown when the number of these types grows. In <ref xlink:href="#sierra-2012-bid11" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we propose a method for modeling large multi relational datasets, with possibly thousands of relations. Our model is based on a bilinear structure, which captures various orders of interaction of the data, and also shares sparse latent factors across different relations. We illustrate the performance of our approach on standard tensor-factorization datasets where we attain, or outperform, state-of-the-art results. Finally, a NLP application demonstrates our scalability and the ability of our model to learn efficient and semantically meaningful verb representations.</p>
      <p>Collaboration with R. Jenatton (CMAP, Ecole Polytechnique) and Antoine Bordes (CNRS, Université de Technologie de Compiégne).
</p>
    </subsection>
    <subsection id="uid38" level="1">
      <bodyTitle>Semi-supervised NMF with time-frequency annotations for single-channel source separation</bodyTitle>
      <participants>
        <person key="willow-2007-idm119098005552">
          <firstname>Francis</firstname>
          <lastname>Bach</lastname>
        </person>
        <person key="willow-2009-idm241890399312">
          <firstname>Augustin</firstname>
          <lastname>Lefèvre</lastname>
          <moreinfo>correspondant</moreinfo>
        </person>
      </participants>
      <p>In <ref xlink:href="#sierra-2012-bid12" location="biblio" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"/>, we formulate a novel extension of nonnegative matrix factorization (NMF) to
take into account partial information
on source-specific activity in the spectrogram.
Results on single-channel source separation show that time-frequency annotations allow to disambiguate the source separation problem,
and learned annotations open the way for a completely
unsupervised learning procedure for source separation with no human intervention.</p>
      <p>Collaboration with C. Févotte (Laboratoire traitement et communication de l'information (LTCI), CNRS: UMR5141 - Institut Télécom - Télécom ParisTech).
</p>
    </subsection>
  </resultats>
  <contrats id="uid39">
    <bodyTitle>Bilateral Contracts and Grants with Industry</bodyTitle>
    <subsection id="uid40" level="1">
      <bodyTitle>Bilateral Grants with Industry</bodyTitle>
      <participants>
        <person key="willow-2007-idm119098005552">
          <firstname>Francis</firstname>
          <lastname>Bach</lastname>
        </person>
      </participants>
      <sanspuceslist>
        <li id="uid41">
          <p noindent="true">Google Research Award: “Large scale adaptive machine learning with finite data sets”.</p>
        </li>
      </sanspuceslist>
    </subsection>
  </contrats>
  <partenariat id="uid42">
    <bodyTitle>Partnerships and Cooperations</bodyTitle>
    <subsection id="uid43" level="1">
      <bodyTitle>National Initiatives</bodyTitle>
      <subsection id="uid44" level="2">
        <bodyTitle>ANR</bodyTitle>
        <subsection id="uid45" level="3">
          <bodyTitle>
            <ref xlink:href="https://sites.google.com/site/anrcalibration/ " location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">Calibration</ref>
          </bodyTitle>
          <participants>
            <person key="select-2006-idm193321381344">
              <firstname>Sylvain</firstname>
              <lastname>Arlot</lastname>
            </person>
          </participants>
          <sanspuceslist>
            <li id="uid46">
              <p noindent="true">S. Arlot, Membre du projet ANR Calibration</p>
            </li>
            <li id="uid47">
              <p noindent="true">Titre: Statistical calibration</p>
            </li>
            <li id="uid48">
              <p noindent="true">Coordinator: University Paris Dauphine</p>
            </li>
            <li id="uid49">
              <p noindent="true">Leader: Vincent Rivoirard</p>
            </li>
            <li id="uid50">
              <p noindent="true">Other members: 34 members, mostly among CEREMADE (Paris Dauphine), Laboratoire Jean-Alexandre Dieudonné (Université de Nice) and Laboratoire de Mathématiques de l'Université Paris Sud</p>
            </li>
            <li id="uid51">
              <p noindent="true">Instrument: ANR Blanc</p>
            </li>
            <li id="uid52">
              <p noindent="true">Duration: Jan 2012 - Dec 2015</p>
            </li>
            <li id="uid53">
              <p noindent="true">Total funding: 240 000 euros</p>
            </li>
            <li id="uid54">
              <p noindent="true">Webpage: <ref xlink:href="https://sites.google.com/site/anrcalibration/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>sites.<allowbreak/>google.<allowbreak/>com/<allowbreak/>site/<allowbreak/>anrcalibration/</ref></p>
            </li>
          </sanspuceslist>
        </subsection>
        <subsection id="uid55" level="3">
          <bodyTitle>
            <ref xlink:href="http://www.di.ens.fr/~arlot/ANR-DETECT.htm " location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">Detect</ref>
          </bodyTitle>
          <participants>
            <person key="select-2006-idm193321381344">
              <firstname>Sylvain</firstname>
              <lastname>Arlot</lastname>
            </person>
            <person key="willow-2007-idm119098005552">
              <firstname>Francis</firstname>
              <lastname>Bach</lastname>
            </person>
            <person key="sierra-2012-idm442940199568">
              <firstname>Rémi</firstname>
              <lastname>Lajugie</lastname>
            </person>
          </participants>
          <sanspuceslist>
            <li id="uid56">
              <p noindent="true">Title: New statistical approaches to computer vision and bioinformatics</p>
            </li>
            <li id="uid57">
              <p noindent="true">Coordinator: Ecole Normale Supérieure (Paris)</p>
            </li>
            <li id="uid58">
              <p noindent="true">Leader of the project: Sylvain Arlot</p>
            </li>
            <li id="uid59">
              <p noindent="true">Other members: J. Sivic (Willow project-team, ENS), A. Celisse (University Lille 1), T. Mary-Huard (AgroParisTech), E. Roquain and F. Villers (University Paris 6).</p>
            </li>
            <li id="uid60">
              <p noindent="true">Instrument: ANR, Young researchers Program</p>
            </li>
            <li id="uid61">
              <p noindent="true">Duration: Sep 2009 - Aug 2012</p>
            </li>
            <li id="uid62">
              <p noindent="true">Total funding: 70000 Euros</p>
            </li>
            <li id="uid63">
              <p noindent="true">See also: <ref xlink:href="http://www.di.ens.fr/~arlot/ANR-DETECT.htm" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>www.<allowbreak/>di.<allowbreak/>ens.<allowbreak/>fr/<allowbreak/>~arlot/<allowbreak/>ANR-DETECT.<allowbreak/>htm</ref></p>
            </li>
            <li id="uid64">
              <p noindent="true">Abstract: The Detect project aims at providing new statistical approaches for detection problems in computer vision (in particular, detecting and recognizing human actions in videos) and bioinformatics (e.g., simultaneously segmenting CGH profiles). These problems are mainly of two different statistical nature: multiple change-point detection (i.e., partitioning a sequence of observations into homogeneous contiguous segments) and multiple tests (i.e., controlling a priori the number of false positives among a large number of tests run simultaneously).</p>
            </li>
          </sanspuceslist>
        </subsection>
      </subsection>
    </subsection>
    <subsection id="uid65" level="1">
      <bodyTitle>European Initiatives</bodyTitle>
      <subsection id="uid66" level="2">
        <bodyTitle>FP7 Projects</bodyTitle>
        <subsection id="uid67" level="3">
          <bodyTitle>
            <ref xlink:href=" http://www.di.ens.fr/~fbach/sierra " location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">SIERRA</ref>
          </bodyTitle>
          <participants>
            <person key="willow-2007-idm119098005552">
              <firstname>Francis</firstname>
              <lastname>Bach</lastname>
              <moreinfo>correspondant</moreinfo>
            </person>
            <person key="sierra-2011-idm457989376096">
              <firstname>Simon</firstname>
              <lastname>Lacoste-Julien</lastname>
            </person>
            <person key="willow-2009-idm241890399312">
              <firstname>Augustin</firstname>
              <lastname>Lefèvre</lastname>
            </person>
            <person key="cafe-2006-idm360414076672">
              <firstname>Nicolas</firstname>
              <lastname>Le Roux</lastname>
            </person>
            <person key="sierra-2011-idm457989367008">
              <firstname>Mark</firstname>
              <lastname>Schmidt</lastname>
            </person>
          </participants>
          <sanspuceslist>
            <li id="uid68">
              <p noindent="true">Title: SIERRA – Sparse structured methods for machine learning</p>
            </li>
            <li id="uid69">
              <p noindent="true">Type: IDEAS</p>
            </li>
            <li id="uid70">
              <p noindent="true">Instrument: ERC Starting Grant (Starting)</p>
            </li>
            <li id="uid71">
              <p noindent="true">Duration: December 2009 - November 2014</p>
            </li>
            <li id="uid72">
              <p noindent="true">Coordinator: Inria
(France)</p>
            </li>
            <li id="uid73">
              <p noindent="true">See also: <ref xlink:href=" http://www.di.ens.fr/~fbach/sierra " location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest"> http://<allowbreak/>www.<allowbreak/>di.<allowbreak/>ens.<allowbreak/>fr/<allowbreak/>~fbach/<allowbreak/>sierra
</ref></p>
            </li>
            <li id="uid74">
              <p noindent="true">Abstract:
Machine learning is now a core part of many research domains, where
the abundance of data has forced researchers to rely on automated
processing of information.
The main current paradigm of application of machine learning
techniques consists in two sequential stages: in the
representation phase, practitioners first build a large set of
features and potential responses for model building or prediction.
Then, in the learning phase, off-the-shelf algorithms are used
to solve the appropriate data processing tasks.
While this has led to significant advances in many domains, the
potential of machine learning techniques is far from being reached:
the tenet of this proposal is that to achieve the expected
breakthroughs, this two-stage paradigm should be replaced by an
integrated process where the</p>
            </li>
          </sanspuceslist>
        </subsection>
      </subsection>
    </subsection>
    <subsection id="uid75" level="1">
      <bodyTitle>International Initiatives</bodyTitle>
      <subsection id="uid76" level="2">
        <bodyTitle>Inria Associate Teams</bodyTitle>
        <subsection id="uid77" level="3">
          <bodyTitle>
            <ref xlink:href="http://www.di.ens.fr/~fbach/statweb.html" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">STATWEB</ref>
          </bodyTitle>
          <participants>
            <person key="willow-2007-idm119098005552">
              <firstname>Francis</firstname>
              <lastname>Bach</lastname>
              <moreinfo>correspondant</moreinfo>
            </person>
            <person key="sierra-2011-idm457989373152">
              <firstname>Ronny</firstname>
              <lastname>Luss</lastname>
            </person>
          </participants>
          <sanspuceslist>
            <li id="uid78">
              <p noindent="true">Title: Fast Statistical Analysis of Web Data via Sparse Learning</p>
            </li>
            <li id="uid79">
              <p noindent="true">Inria principal investigator: Francis Bach</p>
            </li>
            <li id="uid80">
              <p noindent="true">International Partner (Institution - Laboratory - Researcher):</p>
              <sanspuceslist>
                <li id="uid81">
                  <p noindent="true">University of California Berkeley (United States)
- EECS and IEOR Departments - Laurent El Ghaoui</p>
                </li>
              </sanspuceslist>
            </li>
            <li id="uid82">
              <p noindent="true">Duration: 2011 - 2013</p>
            </li>
            <li id="uid83">
              <p noindent="true">See also: <ref xlink:href="http://www.di.ens.fr/~fbach/statweb.html" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>www.<allowbreak/>di.<allowbreak/>ens.<allowbreak/>fr/<allowbreak/>~fbach/<allowbreak/>statweb.<allowbreak/>html</ref></p>
            </li>
            <li id="uid84">
              <p noindent="true">The goal of the proposed research is to provide web-based tools for the analysis and visualization of large corpora of text documents, with a focus on databases of news articles. We intend to use advanced algorithms, drawing from recent progresses in machine learning and statistics, to allow a user to quickly produce a short summary and associated timeline showing how a certain topic is described in news media. We are also interested in unsupervised learning techniques that allow a user to understand the difference between several different news sources, topics or documents.</p>
            </li>
          </sanspuceslist>
        </subsection>
      </subsection>
    </subsection>
    <subsection id="uid85" level="1">
      <bodyTitle>International Research Visitors</bodyTitle>
      <subsection id="uid86" level="2">
        <bodyTitle>Visits of International Scientists</bodyTitle>
        <p>Michael Jordan (U.C. Berkeley, <ref xlink:href="http://www.cs.berkeley.edu/~jordan" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>www.<allowbreak/>cs.<allowbreak/>berkeley.<allowbreak/>edu/<allowbreak/>~jordan</ref>), is spending one year in our team, starting September 2012, financed by the Fondation de Sciences Mathématiques de Paris and Inria.</p>
      </subsection>
    </subsection>
  </partenariat>
  <diffusion id="uid87">
    <bodyTitle>Dissemination</bodyTitle>
    <subsection id="uid88" level="1">
      <bodyTitle>Scientific Animation</bodyTitle>
      <subsection id="uid89" level="2">
        <bodyTitle>Editorial boards</bodyTitle>
        <sanspuceslist>
          <li id="uid90">
            <p noindent="true">F. Bach: Journal of Machine Learning Research, Action Editor.</p>
          </li>
          <li id="uid91">
            <p noindent="true">F. Bach: IEEE Transactions on Pattern Analysis and Machine Intelligence, Associate Editor.</p>
          </li>
          <li id="uid92">
            <p noindent="true">F. Bach: Information and Inference, Associate Editor.</p>
          </li>
          <li id="uid93">
            <p noindent="true">F. Bach: SIAM Journal on Imaging Sciences, Associate Editor.</p>
          </li>
          <li id="uid94">
            <p noindent="true">G. Obozinski: Journal of Machine Learning Research, Member of the Editorial Board.</p>
          </li>
        </sanspuceslist>
      </subsection>
      <subsection id="uid95" level="2">
        <bodyTitle>Area chairs</bodyTitle>
        <sanspuceslist>
          <li id="uid96">
            <p noindent="true">G. Obozinski: International conference on Artificial Intelligence and Statistics (AISTATS) 2012.</p>
          </li>
          <li id="uid97">
            <p noindent="true">F. Bach: International Conference on Machine Learning, 2012.</p>
          </li>
          <li id="uid98">
            <p noindent="true">S. Lacoste-Julien, F. Bach: Conference on Uncertainty in Artificial Intelligence, 2012.</p>
          </li>
        </sanspuceslist>
      </subsection>
      <subsection id="uid99" level="2">
        <bodyTitle>Reviewing</bodyTitle>
        <sanspuceslist>
          <li id="uid100">
            <p noindent="true">Journals: Annals of Statistics, Machine Learning, Journal of Machine Learning Research (JMLR), IEEE Transaction on Information Theory, Transaction in Pattern Recognition and Machine Intelligence (TPAMI), Information and Inference (IMAIAI), Scandinavian Journal of Statistics (SJS), Statistics and Computing (STO), Annales de l'IHP, Annals of Statistics</p>
          </li>
          <li id="uid101">
            <p noindent="true">Conferences: UAI, ECML, NIPS, CVPR, ICML, COLT, AISTATS.</p>
          </li>
        </sanspuceslist>
      </subsection>
      <subsection id="uid102" level="2">
        <bodyTitle>Other</bodyTitle>
        <sanspuceslist>
          <li id="uid103">
            <p noindent="true">S. Arlot is member of the board for the entrance exam in Ecole Normale Supérieure (mathematics, voie B/L).</p>
          </li>
        </sanspuceslist>
      </subsection>
      <subsection id="uid104" level="2">
        <bodyTitle>Workshop and conference organization</bodyTitle>
        <sanspuceslist>
          <li id="uid105">
            <p noindent="true">M. Schmidt, Session Organizer at International Conference on Continuous Optimization (July 27 - August 1, 2013).</p>
          </li>
          <li id="uid106">
            <p noindent="true">G. Obozinski, Co-organiser of the workshop “Sparsity, Dictionaries and Projections in Machine Learning and Signal Processing" at ICML 2012, Edinburgh, Scotland.
<ref xlink:href="http://www.di.ens.fr/~obozinski/ICML2012workshop/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>www.<allowbreak/>di.<allowbreak/>ens.<allowbreak/>fr/<allowbreak/>~obozinski/<allowbreak/>ICML2012workshop/</ref>.</p>
          </li>
          <li id="uid107">
            <p noindent="true">F. Bach: International Conference on Machine Learning, 2012, Workshop co-chair.</p>
          </li>
          <li id="uid108">
            <p noindent="true">F. Bach: Co-organizer of the NIPS workshop on “Analysis Operator Learning vs. Dictionary Learning: Fraternal Twins in Sparse Modeling”, <ref xlink:href="https://sites.google.com/site/dlaoplnips2012/" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">https://<allowbreak/>sites.<allowbreak/>google.<allowbreak/>com/<allowbreak/>site/<allowbreak/>dlaoplnips2012/</ref>.</p>
          </li>
        </sanspuceslist>
      </subsection>
    </subsection>
    <subsection id="uid109" level="1">
      <bodyTitle>Teaching - Supervision - Juries</bodyTitle>
      <subsection id="uid110" level="2">
        <bodyTitle>Teaching</bodyTitle>
        <sanspuceslist>
          <li id="uid111">
            <p noindent="true">Licence : S. Arlot, F. Bach, G. Obozinski, “Apprentissage statistique”, 35h, Ecole Normale Supérieure, Filière “Math-Info”, première année.</p>
          </li>
          <li id="uid112">
            <p noindent="true">Licence: G. Obozinski, Introduction aux modèles graphiques (4h) in Enseignement spécialisé "Apprentissage artificiel" for second year students at Ecole des Mines.</p>
          </li>
          <li id="uid113">
            <p noindent="true">Mastère: S. Arlot and F. Bach, "Statistical learning", 24h, Mastère M2, Université Paris-Sud, France.</p>
          </li>
          <li id="uid114">
            <p noindent="true">Mastère: G. Obozinski, N. Le Roux, Introduction à l'apprentissage machine appliqué aux neurosciences et à la cognition
Co-teaching (6h) in the course of the Master Recherche en Sciences Cognitives co-habilitated by EHESS, ENS and Université Paris Descartes.</p>
          </li>
          <li id="uid115">
            <p noindent="true">Mastère: F. Bach, G. Obozibski, Introduction aux modèles graphiques
(30h), Master MVA (Ecole Normale Supérieure de Cachan).</p>
          </li>
          <li id="uid116">
            <p noindent="true">Doctorat: S. Arlot, "Model selection via penalization, resampling and cross-validation, with application to change-point detection", 6h, Université de Cergy.</p>
          </li>
          <li id="uid117">
            <p noindent="true">Doctorat: G. Obozinski,
Probabilistic graphical models for Information Retrieval,
in the Russian Summer School in Information Retrieval (RuSSIR 2012), Yaroslavl, Russia.</p>
          </li>
          <li id="uid118">
            <p noindent="true">Doctorat: F. Bach,
International Computer Vision Summer School 2012, 3h, Sicily.</p>
          </li>
          <li id="uid119">
            <p noindent="true">Doctorat: F. Bach,
Summer school on Visual Recognition and Machine Learning, 3h, Grenoble.</p>
          </li>
          <li id="uid120">
            <p noindent="true">Doctorat: F. Bach: Machine learning summer school (MLSS), 3h, Kyoto, Japan.</p>
          </li>
        </sanspuceslist>
      </subsection>
      <subsection id="uid121" level="2">
        <bodyTitle>Supervision</bodyTitle>
        <sanspuceslist>
          <li id="uid122">
            <p noindent="true">PhD : Toby Hocking, “Learning algorithms and statistical software,
with applications to bioinformatics”,
ENS Cachan, November 20, 2012, Advisors: F. Bach, J.-P. Vert (Ecole des Mines de Paris - Institut Curie).</p>
          </li>
          <li id="uid123">
            <p noindent="true">PhD: Augustin Lefèvre, “Dictionary learning methods for single-channel audio source separation”, ENS Cachan, October 3, 2012, Advisors: F. Bach and C. Févotte (Telecom Paristech).</p>
          </li>
          <li id="uid124">
            <p noindent="true">PhD: Armand Joulin, “Convex optimization for co-segmentation”, ENS Cachan, December 17, 2012, Advisors: F. Bach and J. Ponce (Willow project-team).</p>
          </li>
        </sanspuceslist>
      </subsection>
    </subsection>
    <subsection id="uid125" level="1">
      <bodyTitle>Invited presentations</bodyTitle>
      <sanspuceslist>
        <li id="uid126">
          <p noindent="true">S. Arlot, "Optimal model selection with V-fold cross-validation: how should V be chosen?", World Congress in Probability and Statistics 2012, Istanbul.</p>
        </li>
        <li id="uid127">
          <p noindent="true">S. Arlot, "Resampling-based estimation of the accuracy of satellite ephemerides", Inaugural Conference of the Laboratory Fibonacci, Scuola Normale Superiore di Pisa, 2012.</p>
        </li>
        <li id="uid128">
          <p noindent="true">S. Arlot, "Choix de V pour la sélection de modèles par validation croisée V-fold en estimation de densité", Séminaire parisien de statistique, IHP, Paris, 2012.</p>
        </li>
        <li id="uid129">
          <p noindent="true">S. Arlot, "Calibration automatique d'estimateurs linéaires à l'aide de pénalités minimales, application à la régression multi-tâches.", Séminaire de Statistique de l'IMT, Toulouse, 2012.</p>
        </li>
        <li id="uid130">
          <p noindent="true">F. Bach, International Conference on Pattern Recognition Applications and Methods, Faro, Portugal,
2012 (keynote speaker).</p>
        </li>
        <li id="uid131">
          <p noindent="true">F. Bach, Rank Prize Symposium (invited talk), Lake District, England, 2012.</p>
        </li>
        <li id="uid132">
          <p noindent="true">F. Bach, University of Cambridge (two seminars), 2012.</p>
        </li>
        <li id="uid133">
          <p noindent="true">F. Bach, Schlumberger workshop on Mathematical Models of Sound Analysis, IHES (invited talk),
2012.</p>
        </li>
        <li id="uid134">
          <p noindent="true">F. Bach, Joint Pattern Recognition Symposium of the German Association for Pattern Recognition
(DAGM) (invited talk), Graz, Austria, 2012.</p>
        </li>
        <li id="uid135">
          <p noindent="true">F. Bach, International Workshop on Machine Learning for Signal Processing (plenary lecture),
Santander, Spain, 2012.</p>
        </li>
        <li id="uid136">
          <p noindent="true">F. Bach, Seminar Max-Planck Institute, Tübingen, October 2012.</p>
        </li>
        <li id="uid137">
          <p noindent="true">E. Grave, Laboratoire d'Informatique de Paris 6, Université Pierre et Marie Curie (Seminar), 2012.</p>
        </li>
        <li id="uid138">
          <p noindent="true">S. Lacoste-Julien, "Harnessing the structure of data for discriminative machine
learning", Colloque du Département d'Informatique et de Recherche
Opérationnelle, Université de Montréal, Montréal, Canada, February
2012</p>
        </li>
        <li id="uid139">
          <p noindent="true">S. Lacoste-Julien, "Structured Alignment Methods in Machine Learning", SMT seminar at
the LIMSI, Orsay, France, July 2012</p>
        </li>
        <li id="uid140">
          <p noindent="true">S. Lacoste-Julien, "Frank-Wolfe optimization insights in machine learning", machine
learning seminar, University of Toronto, Toronto, Canada, August 2012.</p>
        </li>
        <li id="uid141">
          <p noindent="true">S. Lacoste-Julien, "Frank-Wolfe optimization insights in machine learning", Machine
Learning Group seminar, University of Cambridge, Cambridge, UK, August
2012.</p>
        </li>
        <li id="uid142">
          <p noindent="true">S. Lacoste-Julien, "Harnessing the structure of data in machine learning", invited
talk, Department of Engineering Science, University of Oxford, Oxford,
UK, September 2012.</p>
        </li>
        <li id="uid143">
          <p noindent="true">S. Lacoste-Julien, "Frank-Wolfe optimization insights in machine learning", invited
talk, Stanford AI Lab, Stanford University, Stanford, USA, December
2012.</p>
        </li>
        <li id="uid144">
          <p noindent="true">G. Obozinski,
Swiss Statistical Seminar, Bern, Switzerland, April 2012.</p>
        </li>
        <li id="uid145">
          <p noindent="true">G. Obozinski, Séminaire de Statistiques, Université de Pennsylvanie, Philadelphia, PA, USA, May 2012.</p>
        </li>
        <li id="uid146">
          <p noindent="true">G. Obozinski, Séminaire de Statistiques, Université Paris 11, May 2012.</p>
        </li>
        <li id="uid147">
          <p noindent="true">G. Obozinski, Journées de Statistiques (Conférence annuelle de la Société Francaise de Statistiques), Université Libre de Bruxelles, Belgium, May 2012.</p>
        </li>
        <li id="uid148">
          <p noindent="true">G. Obozinski, Congrèss mondial de Probabilités et Statistiques, Istanbul, Turkey, July 2012.</p>
        </li>
        <li id="uid149">
          <p noindent="true">G. Obozinski, séminaire du CEREMADE, Université Paris-Dauphine, December 2012.</p>
        </li>
        <li id="uid150">
          <p noindent="true">M. Schmidt, NAIS Workshop on Advances in Large-Scale Optimization, Edinburgh, May 24-25, 2012.</p>
        </li>
        <li id="uid151">
          <p noindent="true">M. Schmidt, International Symposium on Mathematical Programming, Berlin, August 19-24, 2012.</p>
        </li>
        <li id="uid152">
          <p noindent="true">M. Schmidt, University of British Columbia, "Linearly-Convergent Stochastic-Gradient Methods", Seminar, December 10, 2012.</p>
        </li>
        <li id="uid153">
          <p noindent="true">M. Schmidt, - Simon Fraser University, "Opening up the black box: Faster methods for non-smooth and big-data optimization", Seminar, December 11, 2012.</p>
        </li>
      </sanspuceslist>
    </subsection>
    <subsection id="uid154" level="1">
      <bodyTitle>Prizes and awards</bodyTitle>
      <sanspuceslist>
        <li id="uid155">
          <p noindent="true">M. Schmidt, NSERC Postdoctoral Fellowship (January 2012 - December 2013).</p>
        </li>
        <li id="uid156">
          <p noindent="true">S. Lacoste-Julien, Research in Paris fellowship 2011-2012.</p>
        </li>
        <li id="uid157">
          <p noindent="true">F. Bach: Inria young researcher prize, 2012.</p>
        </li>
        <li id="uid158">
          <p noindent="true">R. Jenatton: Thesis prize from Fondation Hadamard, 2012.</p>
        </li>
        <li id="uid159">
          <p noindent="true">R. Jenatton: Thesis prize from AFIA, accessit, 2012.</p>
        </li>
      </sanspuceslist>
    </subsection>
    <subsection id="uid160" level="1">
      <bodyTitle>Popularization</bodyTitle>
      <sanspuceslist>
        <li id="uid161">
          <p noindent="true">Participation to Inria-Rocquencourt “Fête de la Science”, 2012.</p>
        </li>
      </sanspuceslist>
    </subsection>
  </diffusion>
  <biblio id="bibliography" html="bibliography" numero="10" titre="Bibliography">
    <biblStruct dedoublkey="1672" id="sierra-2012-bid14" type="article" rend="year" n="cite:bach:hal-00621245">
      <identifiant type="hal" value="hal-00621245"/>
      <analytic>
        <title level="a">Structured sparsity through convex optimization</title>
        <author>
          <persName key="willow-2007-idm119098005552">
            <foreName>Francis</foreName>
            <surname>Bach</surname>
            <initial>F.</initial>
          </persName>
          <persName key="willow-2008-idm253693195904">
            <foreName>Rodolphe</foreName>
            <surname>Jenatton</surname>
            <initial>R.</initial>
          </persName>
          <persName key="willow-2007-idm119097976224">
            <foreName>Julien</foreName>
            <surname>Mairal</surname>
            <initial>J.</initial>
          </persName>
          <persName key="willow-2009-idm241890428288">
            <foreName>Guillaume</foreName>
            <surname>Obozinski</surname>
            <initial>G.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" id="rid02378">
        <idno type="issn">0883-4237</idno>
        <title level="j">Statistical Science</title>
        <imprint>
          <biblScope type="volume">27</biblScope>
          <biblScope type="number">4</biblScope>
          <dateStruct>
            <year>2012</year>
          </dateStruct>
          <biblScope type="pages">450-468</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00621245" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00621245</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="0890" id="sierra-2012-bid16" type="article" rend="year" n="cite:friedlander:inria-00626571">
      <identifiant type="doi" value="10.1137/110830629"/>
      <identifiant type="hal" value="inria-00626571"/>
      <analytic>
        <title level="a">Hybrid Deterministic-Stochastic Methods for Data Fitting</title>
        <author>
          <persName>
            <foreName>Michael P.</foreName>
            <surname>Friedlander</surname>
            <initial>M. P.</initial>
          </persName>
          <persName key="sierra-2011-idm457989367008">
            <foreName>Mark</foreName>
            <surname>Schmidt</surname>
            <initial>M.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" id="rid01830">
        <idno type="issn">1064-8275</idno>
        <title level="j">SIAM Journal on Scientific Computing</title>
        <imprint>
          <biblScope type="volume">34</biblScope>
          <biblScope type="number">3</biblScope>
          <dateStruct>
            <year>2012</year>
          </dateStruct>
          <biblScope type="pages">A1380-A1405</biblScope>
          <ref xlink:href="http://hal.inria.fr/inria-00626571" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>inria-00626571</ref>
        </imprint>
      </monogr>
      <note type="bnote">22 pages</note>
    </biblStruct>
    <biblStruct dedoublkey="1139" id="sierra-2012-bid15" type="article" rend="year" n="cite:jenatton:inria-00589785">
      <identifiant type="doi" value="10.1137/110832380"/>
      <identifiant type="hal" value="inria-00589785"/>
      <analytic>
        <title level="a">Multi-scale Mining of fMRI data with Hierarchical Structured Sparsity</title>
        <author>
          <persName key="willow-2008-idm253693195904">
            <foreName>Rodolphe</foreName>
            <surname>Jenatton</surname>
            <initial>R.</initial>
          </persName>
          <persName key="odyssee-2006-idm405611837616">
            <foreName>Alexandre</foreName>
            <surname>Gramfort</surname>
            <initial>A.</initial>
          </persName>
          <persName key="select-2007-idm133980334544">
            <foreName>Vincent</foreName>
            <surname>Michel</surname>
            <initial>V.</initial>
          </persName>
          <persName key="willow-2009-idm241890428288">
            <foreName>Guillaume</foreName>
            <surname>Obozinski</surname>
            <initial>G.</initial>
          </persName>
          <persName>
            <foreName>Evelyn</foreName>
            <surname>Eger</surname>
            <initial>E.</initial>
          </persName>
          <persName key="willow-2007-idm119098005552">
            <foreName>Francis</foreName>
            <surname>Bach</surname>
            <initial>F.</initial>
          </persName>
          <persName key="parietal-2008-idm343501673536">
            <foreName>Bertrand</foreName>
            <surname>Thirion</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" id="rid01825">
        <idno type="issn">1936-4954</idno>
        <title level="j">SIAM Journal on Imaging Sciences</title>
        <imprint>
          <biblScope type="volume">5</biblScope>
          <biblScope type="number">3</biblScope>
          <dateStruct>
            <month>July</month>
            <year>2012</year>
          </dateStruct>
          <biblScope type="pages">835-856</biblScope>
          <ref xlink:href="http://hal.inria.fr/inria-00589785" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>inria-00589785</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="1148" id="sierra-2012-bid13" type="article" rend="year" n="cite:solnon:hal-00610534">
      <identifiant type="hal" value="hal-00610534"/>
      <analytic>
        <title level="a">Multi-task Regression using Minimal Penalties</title>
        <author>
          <persName key="willow-2010-idm1079619392">
            <foreName>Matthieu</foreName>
            <surname>Solnon</surname>
            <initial>M.</initial>
          </persName>
          <persName key="select-2006-idm193321381344">
            <foreName>Sylvain</foreName>
            <surname>Arlot</surname>
            <initial>S.</initial>
          </persName>
          <persName key="willow-2007-idm119098005552">
            <foreName>Francis</foreName>
            <surname>Bach</surname>
            <initial>F.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-editorial-board="yes" x-international-audience="yes" id="rid01276">
        <idno type="issn">1532-4435</idno>
        <title level="j">Journal of Machine Learning Research</title>
        <imprint>
          <biblScope type="volume">13</biblScope>
          <dateStruct>
            <month>September</month>
            <year>2012</year>
          </dateStruct>
          <biblScope type="pages">2773-2812</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00610534" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00610534</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="4143" id="sierra-2012-bid3" type="inproceedings" rend="year" n="cite:bach:hal-00681128">
      <identifiant type="hal" value="hal-00681128"/>
      <analytic>
        <title level="a">On the Equivalence between Herding and Conditional Gradient Algorithms</title>
        <author>
          <persName key="willow-2007-idm119098005552">
            <foreName>Francis</foreName>
            <surname>Bach</surname>
            <initial>F.</initial>
          </persName>
          <persName key="sierra-2011-idm457989376096">
            <foreName>Simon</foreName>
            <surname>Lacoste-Julien</surname>
            <initial>S.</initial>
          </persName>
          <persName key="willow-2009-idm241890428288">
            <foreName>Guillaume</foreName>
            <surname>Obozinski</surname>
            <initial>G.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">ICML 2012 International Conference on Machine Learning</title>
        <loc>Edimburgh, United Kingdom</loc>
        <imprint>
          <dateStruct>
            <year>2012</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00681128" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00681128</ref>
        </imprint>
        <meeting id="cid32516">
          <title>International Conference on Machine Learning</title>
          <num>29</num>
          <abbr type="sigle">ICML</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="4122" id="sierra-2012-bid17" type="inproceedings" rend="year" n="cite:buchman:hal-00717714">
      <identifiant type="hal" value="hal-00717714"/>
      <analytic>
        <title level="a">On Sparse, Spectral and Other Parameterizations of Binary Probabilistic Models</title>
        <author>
          <persName>
            <foreName>David</foreName>
            <surname>Buchman</surname>
            <initial>D.</initial>
          </persName>
          <persName key="sierra-2011-idm457989367008">
            <foreName>Mark</foreName>
            <surname>Schmidt</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>Shakir</foreName>
            <surname>Mohamed</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>David</foreName>
            <surname>Poole</surname>
            <initial>D.</initial>
          </persName>
          <persName>
            <foreName>Nando</foreName>
            <surname>De Freitas</surname>
            <initial>N.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">AISTATS 2012 - 15th International Conference on Artificial Intelligence and Statistics</title>
        <loc>La Palma, Spain</loc>
        <imprint>
          <dateStruct>
            <year>2012</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00717714" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00717714</ref>
        </imprint>
        <meeting id="cid388734">
          <title>International Conference on Artificial Intelligence and Statistics</title>
          <num>15</num>
          <abbr type="sigle">AISTATS</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="2483" id="sierra-2012-bid11" type="inproceedings" rend="year" n="cite:jenatton:hal-00776335">
      <identifiant type="hal" value="hal-00776335"/>
      <analytic>
        <title level="a">A latent factor model for highly multi-relational data</title>
        <author>
          <persName key="willow-2008-idm253693195904">
            <foreName>Rodolphe</foreName>
            <surname>Jenatton</surname>
            <initial>R.</initial>
          </persName>
          <persName key="cafe-2006-idm360414076672">
            <foreName>Nicolas</foreName>
            <surname>Le Roux</surname>
            <initial>N.</initial>
          </persName>
          <persName>
            <foreName>Antoine</foreName>
            <surname>Bordes</surname>
            <initial>A.</initial>
          </persName>
          <persName key="willow-2009-idm241890428288">
            <foreName>Guillaume</foreName>
            <surname>Obozinski</surname>
            <initial>G.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">Neural Information Processing Systems (NIPS)</title>
        <loc>Lake Tahoe, Nevada, États-Unis</loc>
        <imprint>
          <dateStruct>
            <year>2012</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00776335" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00776335</ref>
        </imprint>
        <meeting id="cid29560">
          <title>Annual Conference on Neural Information Processing Systems</title>
          <num>23</num>
          <abbr type="sigle">NIPS</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="2394" id="sierra-2012-bid9" type="inproceedings" rend="year" n="cite:joulin:hal-00717450">
      <identifiant type="hal" value="hal-00717450"/>
      <analytic>
        <title level="a">A convex relaxation for weakly supervised classifiers</title>
        <author>
          <persName key="willow-2009-idm241890401936">
            <foreName>Armand</foreName>
            <surname>Joulin</surname>
            <initial>A.</initial>
          </persName>
          <persName key="willow-2007-idm119098005552">
            <foreName>Francis</foreName>
            <surname>Bach</surname>
            <initial>F.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">ICML 2012 International Conference on Machine Learning</title>
        <loc>Edinburgh, United Kingdom</loc>
        <imprint>
          <dateStruct>
            <month>June</month>
            <year>2012</year>
          </dateStruct>
          <biblScope type="pages">641</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00717450" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00717450</ref>
        </imprint>
        <meeting id="cid32516">
          <title>International Conference on Machine Learning</title>
          <num>29</num>
          <abbr type="sigle">ICML</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="3975" id="sierra-2012-bid10" type="inproceedings" rend="year" n="cite:joulin:hal-00717448">
      <identifiant type="hal" value="hal-00717448"/>
      <analytic>
        <title level="a">Multi-Class Cosegmentation</title>
        <author>
          <persName key="willow-2009-idm241890401936">
            <foreName>Armand</foreName>
            <surname>Joulin</surname>
            <initial>A.</initial>
          </persName>
          <persName key="willow-2007-idm119098005552">
            <foreName>Francis</foreName>
            <surname>Bach</surname>
            <initial>F.</initial>
          </persName>
          <persName key="willow-2007-idm119098021056">
            <foreName>Jean</foreName>
            <surname>Ponce</surname>
            <initial>J.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">CVPR 2012 : 25th IEEE Conference on Computer Vision and Pattern Recognition</title>
        <loc>Providence, United States</loc>
        <imprint>
          <dateStruct>
            <month>June</month>
            <year>2012</year>
          </dateStruct>
          <biblScope type="pages">0109</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00717448" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00717448</ref>
        </imprint>
        <meeting id="cid82398">
          <title>IEEE International Conference on Computer Vision and Pattern Recognition</title>
          <num>2012</num>
          <abbr type="sigle">CVPR</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="4575" id="sierra-2012-bid12" type="inproceedings" rend="year" n="cite:lefevre:hal-00717366">
      <identifiant type="hal" value="hal-00717366"/>
      <analytic>
        <title level="a">Semi-supervised NMF with time-frequency annotations for single-channel source separation</title>
        <author>
          <persName key="willow-2009-idm241890399312">
            <foreName>Augustin</foreName>
            <surname>Lefèvre</surname>
            <initial>A.</initial>
          </persName>
          <persName key="willow-2007-idm119098005552">
            <foreName>Francis</foreName>
            <surname>Bach</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Cédric</foreName>
            <surname>Févotte</surname>
            <initial>C.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">ISMIR 2012 : 13th International Society for Music Information Retrieval Conference</title>
        <loc>Porto, Portugal</loc>
        <imprint>
          <dateStruct>
            <month>October</month>
            <year>2012</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00717366" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00717366</ref>
        </imprint>
        <meeting id="cid95673">
          <title>International Society for Music Information Retrieval Conference</title>
          <num>13</num>
          <abbr type="sigle">ISMIR</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="3775" id="sierra-2012-bid6" type="inproceedings" rend="year" n="cite:pedregosa:hal-00717990">
      <identifiant type="hal" value="hal-00717990"/>
      <analytic>
        <title level="a">Learning to rank from medical imaging data</title>
        <author>
          <persName key="parietal-2009-idm302557838896">
            <foreName>Fabian</foreName>
            <surname>Pedregosa</surname>
            <initial>F.</initial>
          </persName>
          <persName key="odyssee-2006-idm405611837616">
            <foreName>Alexandre</foreName>
            <surname>Gramfort</surname>
            <initial>A.</initial>
          </persName>
          <persName key="parietal-2008-idm343501667328">
            <foreName>Gaël</foreName>
            <surname>Varoquaux</surname>
            <initial>G.</initial>
          </persName>
          <persName>
            <foreName>Elodie</foreName>
            <surname>Cauvet</surname>
            <initial>E.</initial>
          </persName>
          <persName>
            <foreName>Christophe</foreName>
            <surname>Pallier</surname>
            <initial>C.</initial>
          </persName>
          <persName key="parietal-2008-idm343501673536">
            <foreName>Bertrand</foreName>
            <surname>Thirion</surname>
            <initial>B.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">MLMI 2012 - 3rd International Workshop on Machine Learning in Medical Imaging</title>
        <loc>Nice, France</loc>
        <imprint>
          <publisher>
            <orgName type="organisation">Inria</orgName>
          </publisher>
          <dateStruct>
            <month>July</month>
            <year>2012</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00717990" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00717990</ref>
        </imprint>
        <meeting id="cid389732">
          <title>MICCAI Workshop on Machine Learning in Medical Imaging</title>
          <num>2012</num>
          <abbr type="sigle">MLMI</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="3613" id="sierra-2012-bid5" type="inproceedings" rend="year" n="cite:pedregosa:hal-00717954">
      <identifiant type="hal" value="hal-00717954"/>
      <analytic>
        <title level="a">Improved brain pattern recovery through ranking approaches</title>
        <author>
          <persName key="parietal-2009-idm302557838896">
            <foreName>Fabian</foreName>
            <surname>Pedregosa</surname>
            <initial>F.</initial>
          </persName>
          <persName key="odyssee-2006-idm405611837616">
            <foreName>Alexandre</foreName>
            <surname>Gramfort</surname>
            <initial>A.</initial>
          </persName>
          <persName key="parietal-2008-idm343501667328">
            <foreName>Gaël</foreName>
            <surname>Varoquaux</surname>
            <initial>G.</initial>
          </persName>
          <persName key="parietal-2008-idm343501673536">
            <foreName>Bertrand</foreName>
            <surname>Thirion</surname>
            <initial>B.</initial>
          </persName>
          <persName>
            <foreName>Christophe</foreName>
            <surname>Pallier</surname>
            <initial>C.</initial>
          </persName>
          <persName>
            <foreName>Elodie</foreName>
            <surname>Cauvet</surname>
            <initial>E.</initial>
          </persName>
        </author>
      </analytic>
      <monogr x-international-audience="yes" x-proceedings="yes">
        <title level="m">PRNI 2012 : 2nd International Workshop on Pattern Recognition in NeuroImaging</title>
        <loc>London, United Kingdom</loc>
        <imprint>
          <dateStruct>
            <month>July</month>
            <year>2012</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00717954" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00717954</ref>
        </imprint>
        <meeting id="cid538352">
          <title>IEEE International Workshop on Pattern Recognition in NeuroImaging</title>
          <num>2012</num>
          <abbr type="sigle">PRNI</abbr>
        </meeting>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="5929" id="sierra-2012-bid19" type="techreport" rend="year" n="cite:jenatton:hal-00737152">
      <identifiant type="hal" value="hal-00737152"/>
      <monogr>
        <title level="m">Local stability and robustness of sparse dictionary learning in the presence of noise</title>
        <author>
          <persName key="willow-2008-idm253693195904">
            <foreName>Rodolphe</foreName>
            <surname>Jenatton</surname>
            <initial>R.</initial>
          </persName>
          <persName key="metiss-2006-idm235968094256">
            <foreName>Rémi</foreName>
            <surname>Gribonval</surname>
            <initial>R.</initial>
          </persName>
          <persName key="willow-2007-idm119098005552">
            <foreName>Francis</foreName>
            <surname>Bach</surname>
            <initial>F.</initial>
          </persName>
        </author>
        <imprint>
          <publisher>
            <orgName type="institution">HAL-Inria</orgName>
          </publisher>
          <dateStruct>
            <month>October</month>
            <year>2012</year>
          </dateStruct>
          <biblScope type="pages">41</biblScope>
          <ref xlink:href="http://hal.inria.fr/hal-00737152" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00737152</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    <biblStruct dedoublkey="5965" id="sierra-2012-bid18" type="techreport" rend="year" n="cite:kadri:hal-00677012">
      <identifiant type="hal" value="hal-00677012"/>
      <monogr>
        <title level="m">Multiple Operator-valued Kernel Learning</title>
        <author>
          <persName key="sequel-2008-idm13200184608">
            <foreName>Hachem</foreName>
            <surname>Kadri</surname>
            <initial>H.</initial>
          </persName>
          <persName>
            <foreName>Alain</foreName>
            <surname>Rakotomamonjy</surname>
            <initial>A.</initial>
          </persName>
          <persName key="willow-2007-idm119098005552">
            <foreName>Francis</foreName>
            <surname>Bach</surname>
            <initial>F.</initial>
          </persName>
          <persName key="sequel-2006-idm391148966784">
            <foreName>Philippe</foreName>
            <surname>Preux</surname>
            <initial>P.</initial>
          </persName>
        </author>
        <imprint>
          <biblScope type="number">RR-7900</biblScope>
          <publisher>
            <orgName type="institution">Inria</orgName>
          </publisher>
          <dateStruct>
            <month>March</month>
            <year>2012</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00677012" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00677012</ref>
        </imprint>
      </monogr>
      <note type="typdoc">Research Report</note>
    </biblStruct>
    <biblStruct dedoublkey="5767" id="sierra-2012-bid1" type="techreport" rend="year" n="cite:obozinski:hal-00694765">
      <identifiant type="hal" value="hal-00694765"/>
      <monogr>
        <title level="m">Convex Relaxation for Combinatorial Penalties</title>
        <author>
          <persName key="willow-2009-idm241890428288">
            <foreName>Guillaume</foreName>
            <surname>Obozinski</surname>
            <initial>G.</initial>
          </persName>
          <persName key="willow-2007-idm119098005552">
            <foreName>Francis</foreName>
            <surname>Bach</surname>
            <initial>F.</initial>
          </persName>
        </author>
        <imprint>
          <publisher>
            <orgName type="institution">HAL-Inria</orgName>
          </publisher>
          <dateStruct>
            <month>May</month>
            <year>2012</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00694765" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00694765</ref>
        </imprint>
      </monogr>
      <note type="bnote">35 page</note>
      <note type="typdoc">Report</note>
    </biblStruct>
    <biblStruct dedoublkey="6327" id="sierra-2012-bid2" type="unpublished" rend="year" n="cite:arlot:hal-00671174">
      <identifiant type="hal" value="hal-00671174"/>
      <monogr>
        <title level="m">Kernel change-point detection</title>
        <author>
          <persName key="select-2006-idm193321381344">
            <foreName>Sylvain</foreName>
            <surname>Arlot</surname>
            <initial>S.</initial>
          </persName>
          <persName key="modal-2011-idm448863566768">
            <foreName>Alain</foreName>
            <surname>Celisse</surname>
            <initial>A.</initial>
          </persName>
          <persName key="lear-2010-idm32410115776">
            <foreName>Zaid</foreName>
            <surname>Harchaoui</surname>
            <initial>Z.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <year>2012</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00671174" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00671174</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="6430" id="sierra-2012-bid21" type="unpublished" rend="year" n="cite:bach:hal-00723365">
      <identifiant type="hal" value="hal-00723365"/>
      <monogr>
        <title level="m">Sharp analysis of low-rank kernel matrix approximations</title>
        <author>
          <persName key="willow-2007-idm119098005552">
            <foreName>Francis</foreName>
            <surname>Bach</surname>
            <initial>F.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <year>2012</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00723365" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00723365</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="6334" id="sierra-2012-bid20" type="unpublished" rend="year" n="cite:hocking:hal-00663790">
      <identifiant type="hal" value="hal-00663790"/>
      <monogr>
        <title level="m">Learning smoothing models of copy number profiles using breakpoint annotations</title>
        <author>
          <persName key="willow-2009-idm241890407184">
            <foreName>Toby Dylan</foreName>
            <surname>Hocking</surname>
            <initial>T. D.</initial>
          </persName>
          <persName>
            <foreName>Gudrun</foreName>
            <surname>Schleiermacher</surname>
            <initial>G.</initial>
          </persName>
          <persName>
            <foreName>Isabelle</foreName>
            <surname>Janoueix-Lerosey</surname>
            <initial>I.</initial>
          </persName>
          <persName>
            <foreName>Olivier</foreName>
            <surname>Delattre</surname>
            <initial>O.</initial>
          </persName>
          <persName key="willow-2007-idm119098005552">
            <foreName>Francis</foreName>
            <surname>Bach</surname>
            <initial>F.</initial>
          </persName>
          <persName>
            <foreName>Jean-Philippe</foreName>
            <surname>Vert</surname>
            <initial>J.-P.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <year>2012</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00663790" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00663790</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="6450" id="sierra-2012-bid8" type="unpublished" rend="year" n="cite:lacostejulien:hal-00720158">
      <identifiant type="hal" value="hal-00720158"/>
      <monogr>
        <title level="m">Stochastic Block-Coordinate Frank-Wolfe Optimization for Structural SVMs</title>
        <author>
          <persName key="sierra-2011-idm457989376096">
            <foreName>Simon</foreName>
            <surname>Lacoste-Julien</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Martin</foreName>
            <surname>Jaggi</surname>
            <initial>M.</initial>
          </persName>
          <persName key="sierra-2011-idm457989367008">
            <foreName>Mark</foreName>
            <surname>Schmidt</surname>
            <initial>M.</initial>
          </persName>
          <persName>
            <foreName>Patrick</foreName>
            <surname>Pletscher</surname>
            <initial>P.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <year>2012</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00720158" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00720158</ref>
        </imprint>
      </monogr>
      <note type="bnote">13 pages main text + 13 pages appendix (short version). Under review</note>
    </biblStruct>
    <biblStruct dedoublkey="6431" id="sierra-2012-bid7" type="unpublished" rend="year" n="cite:lacostejulien:hal-00768180">
      <identifiant type="hal" value="hal-00768180"/>
      <monogr>
        <title level="m">SiGMa: Simple Greedy Matching for Aligning Large Knowledge Bases</title>
        <author>
          <persName key="sierra-2011-idm457989376096">
            <foreName>Simon</foreName>
            <surname>Lacoste-Julien</surname>
            <initial>S.</initial>
          </persName>
          <persName>
            <foreName>Konstantina</foreName>
            <surname>Palla</surname>
            <initial>K.</initial>
          </persName>
          <persName>
            <foreName>Alex</foreName>
            <surname>Davies</surname>
            <initial>A.</initial>
          </persName>
          <persName>
            <foreName>Gjergji</foreName>
            <surname>Kasneci</surname>
            <initial>G.</initial>
          </persName>
          <persName>
            <foreName>Thore</foreName>
            <surname>Graepel</surname>
            <initial>T.</initial>
          </persName>
          <persName>
            <foreName>Zoubin</foreName>
            <surname>Ghahramani</surname>
            <initial>Z.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <month>July</month>
            <year>2012</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00768180" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00768180</ref>
        </imprint>
      </monogr>
      <note type="bnote">10 pages + 2 pages appendix; 5 figures – initial preprint</note>
    </biblStruct>
    <biblStruct dedoublkey="6228" id="sierra-2012-bid0" type="unpublished" rend="year" n="cite:leroux:hal-00674995">
      <identifiant type="hal" value="hal-00674995"/>
      <monogr>
        <title level="m">A Stochastic Gradient Method with an Exponential Convergence Rate for Strongly-Convex Optimization with Finite Training Sets</title>
        <author>
          <persName key="cafe-2006-idm360414076672">
            <foreName>Nicolas</foreName>
            <surname>Le Roux</surname>
            <initial>N.</initial>
          </persName>
          <persName key="sierra-2011-idm457989367008">
            <foreName>Mark</foreName>
            <surname>Schmidt</surname>
            <initial>M.</initial>
          </persName>
          <persName key="willow-2007-idm119098005552">
            <foreName>Francis</foreName>
            <surname>Bach</surname>
            <initial>F.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <year>2012</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00674995" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00674995</ref>
        </imprint>
      </monogr>
    </biblStruct>
    <biblStruct dedoublkey="6480" id="sierra-2012-bid4" type="unpublished" rend="year" n="cite:lerasle:hal-00743931">
      <identifiant type="hal" value="hal-00743931"/>
      <monogr>
        <title level="m"><formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>V</mi></math></formula>-fold cross-validation and <formula type="inline"><math xmlns="http://www.w3.org/1998/Math/MathML" overflow="scroll"><mi>V</mi></math></formula>-fold penalization in least-squares density estimation</title>
        <author>
          <persName>
            <foreName>Matthieu</foreName>
            <surname>Lerasle</surname>
            <initial>M.</initial>
          </persName>
          <persName key="select-2006-idm193321381344">
            <foreName>Sylvain</foreName>
            <surname>Arlot</surname>
            <initial>S.</initial>
          </persName>
        </author>
        <imprint>
          <dateStruct>
            <year>2012</year>
          </dateStruct>
          <ref xlink:href="http://hal.inria.fr/hal-00743931" location="extern" xlink:type="simple" xlink:show="replace" xlink:actuate="onRequest">http://<allowbreak/>hal.<allowbreak/>inria.<allowbreak/>fr/<allowbreak/>hal-00743931</ref>
        </imprint>
      </monogr>
    </biblStruct>
  </biblio>
</raweb>
