X-Git-Url: https://git.auder.net/?a=blobdiff_plain;f=communication%2Fslides%2Fslides.tex;fp=communication%2Fslides%2Fslides.tex;h=8606bdae5e27fdb2f837cb69fa809293d6a9b02a;hb=769ea203f7dae481c270e8ba6569d33ae4044817;hp=0000000000000000000000000000000000000000;hpb=3e5dbc70596573851076afe1f5121eefdc02b567;p=ppam-mpi.git

diff --git a/communication/slides/slides.tex b/communication/slides/slides.tex
new file mode 100644
index 0000000..8606bda
--- /dev/null
+++ b/communication/slides/slides.tex
@@ -0,0 +1,534 @@
+\input{startdoc.tex}
+
+\usepackage{tikz}
+\usepackage{array}
+
+\usepackage[utf8]{inputenc}
+\usepackage{amsmath, amsfonts}
+%\usepackage[francais]{babel}
+\usepackage{hyperref, url, caption, tikz}
+\usepackage{wrapfig}
+%\usepackage{graphicx}
+%\hypersetup{colorlinks,linkcolor=black,urlcolor=violet}
+
+\mode<presentation>{
+  \setbeamertemplate{sections/subsections in toc}[square]
+  \beamertemplatenavigationsymbolsempty
+}
+
+%\newcommand{\N}{\mathbb{N}}                          % naturals
+\newcommand{\set}[1]{\lbrace#1\rbrace}               % set
+%\newcommand{\R}{\mathbb{R}}         % real
+
+\colorlet{darkred}{red!80!black}
+\colorlet{darkblue}{blue!80!black}
+\colorlet{darkgreen}{green!60!black}
+
+\usetikzlibrary{calc,decorations.pathmorphing,patterns}
+\pgfdeclaredecoration{penciline}{initial}{
+    \state{initial}[width=+\pgfdecoratedinputsegmentremainingdistance,
+    auto corner on length=1mm,]{
+        \pgfpathcurveto% "penciline": one Bezier curve per input segment; arguments are {support 1}{support 2}{end point}
+        {% Support point 1 (historically labelled "From"): x = remaining segment distance, y = segment amplitude
+            \pgfqpoint{\pgfdecoratedinputsegmentremainingdistance}
+                      {\pgfdecorationsegmentamplitude}
+        }
+        {%  Support point 2: (remaining distance, 0pt) plus (-aspect * remaining distance, \pgfmathresult * amplitude), \pgfmathresult being set by \pgfmathrand
+        \pgfmathrand
+        \pgfpointadd{\pgfqpoint{\pgfdecoratedinputsegmentremainingdistance}{0pt}}
+                    {\pgfqpoint{-\pgfdecorationsegmentaspect
+                     \pgfdecoratedinputsegmentremainingdistance}%
+                               {\pgfmathresult\pgfdecorationsegmentamplitude}
+                    }
+        }
+        {% End point of the curve: last point of the input segment, offset by (1pt,1pt)
+        \pgfpointadd{\pgfpointdecoratedinputsegmentlast}{\pgfpoint{1pt}{1pt}}
+        }
+    }
+    \state{final}{}
+}
+%
+\tikzset{block/.style={draw,rectangle,thick,minimum height=2em,minimum width=2em}}% boxed-node style "block"; \tikzset supersedes the deprecated \tikzstyle
+
+%~ \usetikzlibrary{calc,decorations.pathmorphing,patterns}
+%~ \pgfdeclaredecoration{penciline}{initial}{
+    %~ \state{initial}[width=+\pgfdecoratedinputsegmentremainingdistance,
+    %~ auto corner on length=1mm,]{
+        %~ \pgfpathcurveto%
+        %~ {% From
+            %~ \pgfqpoint{\pgfdecoratedinputsegmentremainingdistance}
+                      %~ {\pgfdecorationsegmentamplitude}
+        %~ }
+        %~ {%  Control 1
+        %~ \pgfmathrand
+        %~ \pgfpointadd{\pgfqpoint{\pgfdecoratedinputsegmentremainingdistance}{0pt}}
+                    %~ {\pgfqpoint{-\pgfdecorationsegmentaspect
+                     %~ \pgfdecoratedinputsegmentremainingdistance}%
+                               %~ {\pgfmathresult\pgfdecorationsegmentamplitude}
+                    %~ }
+        %~ }
+        %~ {%TO 
+        %~ \pgfpointadd{\pgfpointdecoratedinputsegmentlast}{\pgfpoint{1pt}{1pt}}
+        %~ }
+    %~ }
+    %~ \state{final}{}
+%~ }
+%~ %
+%~ \tikzstyle{block} = [draw,rectangle,thick,minimum height=2em,minimum width=2em]
+%~ \colorlet{darkred}{red!80!black}
+%~ \colorlet{darkblue}{blue!80!black}
+%~ \colorlet{darkgreen}{green!60!black}
+
+%\newcommand*\mystrut[1]{\vrule width0pt height0pt depth#1\relax}
+%http://tex.stackexchange.com/questions/13843/vertical-spacing-with-underbrace-command
+
+\title[Clustering de courbes de charge EDF]
+{Clustering de courbes de charge EDF%\\
+%Application Ã  la prÃ©vision de la qualitÃ© de l'air
+\vspace*{0.5cm}}
+\author[Benjamin Auder, Jairo Cugliari]
+{Benjamin Auder \inst{1}\\[0.2cm]Jairo Cugliari \inst{2}\hspace*{0.6cm}\vspace*{1cm}}
+\date[]{}
+\institute[]{\inst{1} CNRS Orsay / Université Paris-Sud\hspace*{1.3cm} \and
+\inst{2} Laboratoire ERIC / Université Lumière Lyon 2}
+%~ \titlegraphic{
+	%~ \includegraphics[width=2cm]{logo_eric.png}\hspace*{4.75cm}~%
+	%~ \includegraphics[width=2cm]{logo_lyon2.jpg}
+%~ }
+
+\begin{document}
+
+\begin{frame}
+\vspace*{0.5cm}
+\titlepage
+\end{frame}
+
+\begin{frame}{Contexte industriel}
+
+\begin{columns}
+
+\column{0.5\textwidth}
+Smartgrid \& Smart meters : 35M compteurs individuels donnant de l'information en temps réel.\\[0.7cm]
+$\Rightarrow$ \textbf{Beaucoup} de données.\\[1cm]
+%\textcolor{white}{$\Rightarrow$} problèmes informatiques : protocoles de transfert, sécurité, \dots
+Comment les traiter ?
+
+\column{0.5\textwidth} 
+\includegraphics[width = \textwidth]{smartgrid.jpg}\\
+\includegraphics[width = \textwidth]{linky.jpg} 
+
+\end{columns}
+
+\end{frame}
+
+\begin{frame}{Des données variées, à différentes échelles}
+
+\begin{figure}[!ht] \centering
+  \begin{minipage}[c]{0.48\textwidth}
+     \includegraphics[width=\textwidth,height=3.45cm]{longtermload.png}
+     \vspace*{-0.35cm}
+%     \vspace*{-0.85cm}
+     \caption{Tendance à long terme} %\label{fig:gull}
+  \end{minipage}%
+  ~ %spacing between images
+  \begin{minipage}[c]{0.48\textwidth}
+     \includegraphics[width=\textwidth,height=3.45cm]{twoyearsload.png}
+     \vspace*{-0.35cm}
+%     \vspace*{-0.85cm}
+     \caption{Cyclicité semaine} %     \label{fig:tiger}
+  \end{minipage}
+  ~\\[-0.05cm]
+  \begin{minipage}[c]{0.48\textwidth}
+     \includegraphics[width=\textwidth,height=3.45cm]{dailyloads.png}
+     \vspace*{-0.35cm}
+%     \vspace*{-0.85cm}
+     \caption{Moyenne journalière} %   \label{fig:mouse}
+  \end{minipage}
+  ~ %spacing between images
+  \begin{minipage}[c]{0.48\textwidth}
+     \includegraphics[width=\textwidth,height=3.45cm]{consotemp.png}
+     \vspace*{-0.35cm}
+%     \vspace*{-0.85cm}
+     \caption{Conso. vs. température}
+  \end{minipage}
+\end{figure}
+
+\end{frame}
+
+\begin{frame}{Découpage en tranches non stationnaires}
+
+Si $\exists \delta \ll D$, tel que les séries $\delta$-agrégées soient stationnaires,\\
+on les agrège et les traite comme des processus stationnaires.\\[0.3cm]
+
+\begin{columns}
+  \column{6cm}    
+    \input{tikz/axis2}
+   ~
+  \column{5cm}
+	\vspace*{-1cm}
+     \[ Z_k(t) = X(t + (k-1)\delta)             \]
+     \[  k\in\mathbb{N} \;\;\; \forall t \in [0,\delta) \]
+\end{columns}
+
+\textbf{\emph{Mais...}} 
+Une série temporelle représentant un phénomène complexe 
+\textcolor{white}{\textbf{\emph{Mais...}} }est en général clairement non stationnaire.\\[0.5cm]
+
+$\Rightarrow$ On décide de tenir compte de chaque point de discrétisation.
+
+%Par exemple, la consommation Ã©lectrique moyenne sur une semaine varie
+
+%~ \vfill
+  %~ If $X$ contents a $\delta-$seasonal component, 
+     %~ $Z$ is particularly fruitful.
+
+%~ C'est pas vraiment notre cas : saisonnier Ã  plusieurs echelles
+%~ ==> objectif : tout prendre en compte
+
+\end{frame}
+
+\begin{frame}{Réduction de dimension}
+
+Données enregistrées toutes les 30 minutes pendant un an :\\
+$48 \times 365 =$ \textbf{17520 points de discrétisation}.\\[0.3cm]
+
+\vspace*{-0.4cm}
+\begin{figure}[!ht]
+\centering
+\includegraphics[width=\textwidth,height=5.5cm]{3centers.png}
+\vspace*{-0.35cm}
+%\vspace*{-0.95cm}
+\caption{Trois types de courbes de charge \emph{(données irlandaises)}}% présentant différents régimes}%{[Spoiler] Cinq centres de clusters}
+\end{figure}
+
+\vspace*{-0.3cm}
+$\Rightarrow$ Il faut déterminer une représentation parcimonieuse, capturant\\
+\textcolor{white}{$\Rightarrow$ }bien les variations localisées. On choisit une base d'ondelettes.\\[0.5cm]
+%TODO: placer l'equation puis sa version discrète.
+
+\end{frame}
+
+\begin{frame}{Wavelets to cope with \textsc{fd}}
+
+\begin{columns}
+  \column{.6\textwidth}
+ %\begin{figure}
+ \centering
+ \includegraphics[width = \textwidth]{./pics/weekly-5.png}
+  % * * * * * * * *  * * * * * * * * * * *
+  \column{.4\textwidth}
+\begin{footnotesize}
+\begin{itemize}
+ \item domain-transform technique for hierarchically decomposing finite-energy signals
+ \item description in terms of a broad trend (\textcolor{PineGreen}{approximation part}), plus a set of localized changes kept in the \textcolor{red}{detail parts}.
+\end{itemize}
+\end{footnotesize}
+\end{columns}
+
+\vspace*{-0.1cm}
+\begin{block}{Discrete Wavelet Transform }
+\begin{footnotesize}
+  If $z \in L_2([0, 1])$ we can write it as
+  \vspace*{-0.4cm}
+   \begin{equation*}\label{eq:zeta}
+     z(t) = \sum_{k=0}^{2^{j_0}-1} \textcolor{PineGreen}{c_{j_0, k}} \phi_{j_0,k} (t)  + 
+        \sum_{j={j_0}}^{\infty} 
+           \sum_{k=0}^{2^j-1} \textcolor{red}{d_{j,k}} \psi_{j,k} (t) ,
+   \end{equation*}
+%
+~\\[-0.6cm]
+where $ c_{j,k} = \langle z, \phi_{j,k} \rangle $, $ d_{j,k} = \langle z, \psi_{j,k} \rangle $ are the 
+\textcolor{PineGreen}{scale coefficients} and \textcolor{red}{wavelet coefficients} respectively, and the functions $\phi$ and $\psi$ are associated to an orthogonal \textsc{mra} of $L_2([0, 1])$.
+\end{footnotesize}
+\end{block}
+\end{frame}
+
+%---------------------------------------- SLIDE ---------------------
+
+\begin{frame}{Energy decomposition of the DWT}
+
+\begin{block}{ }
+ \begin{itemize}
+  \item Energy conservation of the signal
+\vspace*{-0.15cm}
+  \begin{equation*}\label{eq:energy}  
+     \| z \|_H^2    \approx     \| \widetilde{z_J} \|_2^2 
+        = c_{0,0}^2 + \sum_{j=0}^{J-1} \sum_{k=0}^{2^j-1} d_{j,k} ^2  = 
+                     c_{0,0}^2 + \sum_{j=0}^{J-1} \| \mathbf{d}_{j} \|_2^2.
+  \end{equation*}
+%  \item characterization by the set of channel variances estimated at the output of the corresponding filter bank
+ \item For each $j=0,1,\ldots,J-1$, we compute the absolute and 
+ relative contribution representations by
+\vspace*{-0.15cm}      
+   \[ \underbrace{\text{cont}_j = \|\mathbf{d}_j\|_2^2}_{\fbox{AC}}  
+      \qquad  \text{and}  \qquad
+       \underbrace{\text{rel}_j  = 
+     \frac{\|\mathbf{d}_j\|_2^2}
+          {\sum_{l=0}^{J-1} \|\mathbf{d}_l\|_2^2 }}_{\fbox{RC}} .\]
+ \item They quantify the relative importance of the scales to the global dynamic.
+% \item Only the wavelet coefficients $\set{d_{j,k}}$ are used.
+ \item RC normalizes the energy of each signal to 1.
+\end{itemize}
+\end{block}
+\end{frame}
+
+%===========================================================================================
+% fin de l'intro...
+%===========================================================================================
+
+\begin{frame}{Objectif}
+
+\begin{figure}[!ht]\centering
+  \includegraphics[width = \textwidth]{pics/schema.png} 
+%\caption{Hierarchical structure of $N$ individual clients among $K$ groups.}\label{fig:schema-hier}
+\end{figure}
+
+Regroupement par tarifs, zones géographiques, types de clients \dots\\[0.3cm]
+
+$\Rightarrow$ \textbf{Idée} : clustering pour déterminer ces groupes.\\[0.3cm]
+
+\textcolor{white}{$\Rightarrow$ }\textbf{Méthode} : paralléliser un algorithme classique.
+
+%~ functional clustering
+%~ wavelets to reduce dimension
+%~ open MPI to cluster a bounded number of vectors at a time
+
+\end{frame}
+
+\begin{frame}{Fonction objectif}
+
+On cherche à minimiser la distorsion
+\[ \Delta = \sum_{i=1}^{n} \min_{k=1,\dots,K} \| x_i - c_k \|_2 \]
+avec pour variables les $\{c_1,\dots,c_K\} \subset \{x_1,\dots,x_n\}, c_i \neq c_j \,  \forall i \neq j$.\\[0.3cm]
+
+C'est un problème NP-dur {\footnotesize (O. Kariv \& S. L. Hakimi, \emph{An Algorithmic Approach to Network Location Problems. II: The p-Medians})}.\\[0.1cm]
+%SIAM J. Appl. Math., 37(3), 539â560. (22 pages)
+%~ C'est-Ã -dire :
+%~ \begin{itemize}
+%~ \item Soit $P$ le problÃ¨me de dÃ©cision associÃ© : $P(c_1,\dots,c_k) = 1$ si $(c_1,\dots,c_k)$ est optimal, 0 sinon.
+%~ \item Soit $C$ un problÃ¨me de dÃ©cision bien connu comme Ã©tant NP-complet
+%~ \item Il existe un algorithme ...
+%~ \end{itemize}
+
+Pire : garantir un facteur $(1+\varepsilon)$ de l'optimum est NP-dur 
+{\footnotesize (J-H. Lin \& J. S. Vitter, \emph{$\varepsilon$-Approximations with Minimum Packing Constraint Violation})}.\\[0.2cm]%(Extended Abstract)
+
+\begin{block}{NP : ``Non-deterministic Polynomial-time algorithms''}
+{\footnotesize Exécution en temps polynomial sur une machine de Turing non déterministe.}
+\end{block}
+
+\begin{block}{NP-dur}
+``Au moins aussi dur que le plus complexe des problèmes NP''
+\end{block}
+
+%~ Tous les algorithmes existants dÃ©terminant les $c_k$ sont donc des heuristiques d'approximation
+%~ ...et parler de la parallÃ©lisation ??! donc 16 slides au total.
+%NP-complet : c'est Ã  dire... expliquer.
+%Algos existants = heuristiques pr s'approcher de l'optimum (d'un...)
+
+\end{frame}
+
+\begin{frame}{Algorithme PAM}
+
+%PAM : montrer algo, dire comment on parallÃ©lise naÃ¯vement
+
+\begin{enumerate}
+\setcounter{enumi}{-1}
+\item Initialize: randomly select (without replacement) $K$ of the $n$ data points as the medoids.
+\item Associate each data point to the closest medoid. (``closest'' here is defined using any valid distance metric, most commonly Euclidean distance, Manhattan distance or Minkowski distance).
+\item For each medoid $m$\\
+\quad For each non-medoid data point $o$ \emph{in the same cluster}\\
+\quad\quad Swap $m$ and $o$ and compute the total cost.
+\item Select the configuration with the lowest cost.\\
+If any change occurred in the medoids, go to step 1.
+\end{enumerate}
+
+\begin{block}{Réduire le coût des étapes 2 et 3 ?}
+\begin{itemize}
+\item Dans R, pam(do.swap=FALSE) supprime les étapes 2 et 3.
+\item A. P. Reynolds et al. (2006) : quelques astuces algorithmiques.
+\end{itemize}
+\end{block}
+
+\end{frame}
+
+\begin{frame}{Parallélisation}
+
+\begin{block}{Deux approches (entre autres)}
+\begin{itemize}
+\item Découpage de l'espace en $Z < K$ zones, et recherche de $K/Z$ clusters dans chaque zone.
+\item Partition des données $P_1,\dots,P_Z$ puis clustering à $K$ groupes dans chaque $P_k$. 
+(Puis ``fusion'' des médoïdes).
+\end{itemize}
+\end{block}
+
+~\\[-0.1cm]
+{\footnotesize
+Choix de la seconde alternative et implémentation avec OpenMPI :
+\begin{enumerate}
+\setcounter{enumi}{-1}
+\item Le processus ``maître'' a pour numéro 0. Il divise les données en sous-ensembles de cardinal au plus 
+$C$ ($C = 5000$ par exemple). Il envoie ensuite une tâche de clustering par sous-ensemble, et attend les résultats.
+\item Chaque processus ``esclave'' (numérotés de 1 à $p-1$) reçoit une liste de (références de) courbes, qu'il récupère 
+et classe via l'algorithme PAM. Il retourne les centres au processus 0.
+\item Si on obtient plus de $C$ médoïdes, on recommence depuis l'étape 1. Sinon, on applique une dernière 
+fois l'algorithme PAM (sur les médoïdes).
+\end{enumerate}
+}
+
+\end{frame}
+
+\begin{frame}{Exécution du programme}
+
+\vspace*{-0.5cm}
+\begin{figure}
+\includegraphics[width=\linewidth,height=8cm]{pics/screen_demo.png}
+	%~ \vspace*{-0.35cm}
+	%~ \caption{Groupe 1}
+\end{figure}
+
+\end{frame}
+
+\begin{frame}{Application I: Electricity Smart Meter CBT}
+
+%\footnotetext[1]{\textit{Irish Social Science Data Archive}, }
+
+\begin{itemize}
+ \item 4621 Irish households smart meter data 
+ (\href{http://www.ucd.ie/issda/data/}{ISSDA})
+ % esÃ©ries de consommation Ã©lectrique de foyers irlandais
+ \item About 25K discretization points 
+ \item We test with $K=$ 3 or 5 classes
+ \item We compare sequential and parallel versions 
+\end{itemize}
+
+\begin{table}[H]
+\centering
+\begin{tabular}{lcc}                       \hline
+% &            &       \\
+ & Distortion & (Internal) adequacy  \\ \hline
+3 clusters sequential & 1.90e7 & 0.90   \\
+3 clusters parallel   & 2.15e7 & 0.90   \\
+5 clusters sequential & 1.61e7 & 0.89   \\
+5 clusters parallel   & 1.84e7 & 0.89   \\ \hline
+\end{tabular}
+%  \caption{Distorsions et indices d'adÃ©quation des partitions}
+\end{table}
+
+\textbf{Adequacy :} given $P_1 = (i_1,\dots,i_n)$ and $P_2 = (j_1,\dots,j_n)$,\\
+\textcolor{white}{\textbf{Adequacy :}} find a matching which maximizes $S = \sum_{k=1}^{n} \mathbf{1}_{i_k = j_k}$\\
+\textcolor{white}{\textbf{Adequacy :}} (Hungarian algorithm), and then return $S/n$.
+
+\end{frame}
+
+\begin{frame}{Application II: Starlight curves}
+
+\begin{itemize}
+ \item Data from \href{http://www.cs.ucr.edu/~eamonn/time_series_data/}{UCR Time Series Classification/Clustering}
+ %\url{http://www.cs.ucr.edu/~eamonn/time_series_data/}}
+ \item 1000 curves learning set + 8236 validation set ($d = 1024$)% discretization points
+\end{itemize}
+
+\begin{figure}[H]
+\begin{minipage}[c]{.32\linewidth}
+	\includegraphics[width=\linewidth,height=3.5cm]{pics/slgr1.png}
+	\vspace*{-0.35cm}
+	\caption{Groupe 1}
+\end{minipage}
+\begin{minipage}[c]{.32\linewidth}
+	\includegraphics[width=\linewidth,height=3.5cm]{pics/slgr2.png}
+	\vspace*{-0.35cm}
+	\caption{Groupe 2}
+\end{minipage}
+\begin{minipage}[c]{.32\linewidth}
+	\includegraphics[width=\linewidth,height=3.5cm]{pics/slgr3.png}
+	\vspace*{-0.35cm}
+	\caption{Groupe 3}
+\end{minipage}
+\end{figure}
+
+\begin{footnotesize}
+\vspace*{-0.3cm}
+\begin{table}[H]
+\centering
+\begin{tabular}{lccc}                           \hline
+ &            & \multicolumn{2}{c}{Adequacy} \\
+ & Distortion & Internal & External          \\ \hline
+Training (sequential) & 1.31e4 & 0.79 & 0.77 \\
+Training (parallel)   & 1.40e4 & 0.79 & 0.68 \\
+Test (sequential)     & 1.09e5 & 0.78 & 0.76 \\
+Test (parallel)       & 1.15e5 & 0.78 & 0.69 \\ \hline
+\end{tabular}
+%\caption{Distorsions et indices d'adÃ©quation des partitions}
+\end{table}
+\end{footnotesize}
+
+\end{frame}
+
+\begin{frame}{Conclusion}
+
+%~ On peut clusteriser
+%~ Faudrait etre moins naif
+%~ Faudrait aussi Ã©tendre/gÃ©nÃ©raliser le code...
+
+\begin{block}{Résumé}
+\begin{itemize}
+\itemsep0.1em
+\item Les smartmètres mesurent la charge électrique pour chaque client, en temps réel $\Rightarrow$ données fonctionnelles.
+\item Les ondelettes fournissent des représentations parcimonieuses tout en préservant la nature fonctionnelle des données.
+\item L'analyse de ces représentations à l'aide de l'algorithme PAM permet d'identifier des groupes de clients.
+\item L'algorithme PAM est appliqué en parallèle sur des jeux de données de tailles raisonnables.
+\end{itemize}
+\end{block}
+
+% \item \textit{Divide-and-Conquer} approach thanks to MPI library %pour l'algorithme des $k$-mÃ©doÃ¯des : d'abord  sur des groupes de donnÃ©es courbes, puis des groupes de mÃ©doÃ¯des jusqu'Ã  obtenir un seul ensemble traitÃ© sur un processseur.
+ %\item %Les rÃ©sultats obtenus sur les deux jeux de donnÃ©es prÃ©sentÃ©s sont assez encourageants, et permettent d'envisager une utilisation Ã  plus grande Ã©chelle.
+%\end{itemize}
+
+\begin{exampleblock}{Perspectives}
+\begin{itemize}
+\itemsep0.1em
+\item L'étude des groupes de clients peut donner lieu à l'élaboration de $K$ modèles prédictifs spécialisés.
+\item La méthode de clustering parallèle proposée peut être adaptée pour traiter les 35M séries (sur un supercalculateur ?).
+%\item Apply the algorithm over many hundreds of processors
+\end{itemize}
+\end{exampleblock}
+
+\end{frame}
+
+\begin{frame}{Références}
+
+\begin{thebibliography}{4}
+\bibitem{1} \textcolor{black}{A. Antoniadis, X. Brossat, J. Cugliari, J.-M. Poggi} (2013), Clustering Functional Data Using Wavelets, \textcolor{black}{\textit{Wavelets, Multiresolution and Information Processing}, 11(1), 35--64}
+
+\bibitem{2} \textcolor{black}{A. Arbelaez, L. Quesada} (2013), Parallelising the k-Medoids Clustering Problem Using Space-Partitioning, \textcolor{black}{\textit{Symposium on Combinatorial Search}, AAAI Publications}
+
+\bibitem{3} \textcolor{black}{R. Bekkerman, M. Bilenko, J. Langford - éditeurs} (2011), 
+Scaling up Machine Learning: Parallel and Distributed Approaches, \textcolor{black}{Cambridge University Press}
+
+\bibitem{4} \textcolor{black}{A. P. Reynolds, G. Richards, B. de la Iglesia, V. J. Rayward-Smith} (2006), Clustering Rules: A Comparison of Partitioning and Hierarchical Clustering Algorithms, \textcolor{black}{\textit{Mathematical Modelling and Algorithms}, 5(4), 475--504}
+
+%\bibitem{3} P. Berkhin (2006), A Survey of Clustering Data Mining Techniques, {\it Grouping Multidimensional Data, Ã©diteurs : J. Kogan, C. Nicholas, M. Teboulle}.
+
+%\bibitem{6} J. Dean et S. Ghemawat (2004), MapReduce: Simplified Data Processing on Large Clusters, {\it Sixth Symposium on Operating System Design and Implementation}.
+
+%\bibitem{7} G. De Francisci Morales et A. Bifet (2013), G. De Francisci Morales SAMOA: A Platform for Mining Big Data Streams Keynote Talk at RAMSS â13: 2nd International Workshop on Real-Time Analysis and Mining of Social Streams WWW, Rio De Janeiro
+
+%\bibitem{10} L. Kaufman et P.J. Rousseeuw (1987), Clustering by means of Medoids, {\it Statistical Data Analysis Based on the L\_1-Norm and Related Methods, Ã©diteur : Y. Dodge}.
+\end{thebibliography}
+
+%[2013] A. Antoniadis, X. Brossat, J. Cugliari & J.-M. Poggi. Clustering functional data using Wavelets Inter. J. of Wavelets, Multiresolution and Information Procesing. doi:10.1142/S0219691313500033
+
+%~ Scaling up Machine Learning: Parallel and Distributed Approaches [Anglais] [ReliÃ©]
+%~ Ron Bekkerman (Sous la direction de), Mikhail Bilenko (Sous la direction de), John Langford
+
+\end{frame}
+
+\begin{frame}
+
+\centering
+\includegraphics[width=7cm,height=7cm]{Questions.jpg}
+
+\end{frame}
+
+\end{document}