\documentclass[12pt, handout]{beamer} \input{style/style.tex} \begin{document} \frame{\titlepage} \begin{frame}\frametitle{Motivation} \begin{tcolorbox}[title=Context] Heterogeneous datacenter architectures are common~\cite{DBLP:conf/date/MilojicicFDR21} due to the end of Dennard's scaling~\cite{DBLP:image/48Microprocessor/Rupp}. Today, computational needs of AI drive managers to diversify datacenters even more~\cite{DBLP:journals/computer/AthavaleBBMMPS24}. In result datacenters become extremely complex and hard to operate. \end{tcolorbox} \begin{minipage}[t]{0.45\linewidth} \tiny {\centering \includegraphics[width=1.05\linewidth]{images/48-years-processor-trend-2.pdf} } \textbf{Figure 1.1:} 48 years of microprocessor trend data. Legend: \textcolor{Orange}{$\bigblacktriangleup$ Transistors (thousands)}, \textcolor{Blue}{$\lgblkcircle$ Single Thread Performance (SpecINT $\times 10^3$)}, \textcolor{Green}{$\lgblksquare$ Frequency (MHz)}, \textcolor{Maroon}{$\bigblacktriangledown$ Typical Power (Watts)}, $\mdlgblkdiamond$ Number of Logical Cores~\cite{DBLP:image/48Microprocessor/Rupp}. \end{minipage} \hspace{0.5cm} \begin{minipage}[t]{0.45\linewidth} {\centering \includegraphics[width=1.1\linewidth]{images/AthavaleBBMMPS24_cropped.pdf} } \tiny \textbf{Figure 1.2:} Explosive growth in AI computational requirements drives datacenter upgrades (source: NVIDIA Analysis: reproduction with NVIDIA permission by~\cite{DBLP:journals/computer/AthavaleBBMMPS24}). \end{minipage} \end{frame} \begin{frame}\frametitle{Problem Statement} \begin{tcolorbox}[title=We need effective tools to manage datacenters] To address the increasing datacenter complexity, Datacenter Digital Twins (DCDT) were proposed~\cite{DBLP:journals/computer/AthavaleBBMMPS24}. However, many DCDT's are not useful in practice, because they lack critical features (\emph{e.g.,} predictive analytics) native to the generic Digital Twin definition~\cite{DBLP:usdoe/report/AP26894}. \end{tcolorbox} \input{images/table.tex} \end{frame} \begin{frame}\frametitle{Research Questions} \begin{tcolorbox}[title=Main Research Question, colbacktitle=red!70!black,colback=red!20!white] How to enable predictive analytics for datacenters through digital twinning? \end{tcolorbox} \begin{tcolorbox}[title=Research Question 1] How to asses the current state-of-the-art of digital twinning for datacenters? \end{tcolorbox} \begin{tcolorbox}[title=Research Question 2] How to design a datacenter digital twin reference architecture using discrete-event simulation and predictive data analytics? \end{tcolorbox} \begin{tcolorbox}[title=Research Question 3] How to evaluate and validate a datacenter digital twin architecture in relation to system requirements? \end{tcolorbox} \end{frame} \begin{frame}\frametitle{\textbf{RQ1}: System Model} \end{frame} \begin{frame}\frametitle{\textbf{RQ2}: Reference Architecture} \end{frame} \begin{frame}\frametitle{\textbf{RQ3}: Experimental Results I} \end{frame} \begin{frame}\frametitle{\textbf{RQ3}: Experimental Results II} \end{frame} \begin{frame}\frametitle{Discussion} \end{frame} \begin{frame}[allowframebreaks]\frametitle{References} \tiny \bibliographystyle{is-plain} \bibliography{main.bib} \end{frame} % Unfortunately this must remain here. \setbeamercolor{frametitle}{fg=Brown,bg=Brown!20} \setbeamertemplate{frametitle}{ \vspace*{-0.1cm} \begin{beamercolorbox}[wd=\paperwidth, ht=0.75cm, dp=0.3cm,leftskip=10pt, rightskip=10pt]{frametitle} \usebeamerfont{frametitle}\insertframetitle\hfill \end{beamercolorbox} } \begin{frame}\frametitle{Extra Slides: Societal Impact} \begin{tcolorbox}[title=Why is this research important today?] Over 3 million jobs in the Netherlands directly depend on cloud services, which are hosted in datacenters~\cite{DBLP:journals/corr/IosupKLVG22}. Already the rapid expansion of datacenters has increased the presence of service failures across all cloud services~\cite{DBLP:conf/acsos/TalluriOVTI21}. We need to act now. \end{tcolorbox} \begin{center} \includegraphics[height=10em]{images/IosupLVG22-2_cropped.pdf} \end{center} \tiny \textbf{Figure E.1:} Horizontally: the most important research areas in computer science in Netherlands. Vertically: qualities we should ensure across all research areas with the most outstanding impact on society. Datacenter manageability is a top-priority~\cite{DBLP:journals/corr/IosupKLVG22}. \end{frame} \begin{frame}\frametitle{Extra Slides: Why Digital Twinning?} \begin{tcolorbox}[title=Definition] A DCDT mirrors the structure, context and behaviour of a datacenter~\cite{DBLP:journals/computer/AthavaleBBMMPS24}. The prerequisite to any digital twin is good monitoring and sensing capabilities in the physical entity. Datacenters meet this requirement easily because they already connect hundreds of monitoring sensors. \end{tcolorbox} \begin{center} \includegraphics[height=10em]{images/TaoIEEE2019-3_cropped.pdf} \end{center} \tiny \textbf{Figure E.2:} Due to insufficient technological foundations, little work is available on DTs between 2003 and 2018, and it is only with the rapid growth of cloud computing, Internet-of-Things and Big Data analytics that DTs have reemerged~\cite{DBLP:conf/cirp/TAO2018169}. That is why nobody used digital twins to mirror datacenters earlier. \end{frame} \begin{frame}\frametitle{Extra Slides: Why \emph{not} pure simulation?} \begin{tcolorbox}[title=Predicting job failures] Preventing failure-caused outages in advance can reduce huge operational costs, as over 20\% of all reported outages amount to more than 1 million US\$~\cite{DBLP:report/AnnualOutageAnalysis2025}. Only a constant bi-directional interaction (digital twin $\iff$ physical entity) can achieve this. \end{tcolorbox} \begin{center} \includegraphics[height=10em]{images/AthavaleBBMMPS24-3_cropped.pdf} \end{center} \tiny \textbf{Figure E.3:} Real-time control that is tightly-coupled with the IT equipment is a prerequisite for timely predictions within seconds/minutes~\cite{DBLP:journals/computer/AthavaleBBMMPS24}. \end{frame} % Computational Fluid Dynamics (CFD) have high computation overhead, unsuitable for real-time simulation of a dynamic datacenter. %Moreover oftentimes a poorly configured CFD model can lead to high error rates~\cite{DBLP:conf/sensys/WangZD0TCWZ20}. %Data-driven Machine Learning performs poorly by the cases not covered in the training data. \end{document}