1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
|
\documentclass[12pt, handout]{beamer}
\input{style/style.tex}
\begin{document}
\frame{\titlepage}
\begin{frame}\frametitle{Motivation}
\begin{tcolorbox}[title=Context]
Heterogeneous datacenter architectures are common ~\cite{DBLP:conf/date/MilojicicFDR21} and
modern computational needs of AI drive managers to diversify datacenters even more~\cite{DBLP:journals/computer/AthavaleBBMMPS24}.
In result datacenters become extremely complex and hard to operate with millions of CPU's, GPU's etc.
\end{tcolorbox}
\begin{center}
\includegraphics[width=\linewidth]{images/datacenter_complexity.pdf}
\end{center}
\tiny
\textbf{Figure 1.1:} Society depends on datacenters to keep running, and therefore we cannot afford to let these systems break down or experience significant performance-related issues.
With millions of servers in the largest datacenters, real-time management becomes very difficult.
Left to right: a Google datacenter, server racks, Ada Lovelace AD102 GPU architecture.
\end{frame}
\begin{frame}\frametitle{Problem Statement}
\begin{tcolorbox}[title=We need tools to tackle datacenter complexity]
We need Datacenter Digital Twins (DCDT) to be better able to detect and solve issues in this critical infrastructure~\cite{DBLP:journals/computer/AthavaleBBMMPS24}.
However, DCDT's are still actively developed, and lack crucial features \emph{e.g.,} predictive analytics~\cite{DBLP:usdoe/report/AP26894} to prevent unexpected job failures.
\end{tcolorbox}
\end{frame}
\begin{frame}\frametitle{Research Questions}
\begin{tcolorbox}[title=Main Research Question, colbacktitle=red!70!black,colback=red!20!white]
How to enable predictive analytics for datacenters through digital twinning?
\end{tcolorbox}
\begin{tcolorbox}[title=Research Question 1]
How to asses the current state-of-the-art of digital twinning for datacenters?
\end{tcolorbox}
\begin{tcolorbox}[title=Research Question 2]
How to design a datacenter digital twin reference architecture using discrete-event simulation and predictive data analytics?
\end{tcolorbox}
\begin{tcolorbox}[title=Research Question 3]
How to evaluate and validate a datacenter digital twin architecture in relation to system requirements?
\end{tcolorbox}
\end{frame}
\begin{frame}\frametitle{\textbf{RQ1}: System Model}
\end{frame}
\begin{frame}\frametitle{\textbf{RQ2}: Reference Architecture}
\end{frame}
\begin{frame}\frametitle{\textbf{RQ3}: Experimental Results I}
\end{frame}
\begin{frame}\frametitle{\textbf{RQ3}: Experimental Results II}
\end{frame}
\begin{frame}\frametitle{Discussion}
\end{frame}
\setcounter{framenumber}{4}
\setbeamertemplate{footline}[page number]{
% Unfortunately this must remain here.
\setbeamercolor{frametitle}{fg=Brown,bg=Brown!20}
\setbeamertemplate{frametitle}{
\vspace*{-0.1cm}
\begin{beamercolorbox}[wd=\paperwidth, ht=0.75cm, dp=0.3cm,leftskip=10pt, rightskip=10pt]{frametitle}
\usebeamerfont{frametitle}\insertframetitle\hfill
\end{beamercolorbox}
}
\begin{frame}[allowframebreaks]\frametitle{Extra Slides: References}
\tiny
\bibliographystyle{is-plain}
\bibliography{main.bib}
\end{frame}
\begin{frame}\frametitle{Extra Slides: Societal Impact}
\begin{tcolorbox}[title=Why is this research important today?]
Over 3 million jobs in the Netherlands directly depend on cloud services, which are hosted in datacenters~\cite{DBLP:journals/corr/IosupKLVG22}.
Already the rapid
expansion of datacenters has increased the presence of service failures across all cloud
services~\cite{DBLP:conf/acsos/TalluriOVTI21}.
We need to act now.
\end{tcolorbox}
\begin{center}
\includegraphics[height=10em]{images/IosupLVG22-2_cropped.pdf}
\end{center}
\tiny
\textbf{Figure E.1:} Horizontally: the most important research areas in computer science in Netherlands.
Vertically: qualities we should ensure across all research areas with the most outstanding impact on society.
Datacenter manageability is a top-priority~\cite{DBLP:journals/corr/IosupKLVG22}.
\end{frame}
\begin{frame}\frametitle{Extra Slides: Why Digital Twinning?}
\begin{tcolorbox}[title=Definition]
A DCDT mirrors the structure, context and behaviour of a datacenter~\cite{DBLP:journals/computer/AthavaleBBMMPS24}. The prerequisite to any digital twin is good monitoring and sensing capabilities in the physical entity.
Datacenters meet this requirement easily because they already connect hundreds of monitoring sensors. \end{tcolorbox}
\begin{center}
\includegraphics[height=10em]{images/TaoIEEE2019-3_cropped.pdf}
\end{center}
\tiny
\textbf{Figure E.2:} Due to insufficient technological foundations,
little work is available on DTs between 2003 and 2018, and it is only with the rapid growth
of cloud computing, Internet-of-Things and Big Data analytics that DTs have reemerged~\cite{DBLP:conf/cirp/TAO2018169}.
That is why nobody used digital twins to mirror datacenters earlier.
\end{frame}
\begin{frame}\frametitle{Extra Slides: Why not pure simulation?}
\begin{tcolorbox}[title=Predicting job failures]
Preventing failure-caused outages in advance
can reduce huge operational costs, as over 20\% of all reported outages amount to more than 1 million
US\$~\cite{DBLP:report/AnnualOutageAnalysis2025}.
Only a constant bi-directional interaction (digital twin $\iff$ physical entity) can achieve this.
\end{tcolorbox}
\begin{center}
\includegraphics[height=10em]{images/AthavaleBBMMPS24-3_cropped.pdf}
\end{center}
\tiny \textbf{Figure E.3:} Real-time control that is tightly-coupled with the IT equipment is a prerequisite for timely predictions within seconds/minutes~\cite{DBLP:journals/computer/AthavaleBBMMPS24}.
\end{frame}
% Computational Fluid Dynamics (CFD) have high computation overhead, unsuitable for real-time simulation of a dynamic datacenter.
%Moreover oftentimes a poorly configured CFD model can lead to high error rates~\cite{DBLP:conf/sensys/WangZD0TCWZ20}.
%Data-driven Machine Learning performs poorly by the cases not covered in the training data.
\end{document}
|