summaryrefslogtreecommitdiff
path: root/main.tex
diff options
context:
space:
mode:
Diffstat (limited to 'main.tex')
-rw-r--r--main.tex60
1 files changed, 34 insertions, 26 deletions
diff --git a/main.tex b/main.tex
index c600fb7..32b7591 100644
--- a/main.tex
+++ b/main.tex
@@ -23,16 +23,14 @@
\begin{tcolorbox}[title=DCDT's lack predictive analytics]
We need Datacenter Digital Twins (DCDT) to be better able to detect and solve issues in critical ICT infrastructure~\cite{DBLP:journals/computer/AthavaleBBMMPS24}.
However, DCDT's are still actively developed and lack crucial features such as predictive analytics~\cite{DBLP:usdoe/report/AP26894} to \emph{e.g.,} prevent unexpected failures.
- With predictive analysis (\emph{e.g.,} simulation) DCDT's could save millions of lost \$USD~\cite{DBLP:conf/acsos/TalluriOVTI21}.
\end{tcolorbox}
\begin{center}
\includegraphics[width=0.9\linewidth]{images/predictive_analytics.pdf}
\end{center}
\tiny
- \textbf{Figure 1.2:} Where does our work fit within the field of datacenter digital twinning?
- There are 5 core elements to any Digital Twin: \myCircled{A} The Digital $\rightarrow$ Physical Twin link, \myCircled{B} the Physical Twin (\emph{e.g.,} the datacenter), \myCircled{C} the Physical $\rightarrow$ Digital Twin link, \myCircled{D} the Digital Twin, \myCircled{E} the features necessary to any Digital Twin.
- \textcolor{Green}{\faHighlighter~Highlighted areas are the contributions from this thesis, which include the autonomous actions resulting from predictive insights \myCircledGreen{A} and the predictive analysis itself within \myCircledGreen{E}.}
+ \textbf{Figure 1.2:} Datacenter Digital Twin Diagram. There are 5 core elements to any Digital Twin: \myCircled{A} The Digital $\rightarrow$ Physical Twin link, \myCircled{B} the Physical Twin (\emph{e.g.,} the datacenter), \myCircled{C} the Physical $\rightarrow$ Digital Twin link, \myCircled{D} the Digital Twin, \myCircled{E} the features necessary to any Digital Twin.
+ \textcolor{Green}{\faHighlighter~Highlighted areas are the contributions from this thesis, which include the autonomous actions resulting from predictive insights \myCircledGreen{A} and the predictive analysis framework (including simple storage capabilities) within \myCircledGreen{E}.}
\end{frame}
\begin{frame}\frametitle{Research Questions}
@@ -56,13 +54,13 @@
\begin{frame}\frametitle{\textbf{RQ1}: Literature Review I}
\begin{tcolorbox}[title=Main Finding I]
- The literature on DCDTs is scarce.
+ The literature on DCDTs is sparse.
Some systems barely classify as DTs (\emph{e.g.,} Kalibre~\cite{DBLP:conf/sensys/WangZD0TCWZ20}, ChatTwin~\cite{DBLP:conf/sensys/LiW0Z0T23}).
Existing deployments specialize in \textcolor{Red}{Cooling and Heat Modelling}, together with \textcolor{Red}{3D visualizations}.
Most lack predictive modelling of DC operations.
\end{tcolorbox}
\vspace{-0.1cm}
- \input{images/table.tex}
+ \input{sources/table.tex}
% Research on DTs for datacenters have been separate, siloed efforts focused on either datacenter cooling, network performance, power consumption or visualization efforts.
% CFD usually means Navier-Stokes equations.
% CFD models take ages to compute.
@@ -72,11 +70,11 @@
% Mandatory: split the figure into 2: top and bottom, and that way you can fill in the entire slide nicely.
\begin{tcolorbox}[title=A holistic DCDT system model]
- We propose a generic model of datacenter digital twinning that can be mapped to each system from \textbf{Table 1.1}. Within this model (see \textbf{Fig. 1.3}) we introduce a concept of the \emph{Digital Thread}: a bridge between the DCDT and the physical DC equipment.
+ We propose a holistic model of datacenter digital twinning that can be mapped to each system from \textbf{Table 1.1}. Within this model (see \textbf{Fig. 1.3}) we introduce a concept of the \emph{Digital Thread}: a bridge between the DCDT and the physical DC equipment.
\end{tcolorbox}
\begin{center}
\vspace{-0.1cm}
- \includegraphics[width=0.8\textwidth]{images/system_model2.pdf}
+ \includegraphics[width=0.8\textwidth]{images/system_model.pdf}
\end{center}
% The reason why the cooling system is in the graph is because of the fact that 40\% of total energy consumed in DCs comes from cooling~\cite{DBLP:conf/noms/ZhangZLZWC22}.
% It has come to the point where datacenters are being build in the Pan-Arctic region, such as Finland,Russia,Sweden etc. with Iceland leading in number of DCs https://www.datacentermap.com/iceland/
@@ -142,7 +140,7 @@
\begin{minipage}[b]{0.45\linewidth}
\vspace{-0.2cm}
\begin{center}
- \includegraphics[width=1.2\linewidth]{images/predictive_analyticsv3.pdf}
+ \includegraphics[width=1.2\linewidth]{images/novel_eval_method.pdf}
\end{center}
\tiny
\vspace{-0.2cm}
@@ -169,7 +167,7 @@
\hspace{-0.2cm}
\begin{minipage}[b]{0.45\linewidth}
\begin{center}
- \includegraphics[width=1.1\textwidth]{images/25_Jun_2026_152341.pdf}
+ \includegraphics[width=1.1\textwidth]{images/red_yellow_alarms.pdf}
\end{center}
\vspace{-0.3cm}
\tiny
@@ -179,7 +177,7 @@
\hspace{0.6cm}
\begin{minipage}[b]{0.45\linewidth}
\begin{center}
- \includegraphics[width=1.1\textwidth]{images/25_Jun_2026_161052.pdf}
+ \includegraphics[width=1.1\textwidth]{images/failure_detecton_rate.pdf}
\end{center}
\vspace{-0.3cm}
\tiny
@@ -190,55 +188,65 @@
% Give more reliable results than just numbers -- do statistical testing, i.e., standard deviation, confidence intervals.
\end{frame}
-\begin{frame}\frametitle{\textbf{RQ3}: Experimental Results II}
+\begin{frame}\frametitle{\textbf{RQ3}: Experimental Results II} % Let's say we have some knowledge about the kind of workload we are going to run, e.g., Skype video calls.
+ % We can then estimate on previous Skype node failures and one of statistical distributions when are failures likely to happen.
+ % During the experiment, we unfortunately do not know what kind of distribution will the failures follow, so we constantly check to see which one fits best, and dynamically adjust the scheduling policy based on that.
+ %---%
+ % Step 1: We know we are going to soon run a workload coming in from Skype. Let's try to predict the failure pattern we might encounter.
+ % Run the OpenDC simulator 5 times to estimate the possible failure patterns. Save the results inside the Digital Twin.
+ % Step 2: Run the Digital Twin. Each time a new metric comes in, update the similarity score of each possible distribution.
+ % If the distribution with the similarity score that is the highest is about to match timestamps with the running workload AND according to the distribution we are going to experience failures in hosts A,B,C,D, % We decide to stop scheduling tasks on hosts A,B,C and D (we send a message to the running datacenter).
\begin{tcolorbox}[title=Main Finding III]
- \emph{Sunfish} is capable of dynamic adjustments to the physical twin at runtime, and can lower the mean number of failed tasks.
+ Predicting failures in advance is really difficult. \emph{Sunfish} is capable of dynamic adjustments to the physical twin at runtime, and can slightly lower the number of failed tasks.
\end{tcolorbox}
- \hspace{0.2cm}
+ \hspace{-0.2cm}
\begin{minipage}[b]{0.45\linewidth}
\begin{center}
- \includegraphics[width=1.1\textwidth]{images/23_Jun_2026_102028.pdf}
+ \includegraphics[width=1.1\textwidth]{images/failure_likelihood.pdf}
\end{center}
\vspace{-0.3cm}
\tiny
- \textbf{Figure 1.8a:} Experiment 2a.
+ \textbf{Figure 1.8a:} Experiment 2a. The figure shows which failure distribution is the most likely to be the true failure distribution while the simulation is running.
+ This figure shows the difficulty of predictive analytics.
\end{minipage}
+ \hspace{0.5cm}
\begin{minipage}[b]{0.45\linewidth}
+ \vspace{-0.1cm}
\begin{center}
- \includegraphics[width=1.1\textwidth]{images/23_Jun_2026_102028.pdf}
+ \includegraphics[width=1.1\textwidth]{images/conceptual_experiment.pdf}
\end{center}
\vspace{-0.3cm}
\tiny
- \textbf{Figure 1.8b:} Experiment 2b.
+ \textbf{Figure 1.8b:} Experiment 2b. With perfect precognition (\emph{i.e.,} knowing on which day, what failures might happen) we could lower the mean number of failures.
+ This experiment is a proof of concept (results are indication-only).
\end{minipage}
\end{frame}
\begin{frame}\frametitle{Key Takeaways}
- \begin{tcolorbox}[title=What is the societal context?]
+ \begin{tcolorbox}[title=Societal Context]
Datacenter manageability is a top-priority for the digital society.
Over 3 million jobs in the Netherlands directly depend on cloud services, which are hosted in datacenters~\cite{DBLP:journals/corr/IosupKLVG22}.
\end{tcolorbox}
- \begin{tcolorbox}[title=What problem did we solve?]
+ \begin{tcolorbox}[title=Problem Statement]
DCDT's, still under development, lack crucial features such as predictive analytics to manage datacenters well.
The entire DCDT design space remains largely unexplored.
\end{tcolorbox}
- \begin{tcolorbox}[title=How did we solve this problem?]
- Our contributions are: a thorough literature survey with a system model, a DCDT reference architecture, and prototype-based experiments via a novel evaluation method.
+ \begin{tcolorbox}[title=Contributions]
+ (1) A thorough literature survey with a system model, (2) a DCDT reference architecture, and (3) prototype-based experiments via a novel evaluation method.
\end{tcolorbox}
- \begin{tcolorbox}[title=What did we find?]
- \emph{Sunfish} can reliably detect unexpected failures based on discrete-event predictions, and can serve as a foundation for additional research and future work.
+ \begin{tcolorbox}[title=Main Findings]
+ \emph{Sunfish} can reliably detect unexpected failures based on discrete-event predictions, and can serve as a foundation for research and future work in predictive analytics.
\end{tcolorbox}
% Mandatory to mention here the future work that you see happening.
% Not enough space for another tcolorbox.
\end{frame}
-\setcounter{framenumber}{3}
+\setcounter{framenumber}{4}
\setbeamertemplate{footline}[page number]{}
-
% Unfortunately this must remain here.
\setbeamercolor{frametitle}{fg=Brown,bg=Brown!20}
\setbeamertemplate{frametitle}{