Further writeup
This commit is contained in:
parent
4368f6eaa6
commit
f8e83ebaf7
3 changed files with 20 additions and 9 deletions
|
@ -27,7 +27,7 @@
|
|||
\end{frame}
|
||||
|
||||
\begin{frame}{Quelques ordres de grandeur}
|
||||
|
||||
\todo{}
|
||||
\begin{columns}
|
||||
\begin{column}{0.32\textwidth}
|
||||
\begin{block}{Nombres}
|
||||
|
|
|
@ -7,16 +7,16 @@
|
|||
|
||||
\begin{frame}{Possible bottlenecks}
|
||||
\begin{columns}
|
||||
\begin{column}{0.4\textwidth}
|
||||
\begin{column}{0.37\textwidth}
|
||||
\begin{center}
|
||||
\includegraphics[width=\textwidth]{cpu_big_picture_truncate.svg}
|
||||
\end{center}
|
||||
\end{column}
|
||||
\hfill
|
||||
\begin{column}{0.58\textwidth}
|
||||
\begin{column}{0.62\textwidth}
|
||||
\begin{tightitemize}{0pt}
|
||||
\begin{itemize}
|
||||
\item \alert{Frontend:} \uops{} issued not fast enough;
|
||||
\item \alert{Frontend:} \uops{} not issued fast enough;
|
||||
issuing faster would speed up computation;
|
||||
\bigskip
|
||||
|
||||
|
@ -31,6 +31,11 @@
|
|||
\end{tightitemize}
|
||||
\end{column}
|
||||
\end{columns}
|
||||
|
||||
\pause{}
|
||||
\begin{center}
|
||||
\textbf{\alert{These pieces can (mostly) be modeled independently!}}
|
||||
\end{center}
|
||||
\end{frame}
|
||||
|
||||
\begin{frame}{Dependencies and the ROB}
|
||||
|
@ -67,6 +72,8 @@
|
|||
given CPU
|
||||
\item Features microarchitectural models
|
||||
\item Most often static analyzers
|
||||
\item Predict at least the \emph{reverse-throughput} of a
|
||||
kernel (cycles per iteration)
|
||||
\item May derive further useful metrics, \eg{} bottlenecks, by
|
||||
inspecting their model at will
|
||||
\end{itemize}
|
||||
|
@ -87,14 +94,13 @@
|
|||
|
||||
\begin{frame}{Existing code analyzers}
|
||||
\begin{itemize}
|
||||
\item Intel \alert{\iaca{}}: proprietary and only compatible with
|
||||
Intel. First ``good'' code analyzer, now deprecated. Was (is?)
|
||||
widely used.
|
||||
\item Intel \alert{\iaca{}}: proprietary, Intel CPUs only. First
|
||||
``good'' code analyzer, now deprecated. Was (is?) widely used.
|
||||
\item \alert{\llvmmca{}}: FOSS, production-grade, many
|
||||
microarchitectures. Based on data from the \texttt{llvm} compiler.
|
||||
\item \alert{\uica{}} and \alert{\uopsinfo{}}: research, good accuracy.
|
||||
Intel.
|
||||
\item \alert{\ithemal{}}: machine-learning based. Not so accurate.
|
||||
Intel CPUs.
|
||||
\item \alert{\ithemal{}}: machine-learning based.
|
||||
\item \alert{\gus{}}: instrumentation-based code analyzer (not
|
||||
static) $\leadsto$ slow. Access to more information. Made in the
|
||||
CORSE team.
|
||||
|
@ -103,3 +109,8 @@
|
|||
Except \ithemal{}, \alert{all} are (to some extent) based on manually made
|
||||
models!
|
||||
\end{frame}
|
||||
|
||||
\begin{frame}{When I started my PhD\ldots}
|
||||
\centering
|
||||
\includegraphics[height=0.9\textheight]{patate_placeholder.jpg}
|
||||
\end{frame}
|
||||
|
|
BIN
slides/assets/imgs/20_foundations/patate_placeholder.jpg
Normal file
BIN
slides/assets/imgs/20_foundations/patate_placeholder.jpg
Normal file
Binary file not shown.
After Width: | Height: | Size: 198 KiB |
Loading…
Reference in a new issue