This commit is contained in:
Anthony Scemama 2024-06-19 14:22:19 +02:00
parent 24f2b44dae
commit 0643fb7008

View File

@ -434,11 +434,11 @@ On the ARM architecture, we utilized the \textsc{ArmPL} library for BLAS operati
\begin{ruledtabular}
\begin{tabular}{lccccccc}
CPU & $N_{\text{cores}}$ & Shared L3 cache & $V$ & $F$ & Memory bandwidth & Peak DP & Measured performance \\
& (MB) & & & (GHz) & (GB/s) & (GFlop/s) & (GFlop/s) \\
& & (MB) & & (GHz) & (GB/s) & (GFlop/s) & (GFlop/s) \\
\hline
\textsc{EPYC} 7513 & $2\times 128$ & $2 \times 32$ & 4 & 2.6 & 409.6 & 2~662 & 1~576 \\
Xeon Gold 6130 & $2\times 22$ & $2 \times 16$ & 8 & 2.1 & 256.0 & 2~150 & 667 \\ % 239.891
ARM Q80 & $32$ & $80$ & 2 & 2.8 & 204.8 & 1~792 & 547 \\ % 292.492
\textsc{EPYC} 7513 & $2 \times 32$ & $2\times 128$ & 4 & 2.6 & 409.6 & 2~662 & 1~576 \\
Xeon Gold 6130 & $2 \times 16$ & $2\times 22$ & 8 & 2.1 & 256.0 & 2~150 & 667 \\ % 239.891
ARM Q80 & $80$ & $32$ & 2 & 2.8 & 204.8 & 1~792 & 547 \\ % 292.492
\end{tabular}
\end{ruledtabular}
\caption{\label{tab:flops} Average performance of the code, measured as the number of double-precision (DP) floating-point operations per second (Flop/s), on different machines.}