From 5633dc5a8760e47d810704185b25635cefe28180 Mon Sep 17 00:00:00 2001
From: Bartosz Taudul
Date: Sat, 13 Jul 2019 15:32:07 +0200
Subject: [PATCH] Add ARM64 NEON timings for DXT1 compression.

---
 manual/tracy.tex | 10 +++++++---
 1 file changed, 7 insertions(+), 3 deletions(-)

diff --git a/manual/tracy.tex b/manual/tracy.tex
index 0b851386..bbddce9f 100644
--- a/manual/tracy.tex
+++ b/manual/tracy.tex
@@ -460,12 +460,16 @@ To further reduce image data size, frame images are internally compressed using
 \begin{tabular}[h]{c|c|c}
 \textbf{Implementation} & \textbf{Required define} & \textbf{Time} \\ \hline
 x86 Reference & --- & 228 \si{\micro\second} \\
-x86 SSE4.1 & \texttt{\_\_SSE4\_1\_\_} & 35.8 \si{\micro\second} \\
+x86 SSE4.1\textsuperscript{a} & \texttt{\_\_SSE4\_1\_\_} & 35.8 \si{\micro\second} \\
 x86 AVX2 & \texttt{\_\_AVX2\_\_} & 26.5 \si{\micro\second} \\
 ARM Reference & --- & 1.23 \si{\milli\second} \\
-ARM NEON & \texttt{\_\_ARM\_NEON} & 551 \si{\micro\second}
+ARM32 NEON\textsuperscript{b} & \texttt{\_\_ARM\_NEON} & 561 \si{\micro\second} \\
+ARM64 NEON & \texttt{\_\_ARM\_NEON} & 473 \si{\micro\second}
 \end{tabular}
-\caption{Compression time of $320\times180$ image. x86: i7 8700K; ARM: ODROID-C2}
+
+\vspace{1em}
+\textsuperscript{a)} VEX encoding; \hspace{0.5em} \textsuperscript{b)} ARM32 NEON code compiled for ARM64
+\caption{Compression time of $320\times180$ image. x86: i7 8700K; ARM: ODROID-C2.}
 \label{EtcSimd}
 \end{table}
 