/articles/toma

To get this branch, use:
bzr branch http://darksoft.org/webbzr/articles/toma
24 by Suren A. Chilingaryan
Occupancy tunning
1
%ToDo: Shall we add the unrolling of projection-loop in parameters?
34 by Suren A. Chilingaryan
Fix cross-references and some latex complaints
2
\begin{table}[htb] %[htbp]
24 by Suren A. Chilingaryan
Occupancy tunning
3
\begin{threeparttable}
27 by Suren A. Chilingaryan
Alutex/Oversampling tables are fixed and hybrid section is finished
4
\caption{\label{tbl:newtex} Performance and configuration of the cache-aware texture-based back-projection kernel}
24 by Suren A. Chilingaryan
Occupancy tunning
5
\centering
6
\noindent
7
%\resizebox{\columnwidth}{!}{\begin{tabular}{} ... \end{tabular}}
8
\begin{tabularx}{\columnwidth}{ | X  c | r | r r r | }
9
\hline
10
& & & \multicolumn{3}{c|}{Configuration} \\
32 by Suren A. Chilingaryan
Fix algorithms and separate them into the files as well
11
\mhd{|c}{GPU} & \mhd{c|}{$n_v$} & \mhd{c|}{Perf.} & \mhd{c}{Occupancy} & \mhd{c}{L1/ShMem} & \mhd{c|}{Cache} \\
24 by Suren A. Chilingaryan
Occupancy tunning
12
13
\hline
32 by Suren A. Chilingaryan
Fix algorithms and separate them into the files as well
14
GTX295 & 1 &  49 GU/s & 75\% & - & -  \\
24 by Suren A. Chilingaryan
Occupancy tunning
15
16
\hline
17
\multirow{3}{*}{GTX580} 
32 by Suren A. Chilingaryan
Fix algorithms and separate them into the files as well
18
& 1 &  49 GU/s & 50\% & 16/48 & -  \\
19
& 2 &  97 GU/s & 50\% & 16/48 & -  \\
20
& 4 & 172 GU/s & 50\% & 16/48 & -  \\
24 by Suren A. Chilingaryan
Occupancy tunning
21
\hline
22
23
\multirow{2}{*}{GTX680} 
32 by Suren A. Chilingaryan
Fix algorithms and separate them into the files as well
24
& 1 & 118 GU/s & 100\% & 16/48 & - \\
25
& 2 & 232 GU/s & 100\% & 32/32 & - \\ 
24 by Suren A. Chilingaryan
Occupancy tunning
26
\hline
27
28
\multirow{2}{*}{Titan} 
32 by Suren A. Chilingaryan
Fix algorithms and separate them into the files as well
29
& 1 & 200 GU/s & 100\% & 16/48 & -  \\
30
& 2 & 362 GU/s & 100\% & 32/32 & - \\
24 by Suren A. Chilingaryan
Occupancy tunning
31
\hline
32
33
\multirow{3}{*}{GTX980} 
32 by Suren A. Chilingaryan
Fix algorithms and separate them into the files as well
34
& 1 & 155 GU/s & 100\% & -     & - \\
35
& 2 & 304 GU/s & 100\% & -     & - \\
36
& 4 & 555 GU/s &  75\% & -     & - \\
24 by Suren A. Chilingaryan
Occupancy tunning
37
\hline
38
39
\multirow{3}{*}{Titan X} 
32 by Suren A. Chilingaryan
Fix algorithms and separate them into the files as well
40
& 1 & 389 GU/s & 100\% & -     & - \\
41
& 2 & 726 GU/s & 100\% & -     & - \\
42
& 4 &1396 GU/s &  75\% & -     & - \\
24 by Suren A. Chilingaryan
Occupancy tunning
43
\hline
44
45
HD5970 & 1 &  56 GU/s & - & - & 256 \\
46
\hline
47
HD7970 & 1 & 115 GU/s & - & - & 256 \\
48
\hline
49
R9-290 & 1 & 146 GU/s & - & - & 256 \\
50
\hline
51
\end{tabularx}
52
\begin{tablenotes}
27 by Suren A. Chilingaryan
Alutex/Oversampling tables are fixed and hybrid section is finished
53
\item The table summarizes the performance and optimal configuration for the texture-based back-projection kernel. Information is provided for all supported slice-modes.
24 by Suren A. Chilingaryan
Occupancy tunning
54
\end{tablenotes}
55
\end{threeparttable}
56
\end{table}