|
@@ -1,82 +1,42 @@
|
|
|
-% raw data and charts
|
|
|
|
|
-% differences in used algos/ algos in tools
|
|
|
|
|
-% optimization approach
|
|
|
|
|
-% further research focus
|
|
|
|
|
-% (how optimization would be recognizable in testdata)
|
|
|
|
|
-
|
|
|
|
|
\chapter{Results and Discussion}
|
|
\chapter{Results and Discussion}
|
|
|
|
|
|
|
|
-\begin{table}[ht]
|
|
|
|
|
-\caption{Multi-column table}
|
|
|
|
|
-\begin{center}
|
|
|
|
|
-\begin{tabular}{cc}
|
|
|
|
|
- \hline
|
|
|
|
|
- \multicolumn{2}{c}{Multi-column}\\
|
|
|
|
|
- X&X\\
|
|
|
|
|
- \hline
|
|
|
|
|
-\end{tabular}
|
|
|
|
|
-\end{center}
|
|
|
|
|
-\label{tab:multicol}
|
|
|
|
|
-\end{table}
|
|
|
|
|
-
|
|
|
|
|
-
|
|
|
|
|
-\begin{table}[ht]
|
|
|
|
|
-\caption{Multi-column table}
|
|
|
|
|
-\begin{center}
|
|
|
|
|
-\begin{tabular}{ |p{3cm}||p{3cm}|p{3cm}|p{3cm}| }
|
|
|
|
|
- \hline
|
|
|
|
|
- \multicolumn{4}{|c|}{ratio}\\
|
|
|
|
|
- \hline
|
|
|
|
|
- h: tool v: taks&GeCo&samtools to BAM& samtools to CRAM\\
|
|
|
|
|
- \hline
|
|
|
|
|
- method/taks& geco &sam -> bam &sam -> cram\\
|
|
|
|
|
-% conversion& - &- & \\
|
|
|
|
|
-% compression in ms& & & \\
|
|
|
|
|
-% compression ratio& & & \\
|
|
|
|
|
- \hline
|
|
|
|
|
-\end{tabular}
|
|
|
|
|
-\end{center}
|
|
|
|
|
-\label{tab:multicol}
|
|
|
|
|
-\end{table}
|
|
|
|
|
-
|
|
|
|
|
|
|
|
|
|
-\begin{tabular}{ |p{3cm}||p{3cm}|p{3cm}|p{3cm}| }
|
|
|
|
|
|
|
+\begin{tabular}{ |p{2cm}||p{3cm}|p{3,5cm}|p{3,5cm}| }
|
|
|
\hline
|
|
\hline
|
|
|
- \multicolumn{4}{|c|}{Compression time} \\
|
|
|
|
|
|
|
+ \multicolumn{4}{|c|}{Compression time in milliseconds} \\
|
|
|
\hline
|
|
\hline
|
|
|
- & \acs{GECO}& Samtools&\\
|
|
|
|
|
|
|
+ & \acs{GeCo}& Samtools \acs{BAM}& Samtools \acs{CRAM}\\
|
|
|
\hline
|
|
\hline
|
|
|
- % method/taks& geco &sam -> bam &sam -> cram\\
|
|
|
|
|
- File 1 & 235005& 15178& \\
|
|
|
|
|
- File 2 & 246503& 15211& \\
|
|
|
|
|
- File 3 & 20169& 12526& \\
|
|
|
|
|
- File 4 & 194081& 11986& \\
|
|
|
|
|
- File 5 & 183878& 11436& \\
|
|
|
|
|
- File 6 & 173646& 10738& \\
|
|
|
|
|
- File 7 & 159999& 9995& \\
|
|
|
|
|
- File 8 & 148288& 9142& \\
|
|
|
|
|
- File 9 & 12304& 8276& \\
|
|
|
|
|
- File 10 & 134937& 8460& \\
|
|
|
|
|
- File 11 & 136299& 8508& \\
|
|
|
|
|
- File 12 & 134932& 8467& \\
|
|
|
|
|
- File 13 & 999022& 6770& \\
|
|
|
|
|
- File 14 & 924753& 6309& \\
|
|
|
|
|
- File 15 & 852555& 5959& \\
|
|
|
|
|
- File 16 & 827651& 5481& \\
|
|
|
|
|
- File 17 & 820814& 5151& \\
|
|
|
|
|
- File 18 & 798429& 5012& \\
|
|
|
|
|
- File 19 & 586058& 3662& \\
|
|
|
|
|
- File 20 & 645884& 4025& \\
|
|
|
|
|
- File 21 & 411984& 2783& \\
|
|
|
|
|
|
|
+ File 1 & 235005& 3786& 16926\\
|
|
|
|
|
+ File 2 & 246503& 3784& 17043\\
|
|
|
|
|
+ File 3 & 20169& 3123& 13999\\
|
|
|
|
|
+ File 4 & 194081& 3011& 13445\\
|
|
|
|
|
+ File 5 & 183878& 2862& 12802\\
|
|
|
|
|
+ File 6 & 173646& 2685& 12015\\
|
|
|
|
|
+ File 7 & 159999& 2503& 11198\\
|
|
|
|
|
+ File 8 & 148288& 2286& 10244\\
|
|
|
|
|
+ File 9 & 12304& 2078& 9210\\
|
|
|
|
|
+ File 10 & 134937& 2127& 9461\\
|
|
|
|
|
+ File 11 & 136299& 2132& 9508\\
|
|
|
|
|
+ File 12 & 134932& 2115& 9456\\
|
|
|
|
|
+ File 13 & 999022& 1695& 7533\\
|
|
|
|
|
+ File 14 & 924753& 1592& 7011\\
|
|
|
|
|
+ File 15 & 852555& 1507& 6598\\
|
|
|
|
|
+ File 16 & 827651& 1390& 6089\\
|
|
|
|
|
+ File 17 & 820814& 1306& 5791\\
|
|
|
|
|
+ File 18 & 798429& 1277& 5603\\
|
|
|
|
|
+ File 19 & 586058& 960& 4106\\
|
|
|
|
|
+ File 20 & 645884& 1026& 4507\\
|
|
|
|
|
+ File 21 & 411984& 721& 3096\\
|
|
|
\hline
|
|
\hline
|
|
|
\end{tabular}
|
|
\end{tabular}
|
|
|
|
|
|
|
|
|
|
|
|
|
\begin{tabular}{ |p{3cm}||p{3cm}|p{3cm}|p{3cm}| }
|
|
\begin{tabular}{ |p{3cm}||p{3cm}|p{3cm}|p{3cm}| }
|
|
|
\hline
|
|
\hline
|
|
|
- \multicolumn{4}{|c|}{File sizes} \\
|
|
|
|
|
|
|
+ \multicolumn{4}{|c|}{File sizes in bytes} \\
|
|
|
\hline
|
|
\hline
|
|
|
- & Source file& \acs{GECO}& Samtools CRAM\\
|
|
|
|
|
|
|
+ & Source file& \acs{GeCo}& Samtools \acs{CRAM}\\
|
|
|
\hline
|
|
\hline
|
|
|
File 1& 253105752& 46364770& 55769827\\
|
|
File 1& 253105752& 46364770& 55769827\\
|
|
|
File 2& 136027438& 27411806& 32238052\\
|
|
File 2& 136027438& 27411806& 32238052\\
|
|
@@ -101,3 +61,14 @@
|
|
|
File 21& 147557670& 23932541& 29459829\\
|
|
File 21& 147557670& 23932541& 29459829\\
|
|
|
\hline
|
|
\hline
|
|
|
\end{tabular}
|
|
\end{tabular}
|
|
|
|
|
+
|
|
|
|
|
+% raw data and charts
|
|
|
|
|
+% differences in used algos/ algos in tools
|
|
|
|
|
+% optimization approach
|
|
|
|
|
+% further research focus
|
|
|
|
|
+% (how optimization would be recognizable in testdata)
|
|
|
|
|
+
|
|
|
|
|
+% TODO: convert ms to minutes and bytes to MB; move these tables to the appendix
|
|
|
|
|
+The two tables above contain the raw measurement values for the two goals described in~\ref{k5:goals}. The first table shows how long each compression procedure took. Each row contains information about one of the \texttt{Homo\_sapiens.GRCh38.dna.chromosome.}x\texttt{.fa} files. To improve readability, the filenames were replaced by \texttt{File}. To determine which file was compressed, simply replace the placeholder x with the number following \texttt{File}.\\
|
|
|
|
|
+
|
|
|
|
|
+While \acs{GeCo} takes more time to compress, it is more effective, that is, it achieves a greater reduction in file size.\\
|