From 258970eaf49a77897ae6ae8a8019ed86983c9e0d Mon Sep 17 00:00:00 2001 From: Connor Moore Date: Tue, 10 Feb 2026 10:52:40 -0500 Subject: Implemented feedback. Redid plots and gnuplot file. --- report/figures/f1_n_scaling.pdf | Bin 0 -> 9270 bytes report/figures/f1_n_scaling.tex | 122 ++++++++++++ report/figures/f2_compilers_scaling.pdf | Bin 0 -> 7880 bytes report/figures/f2_compilers_scaling.tex | 124 ++++++++++++ report/figures/f3_compilers_scaling.pdf | Bin 0 -> 10329 bytes report/figures/f3_compilers_scaling.tex | 122 ++++++++++++ report/figures/f4_compilers_scaling.pdf | Bin 0 -> 7905 bytes report/figures/f4_compilers_scaling.tex | 124 ++++++++++++ report/figures/f5_compilers_scaling.pdf | Bin 0 -> 10571 bytes report/figures/f5_compilers_scaling.tex | 122 ++++++++++++ report/figures/f6_optflags_scaling.pdf | Bin 0 -> 7954 bytes report/figures/f6_optflags_scaling.tex | 122 ++++++++++++ report/figures/f7_optflags_scaling.pdf | Bin 0 -> 7835 bytes report/figures/f7_optflags_scaling.tex | 124 ++++++++++++ report/figures/gfortran_O3_serial.csv | 52 +++++ report/figures/gfortran_rowloop_opt.csv | 141 ++++++++++++++ report/figures/gfortran_rowloop_optflags.csv | 35 ++++ report/figures/gfortran_serial_perflags.csv | 141 ++++++++++++++ report/figures/ifx_rowloop_opt.csv | 141 ++++++++++++++ report/figures/ifx_rowloop_optflags.csv | 35 ++++ report/figures/ifx_serial_perflags.csv | 141 ++++++++++++++ .../figures/ifx_vs_gfortran_O3_serial_results.csv | 106 +++++++++++ .../ifx_vs_gfortran_parallel_O3_results.csv | 106 +++++++++++ report/figures/plots.gnu | 211 +++++++-------------- 24 files changed, 1826 insertions(+), 143 deletions(-) create mode 100644 report/figures/f1_n_scaling.pdf create mode 100644 report/figures/f1_n_scaling.tex create mode 100644 report/figures/f2_compilers_scaling.pdf create mode 100644 report/figures/f2_compilers_scaling.tex create mode 100644 report/figures/f3_compilers_scaling.pdf create mode 100644 report/figures/f3_compilers_scaling.tex 
create mode 100644 report/figures/f4_compilers_scaling.pdf create mode 100644 report/figures/f4_compilers_scaling.tex create mode 100644 report/figures/f5_compilers_scaling.pdf create mode 100644 report/figures/f5_compilers_scaling.tex create mode 100644 report/figures/f6_optflags_scaling.pdf create mode 100644 report/figures/f6_optflags_scaling.tex create mode 100644 report/figures/f7_optflags_scaling.pdf create mode 100644 report/figures/f7_optflags_scaling.tex create mode 100644 report/figures/gfortran_O3_serial.csv create mode 100644 report/figures/gfortran_rowloop_opt.csv create mode 100644 report/figures/gfortran_rowloop_optflags.csv create mode 100644 report/figures/gfortran_serial_perflags.csv create mode 100644 report/figures/ifx_rowloop_opt.csv create mode 100644 report/figures/ifx_rowloop_optflags.csv create mode 100644 report/figures/ifx_serial_perflags.csv create mode 100644 report/figures/ifx_vs_gfortran_O3_serial_results.csv create mode 100644 report/figures/ifx_vs_gfortran_parallel_O3_results.csv (limited to 'report/figures') diff --git a/report/figures/f1_n_scaling.pdf b/report/figures/f1_n_scaling.pdf new file mode 100644 index 0000000..e16ad62 Binary files /dev/null and b/report/figures/f1_n_scaling.pdf differ diff --git a/report/figures/f1_n_scaling.tex b/report/figures/f1_n_scaling.tex new file mode 100644 index 0000000..b769510 --- /dev/null +++ b/report/figures/f1_n_scaling.tex @@ -0,0 +1,122 @@ +% GNUPLOT: LaTeX picture with Postscript +\begingroup + \makeatletter + \providecommand\color[2][]{% + \GenericError{(gnuplot) \space\space\space\@spaces}{% + Package color not loaded in conjunction with + terminal option `colourtext'% + }{See the gnuplot documentation for explanation.% + }{Either use 'blacktext' in gnuplot or load the package + color.sty in LaTeX.}% + \renewcommand\color[2][]{}% + }% + \providecommand\includegraphics[2][]{% + \GenericError{(gnuplot) \space\space\space\@spaces}{% + Package graphicx or graphics not loaded% + }{See the 
gnuplot documentation for explanation.% + }{The gnuplot epslatex terminal needs graphicx.sty or graphics.sty.}% + \renewcommand\includegraphics[2][]{}% + }% + \providecommand\rotatebox[2]{#2}% + \@ifundefined{ifGPcolor}{% + \newif\ifGPcolor + \GPcolortrue + }{}% + \@ifundefined{ifGPblacktext}{% + \newif\ifGPblacktext + \GPblacktexttrue + }{}% + % define a \g@addto@macro without @ in the name: + \let\gplgaddtomacro\g@addto@macro + % define empty templates for all commands taking text: + \gdef\gplbacktext{}% + \gdef\gplfronttext{}% + \makeatother + \ifGPblacktext + % no textcolor at all + \def\colorrgb#1{}% + \def\colorgray#1{}% + \else + % gray or color? + \ifGPcolor + \def\colorrgb#1{\color[rgb]{#1}}% + \def\colorgray#1{\color[gray]{#1}}% + \expandafter\def\csname LTw\endcsname{\color{white}}% + \expandafter\def\csname LTb\endcsname{\color{black}}% + \expandafter\def\csname LTa\endcsname{\color{black}}% + \expandafter\def\csname LT0\endcsname{\color[rgb]{1,0,0}}% + \expandafter\def\csname LT1\endcsname{\color[rgb]{0,1,0}}% + \expandafter\def\csname LT2\endcsname{\color[rgb]{0,0,1}}% + \expandafter\def\csname LT3\endcsname{\color[rgb]{1,0,1}}% + \expandafter\def\csname LT4\endcsname{\color[rgb]{0,1,1}}% + \expandafter\def\csname LT5\endcsname{\color[rgb]{1,1,0}}% + \expandafter\def\csname LT6\endcsname{\color[rgb]{0,0,0}}% + \expandafter\def\csname LT7\endcsname{\color[rgb]{1,0.3,0}}% + \expandafter\def\csname LT8\endcsname{\color[rgb]{0.5,0.5,0.5}}% + \else + % gray + \def\colorrgb#1{\color{black}}% + \def\colorgray#1{\color[gray]{#1}}% + \expandafter\def\csname LTw\endcsname{\color{white}}% + \expandafter\def\csname LTb\endcsname{\color{black}}% + \expandafter\def\csname LTa\endcsname{\color{black}}% + \expandafter\def\csname LT0\endcsname{\color{black}}% + \expandafter\def\csname LT1\endcsname{\color{black}}% + \expandafter\def\csname LT2\endcsname{\color{black}}% + \expandafter\def\csname LT3\endcsname{\color{black}}% + \expandafter\def\csname 
LT4\endcsname{\color{black}}% + \expandafter\def\csname LT5\endcsname{\color{black}}% + \expandafter\def\csname LT6\endcsname{\color{black}}% + \expandafter\def\csname LT7\endcsname{\color{black}}% + \expandafter\def\csname LT8\endcsname{\color{black}}% + \fi + \fi + \setlength{\unitlength}{0.0500bp}% + \ifx\gptboxheight\undefined% + \newlength{\gptboxheight}% + \newlength{\gptboxwidth}% + \newsavebox{\gptboxtext}% + \fi% + \setlength{\fboxrule}{0.5pt}% + \setlength{\fboxsep}{1pt}% + \definecolor{tbcol}{rgb}{1,1,1}% +\begin{picture}(7200.00,3600.00)% + \gplgaddtomacro\gplbacktext{% + \csname LTb\endcsname%% + \put(820,865){\makebox(0,0)[r]{\strut{}$10^{-6}$}}% + \csname LTb\endcsname%% + \put(820,1285){\makebox(0,0)[r]{\strut{}$10^{-4}$}}% + \csname LTb\endcsname%% + \put(820,1705){\makebox(0,0)[r]{\strut{}$10^{-2}$}}% + \csname LTb\endcsname%% + \put(820,2125){\makebox(0,0)[r]{\strut{}$10^{0}$}}% + \csname LTb\endcsname%% + \put(820,2545){\makebox(0,0)[r]{\strut{}$10^{2}$}}% + \csname LTb\endcsname%% + \put(820,2965){\makebox(0,0)[r]{\strut{}$10^{4}$}}% + \csname LTb\endcsname%% + \put(1323,450){\makebox(0,0){\strut{}$100$}}% + \csname LTb\endcsname%% + \put(3843,450){\makebox(0,0){\strut{}$1000$}}% + \csname LTb\endcsname%% + \put(6364,450){\makebox(0,0){\strut{}$10000$}}% + }% + \gplgaddtomacro\gplfronttext{% + \csname LTb\endcsname%% + \put(3134,3395){\makebox(0,0)[r]{\strut{}Row-major loop}}% + \csname LTb\endcsname%% + \put(3134,3190){\makebox(0,0)[r]{\strut{}Col.-major loop}}% + \csname LTb\endcsname%% + \put(5568,3395){\makebox(0,0)[r]{\strut{}\texttt{Matmul}}}% + \csname LTb\endcsname%% + \put(5568,3190){\makebox(0,0)[r]{\strut{}DGEMM}}% + \csname LTb\endcsname%% + \put(186,1810){\rotatebox{-270.00}{\makebox(0,0){\strut{}Wall Time [s]}}}% + \csname LTb\endcsname%% + \put(3888,143){\makebox(0,0){\strut{}Size [$N \times N$]}}% + }% + \gplbacktext + \put(0,0){\includegraphics[width={360.00bp},height={180.00bp}]{f1_n_scaling}}% + \gplfronttext + \end{picture}% 
+\endgroup diff --git a/report/figures/f2_compilers_scaling.pdf b/report/figures/f2_compilers_scaling.pdf new file mode 100644 index 0000000..bedf2a5 Binary files /dev/null and b/report/figures/f2_compilers_scaling.pdf differ diff --git a/report/figures/f2_compilers_scaling.tex b/report/figures/f2_compilers_scaling.tex new file mode 100644 index 0000000..7fa4589 --- /dev/null +++ b/report/figures/f2_compilers_scaling.tex @@ -0,0 +1,124 @@ +% GNUPLOT: LaTeX picture with Postscript +\begingroup + \makeatletter + \providecommand\color[2][]{% + \GenericError{(gnuplot) \space\space\space\@spaces}{% + Package color not loaded in conjunction with + terminal option `colourtext'% + }{See the gnuplot documentation for explanation.% + }{Either use 'blacktext' in gnuplot or load the package + color.sty in LaTeX.}% + \renewcommand\color[2][]{}% + }% + \providecommand\includegraphics[2][]{% + \GenericError{(gnuplot) \space\space\space\@spaces}{% + Package graphicx or graphics not loaded% + }{See the gnuplot documentation for explanation.% + }{The gnuplot epslatex terminal needs graphicx.sty or graphics.sty.}% + \renewcommand\includegraphics[2][]{}% + }% + \providecommand\rotatebox[2]{#2}% + \@ifundefined{ifGPcolor}{% + \newif\ifGPcolor + \GPcolortrue + }{}% + \@ifundefined{ifGPblacktext}{% + \newif\ifGPblacktext + \GPblacktexttrue + }{}% + % define a \g@addto@macro without @ in the name: + \let\gplgaddtomacro\g@addto@macro + % define empty templates for all commands taking text: + \gdef\gplbacktext{}% + \gdef\gplfronttext{}% + \makeatother + \ifGPblacktext + % no textcolor at all + \def\colorrgb#1{}% + \def\colorgray#1{}% + \else + % gray or color? 
+ \ifGPcolor + \def\colorrgb#1{\color[rgb]{#1}}% + \def\colorgray#1{\color[gray]{#1}}% + \expandafter\def\csname LTw\endcsname{\color{white}}% + \expandafter\def\csname LTb\endcsname{\color{black}}% + \expandafter\def\csname LTa\endcsname{\color{black}}% + \expandafter\def\csname LT0\endcsname{\color[rgb]{1,0,0}}% + \expandafter\def\csname LT1\endcsname{\color[rgb]{0,1,0}}% + \expandafter\def\csname LT2\endcsname{\color[rgb]{0,0,1}}% + \expandafter\def\csname LT3\endcsname{\color[rgb]{1,0,1}}% + \expandafter\def\csname LT4\endcsname{\color[rgb]{0,1,1}}% + \expandafter\def\csname LT5\endcsname{\color[rgb]{1,1,0}}% + \expandafter\def\csname LT6\endcsname{\color[rgb]{0,0,0}}% + \expandafter\def\csname LT7\endcsname{\color[rgb]{1,0.3,0}}% + \expandafter\def\csname LT8\endcsname{\color[rgb]{0.5,0.5,0.5}}% + \else + % gray + \def\colorrgb#1{\color{black}}% + \def\colorgray#1{\color[gray]{#1}}% + \expandafter\def\csname LTw\endcsname{\color{white}}% + \expandafter\def\csname LTb\endcsname{\color{black}}% + \expandafter\def\csname LTa\endcsname{\color{black}}% + \expandafter\def\csname LT0\endcsname{\color{black}}% + \expandafter\def\csname LT1\endcsname{\color{black}}% + \expandafter\def\csname LT2\endcsname{\color{black}}% + \expandafter\def\csname LT3\endcsname{\color{black}}% + \expandafter\def\csname LT4\endcsname{\color{black}}% + \expandafter\def\csname LT5\endcsname{\color{black}}% + \expandafter\def\csname LT6\endcsname{\color{black}}% + \expandafter\def\csname LT7\endcsname{\color{black}}% + \expandafter\def\csname LT8\endcsname{\color{black}}% + \fi + \fi + \setlength{\unitlength}{0.0500bp}% + \ifx\gptboxheight\undefined% + \newlength{\gptboxheight}% + \newlength{\gptboxwidth}% + \newsavebox{\gptboxtext}% + \fi% + \setlength{\fboxrule}{0.5pt}% + \setlength{\fboxsep}{1pt}% + \definecolor{tbcol}{rgb}{1,1,1}% +\begin{picture}(7200.00,3600.00)% + \gplgaddtomacro\gplbacktext{% + \csname LTb\endcsname%% + \put(820,655){\makebox(0,0)[r]{\strut{}$10^{-8}$}}% + \csname 
LTb\endcsname%% + \put(820,1040){\makebox(0,0)[r]{\strut{}$10^{-6}$}}% + \csname LTb\endcsname%% + \put(820,1425){\makebox(0,0)[r]{\strut{}$10^{-4}$}}% + \csname LTb\endcsname%% + \put(820,1810){\makebox(0,0)[r]{\strut{}$10^{-2}$}}% + \csname LTb\endcsname%% + \put(820,2195){\makebox(0,0)[r]{\strut{}$10^{0}$}}% + \csname LTb\endcsname%% + \put(820,2580){\makebox(0,0)[r]{\strut{}$10^{2}$}}% + \csname LTb\endcsname%% + \put(820,2965){\makebox(0,0)[r]{\strut{}$10^{4}$}}% + \csname LTb\endcsname%% + \put(1913,450){\makebox(0,0){\strut{}$100$}}% + \csname LTb\endcsname%% + \put(4378,450){\makebox(0,0){\strut{}$1000$}}% + \csname LTb\endcsname%% + \put(6843,450){\makebox(0,0){\strut{}$10000$}}% + }% + \gplgaddtomacro\gplfronttext{% + \csname LTb\endcsname%% + \put(3134,3395){\makebox(0,0)[r]{\strut{}\texttt{gfortran}: Row-major}}% + \csname LTb\endcsname%% + \put(3134,3190){\makebox(0,0)[r]{\strut{}\texttt{gfortran}: Col.-major}}% + \csname LTb\endcsname%% + \put(6240,3395){\makebox(0,0)[r]{\strut{}\texttt{ifx}: Row-major}}% + \csname LTb\endcsname%% + \put(6240,3190){\makebox(0,0)[r]{\strut{}\texttt{ifx}: Col.-major}}% + \csname LTb\endcsname%% + \put(186,1810){\rotatebox{-270.00}{\makebox(0,0){\strut{}Wall Time [s]}}}% + \csname LTb\endcsname%% + \put(3888,143){\makebox(0,0){\strut{}Size [$N \times N$]}}% + }% + \gplbacktext + \put(0,0){\includegraphics[width={360.00bp},height={180.00bp}]{f2_compilers_scaling}}% + \gplfronttext + \end{picture}% +\endgroup diff --git a/report/figures/f3_compilers_scaling.pdf b/report/figures/f3_compilers_scaling.pdf new file mode 100644 index 0000000..35d958b Binary files /dev/null and b/report/figures/f3_compilers_scaling.pdf differ diff --git a/report/figures/f3_compilers_scaling.tex b/report/figures/f3_compilers_scaling.tex new file mode 100644 index 0000000..4ff4818 --- /dev/null +++ b/report/figures/f3_compilers_scaling.tex @@ -0,0 +1,122 @@ +% GNUPLOT: LaTeX picture with Postscript +\begingroup + \makeatletter + 
\providecommand\color[2][]{% + \GenericError{(gnuplot) \space\space\space\@spaces}{% + Package color not loaded in conjunction with + terminal option `colourtext'% + }{See the gnuplot documentation for explanation.% + }{Either use 'blacktext' in gnuplot or load the package + color.sty in LaTeX.}% + \renewcommand\color[2][]{}% + }% + \providecommand\includegraphics[2][]{% + \GenericError{(gnuplot) \space\space\space\@spaces}{% + Package graphicx or graphics not loaded% + }{See the gnuplot documentation for explanation.% + }{The gnuplot epslatex terminal needs graphicx.sty or graphics.sty.}% + \renewcommand\includegraphics[2][]{}% + }% + \providecommand\rotatebox[2]{#2}% + \@ifundefined{ifGPcolor}{% + \newif\ifGPcolor + \GPcolortrue + }{}% + \@ifundefined{ifGPblacktext}{% + \newif\ifGPblacktext + \GPblacktexttrue + }{}% + % define a \g@addto@macro without @ in the name: + \let\gplgaddtomacro\g@addto@macro + % define empty templates for all commands taking text: + \gdef\gplbacktext{}% + \gdef\gplfronttext{}% + \makeatother + \ifGPblacktext + % no textcolor at all + \def\colorrgb#1{}% + \def\colorgray#1{}% + \else + % gray or color? 
+ \ifGPcolor + \def\colorrgb#1{\color[rgb]{#1}}% + \def\colorgray#1{\color[gray]{#1}}% + \expandafter\def\csname LTw\endcsname{\color{white}}% + \expandafter\def\csname LTb\endcsname{\color{black}}% + \expandafter\def\csname LTa\endcsname{\color{black}}% + \expandafter\def\csname LT0\endcsname{\color[rgb]{1,0,0}}% + \expandafter\def\csname LT1\endcsname{\color[rgb]{0,1,0}}% + \expandafter\def\csname LT2\endcsname{\color[rgb]{0,0,1}}% + \expandafter\def\csname LT3\endcsname{\color[rgb]{1,0,1}}% + \expandafter\def\csname LT4\endcsname{\color[rgb]{0,1,1}}% + \expandafter\def\csname LT5\endcsname{\color[rgb]{1,1,0}}% + \expandafter\def\csname LT6\endcsname{\color[rgb]{0,0,0}}% + \expandafter\def\csname LT7\endcsname{\color[rgb]{1,0.3,0}}% + \expandafter\def\csname LT8\endcsname{\color[rgb]{0.5,0.5,0.5}}% + \else + % gray + \def\colorrgb#1{\color{black}}% + \def\colorgray#1{\color[gray]{#1}}% + \expandafter\def\csname LTw\endcsname{\color{white}}% + \expandafter\def\csname LTb\endcsname{\color{black}}% + \expandafter\def\csname LTa\endcsname{\color{black}}% + \expandafter\def\csname LT0\endcsname{\color{black}}% + \expandafter\def\csname LT1\endcsname{\color{black}}% + \expandafter\def\csname LT2\endcsname{\color{black}}% + \expandafter\def\csname LT3\endcsname{\color{black}}% + \expandafter\def\csname LT4\endcsname{\color{black}}% + \expandafter\def\csname LT5\endcsname{\color{black}}% + \expandafter\def\csname LT6\endcsname{\color{black}}% + \expandafter\def\csname LT7\endcsname{\color{black}}% + \expandafter\def\csname LT8\endcsname{\color{black}}% + \fi + \fi + \setlength{\unitlength}{0.0500bp}% + \ifx\gptboxheight\undefined% + \newlength{\gptboxheight}% + \newlength{\gptboxwidth}% + \newsavebox{\gptboxtext}% + \fi% + \setlength{\fboxrule}{0.5pt}% + \setlength{\fboxsep}{1pt}% + \definecolor{tbcol}{rgb}{1,1,1}% +\begin{picture}(7200.00,3600.00)% + \gplgaddtomacro\gplbacktext{% + \csname LTb\endcsname%% + \put(820,865){\makebox(0,0)[r]{\strut{}$10^{-6}$}}% + \csname 
LTb\endcsname%% + \put(820,1285){\makebox(0,0)[r]{\strut{}$10^{-4}$}}% + \csname LTb\endcsname%% + \put(820,1705){\makebox(0,0)[r]{\strut{}$10^{-2}$}}% + \csname LTb\endcsname%% + \put(820,2125){\makebox(0,0)[r]{\strut{}$10^{0}$}}% + \csname LTb\endcsname%% + \put(820,2545){\makebox(0,0)[r]{\strut{}$10^{2}$}}% + \csname LTb\endcsname%% + \put(820,2965){\makebox(0,0)[r]{\strut{}$10^{4}$}}% + \csname LTb\endcsname%% + \put(1323,450){\makebox(0,0){\strut{}$100$}}% + \csname LTb\endcsname%% + \put(3843,450){\makebox(0,0){\strut{}$1000$}}% + \csname LTb\endcsname%% + \put(6364,450){\makebox(0,0){\strut{}$10000$}}% + }% + \gplgaddtomacro\gplfronttext{% + \csname LTb\endcsname%% + \put(3134,3395){\makebox(0,0)[r]{\strut{}\texttt{gfortran}: \texttt{matmul}}}% + \csname LTb\endcsname%% + \put(3134,3190){\makebox(0,0)[r]{\strut{}\texttt{gfortran}: OpenBLAS}}% + \csname LTb\endcsname%% + \put(6016,3395){\makebox(0,0)[r]{\strut{}\texttt{ifx}: \texttt{matmul}}}% + \csname LTb\endcsname%% + \put(6016,3190){\makebox(0,0)[r]{\strut{}\texttt{ifx}: MKL BLAS}}% + \csname LTb\endcsname%% + \put(186,1810){\rotatebox{-270.00}{\makebox(0,0){\strut{}Wall Time [s]}}}% + \csname LTb\endcsname%% + \put(3888,143){\makebox(0,0){\strut{}Size [$N \times N$]}}% + }% + \gplbacktext + \put(0,0){\includegraphics[width={360.00bp},height={180.00bp}]{f3_compilers_scaling}}% + \gplfronttext + \end{picture}% +\endgroup diff --git a/report/figures/f4_compilers_scaling.pdf b/report/figures/f4_compilers_scaling.pdf new file mode 100644 index 0000000..6ea6095 Binary files /dev/null and b/report/figures/f4_compilers_scaling.pdf differ diff --git a/report/figures/f4_compilers_scaling.tex b/report/figures/f4_compilers_scaling.tex new file mode 100644 index 0000000..b3e4728 --- /dev/null +++ b/report/figures/f4_compilers_scaling.tex @@ -0,0 +1,124 @@ +% GNUPLOT: LaTeX picture with Postscript +\begingroup + \makeatletter + \providecommand\color[2][]{% + \GenericError{(gnuplot) \space\space\space\@spaces}{% + 
Package color not loaded in conjunction with + terminal option `colourtext'% + }{See the gnuplot documentation for explanation.% + }{Either use 'blacktext' in gnuplot or load the package + color.sty in LaTeX.}% + \renewcommand\color[2][]{}% + }% + \providecommand\includegraphics[2][]{% + \GenericError{(gnuplot) \space\space\space\@spaces}{% + Package graphicx or graphics not loaded% + }{See the gnuplot documentation for explanation.% + }{The gnuplot epslatex terminal needs graphicx.sty or graphics.sty.}% + \renewcommand\includegraphics[2][]{}% + }% + \providecommand\rotatebox[2]{#2}% + \@ifundefined{ifGPcolor}{% + \newif\ifGPcolor + \GPcolortrue + }{}% + \@ifundefined{ifGPblacktext}{% + \newif\ifGPblacktext + \GPblacktexttrue + }{}% + % define a \g@addto@macro without @ in the name: + \let\gplgaddtomacro\g@addto@macro + % define empty templates for all commands taking text: + \gdef\gplbacktext{}% + \gdef\gplfronttext{}% + \makeatother + \ifGPblacktext + % no textcolor at all + \def\colorrgb#1{}% + \def\colorgray#1{}% + \else + % gray or color? 
+ \ifGPcolor + \def\colorrgb#1{\color[rgb]{#1}}% + \def\colorgray#1{\color[gray]{#1}}% + \expandafter\def\csname LTw\endcsname{\color{white}}% + \expandafter\def\csname LTb\endcsname{\color{black}}% + \expandafter\def\csname LTa\endcsname{\color{black}}% + \expandafter\def\csname LT0\endcsname{\color[rgb]{1,0,0}}% + \expandafter\def\csname LT1\endcsname{\color[rgb]{0,1,0}}% + \expandafter\def\csname LT2\endcsname{\color[rgb]{0,0,1}}% + \expandafter\def\csname LT3\endcsname{\color[rgb]{1,0,1}}% + \expandafter\def\csname LT4\endcsname{\color[rgb]{0,1,1}}% + \expandafter\def\csname LT5\endcsname{\color[rgb]{1,1,0}}% + \expandafter\def\csname LT6\endcsname{\color[rgb]{0,0,0}}% + \expandafter\def\csname LT7\endcsname{\color[rgb]{1,0.3,0}}% + \expandafter\def\csname LT8\endcsname{\color[rgb]{0.5,0.5,0.5}}% + \else + % gray + \def\colorrgb#1{\color{black}}% + \def\colorgray#1{\color[gray]{#1}}% + \expandafter\def\csname LTw\endcsname{\color{white}}% + \expandafter\def\csname LTb\endcsname{\color{black}}% + \expandafter\def\csname LTa\endcsname{\color{black}}% + \expandafter\def\csname LT0\endcsname{\color{black}}% + \expandafter\def\csname LT1\endcsname{\color{black}}% + \expandafter\def\csname LT2\endcsname{\color{black}}% + \expandafter\def\csname LT3\endcsname{\color{black}}% + \expandafter\def\csname LT4\endcsname{\color{black}}% + \expandafter\def\csname LT5\endcsname{\color{black}}% + \expandafter\def\csname LT6\endcsname{\color{black}}% + \expandafter\def\csname LT7\endcsname{\color{black}}% + \expandafter\def\csname LT8\endcsname{\color{black}}% + \fi + \fi + \setlength{\unitlength}{0.0500bp}% + \ifx\gptboxheight\undefined% + \newlength{\gptboxheight}% + \newlength{\gptboxwidth}% + \newsavebox{\gptboxtext}% + \fi% + \setlength{\fboxrule}{0.5pt}% + \setlength{\fboxsep}{1pt}% + \definecolor{tbcol}{rgb}{1,1,1}% +\begin{picture}(7200.00,3600.00)% + \gplgaddtomacro\gplbacktext{% + \csname LTb\endcsname%% + \put(820,655){\makebox(0,0)[r]{\strut{}$10^{-8}$}}% + \csname 
LTb\endcsname%% + \put(820,1040){\makebox(0,0)[r]{\strut{}$10^{-6}$}}% + \csname LTb\endcsname%% + \put(820,1425){\makebox(0,0)[r]{\strut{}$10^{-4}$}}% + \csname LTb\endcsname%% + \put(820,1810){\makebox(0,0)[r]{\strut{}$10^{-2}$}}% + \csname LTb\endcsname%% + \put(820,2195){\makebox(0,0)[r]{\strut{}$10^{0}$}}% + \csname LTb\endcsname%% + \put(820,2580){\makebox(0,0)[r]{\strut{}$10^{2}$}}% + \csname LTb\endcsname%% + \put(820,2965){\makebox(0,0)[r]{\strut{}$10^{4}$}}% + \csname LTb\endcsname%% + \put(1913,450){\makebox(0,0){\strut{}$100$}}% + \csname LTb\endcsname%% + \put(4378,450){\makebox(0,0){\strut{}$1000$}}% + \csname LTb\endcsname%% + \put(6843,450){\makebox(0,0){\strut{}$10000$}}% + }% + \gplgaddtomacro\gplfronttext{% + \csname LTb\endcsname%% + \put(3134,3395){\makebox(0,0)[r]{\strut{}\texttt{gfortran}: Row-major}}% + \csname LTb\endcsname%% + \put(3134,3190){\makebox(0,0)[r]{\strut{}\texttt{gfortran}: Col.-major}}% + \csname LTb\endcsname%% + \put(6240,3395){\makebox(0,0)[r]{\strut{}\texttt{ifx}: Row-major}}% + \csname LTb\endcsname%% + \put(6240,3190){\makebox(0,0)[r]{\strut{}\texttt{ifx}: Col.-major}}% + \csname LTb\endcsname%% + \put(186,1810){\rotatebox{-270.00}{\makebox(0,0){\strut{}Wall Time [s]}}}% + \csname LTb\endcsname%% + \put(3888,143){\makebox(0,0){\strut{}Size [$N \times N$]}}% + }% + \gplbacktext + \put(0,0){\includegraphics[width={360.00bp},height={180.00bp}]{f4_compilers_scaling}}% + \gplfronttext + \end{picture}% +\endgroup diff --git a/report/figures/f5_compilers_scaling.pdf b/report/figures/f5_compilers_scaling.pdf new file mode 100644 index 0000000..af6f1df Binary files /dev/null and b/report/figures/f5_compilers_scaling.pdf differ diff --git a/report/figures/f5_compilers_scaling.tex b/report/figures/f5_compilers_scaling.tex new file mode 100644 index 0000000..188d766 --- /dev/null +++ b/report/figures/f5_compilers_scaling.tex @@ -0,0 +1,122 @@ +% GNUPLOT: LaTeX picture with Postscript +\begingroup + \makeatletter + 
\providecommand\color[2][]{% + \GenericError{(gnuplot) \space\space\space\@spaces}{% + Package color not loaded in conjunction with + terminal option `colourtext'% + }{See the gnuplot documentation for explanation.% + }{Either use 'blacktext' in gnuplot or load the package + color.sty in LaTeX.}% + \renewcommand\color[2][]{}% + }% + \providecommand\includegraphics[2][]{% + \GenericError{(gnuplot) \space\space\space\@spaces}{% + Package graphicx or graphics not loaded% + }{See the gnuplot documentation for explanation.% + }{The gnuplot epslatex terminal needs graphicx.sty or graphics.sty.}% + \renewcommand\includegraphics[2][]{}% + }% + \providecommand\rotatebox[2]{#2}% + \@ifundefined{ifGPcolor}{% + \newif\ifGPcolor + \GPcolortrue + }{}% + \@ifundefined{ifGPblacktext}{% + \newif\ifGPblacktext + \GPblacktexttrue + }{}% + % define a \g@addto@macro without @ in the name: + \let\gplgaddtomacro\g@addto@macro + % define empty templates for all commands taking text: + \gdef\gplbacktext{}% + \gdef\gplfronttext{}% + \makeatother + \ifGPblacktext + % no textcolor at all + \def\colorrgb#1{}% + \def\colorgray#1{}% + \else + % gray or color? 
+ \ifGPcolor + \def\colorrgb#1{\color[rgb]{#1}}% + \def\colorgray#1{\color[gray]{#1}}% + \expandafter\def\csname LTw\endcsname{\color{white}}% + \expandafter\def\csname LTb\endcsname{\color{black}}% + \expandafter\def\csname LTa\endcsname{\color{black}}% + \expandafter\def\csname LT0\endcsname{\color[rgb]{1,0,0}}% + \expandafter\def\csname LT1\endcsname{\color[rgb]{0,1,0}}% + \expandafter\def\csname LT2\endcsname{\color[rgb]{0,0,1}}% + \expandafter\def\csname LT3\endcsname{\color[rgb]{1,0,1}}% + \expandafter\def\csname LT4\endcsname{\color[rgb]{0,1,1}}% + \expandafter\def\csname LT5\endcsname{\color[rgb]{1,1,0}}% + \expandafter\def\csname LT6\endcsname{\color[rgb]{0,0,0}}% + \expandafter\def\csname LT7\endcsname{\color[rgb]{1,0.3,0}}% + \expandafter\def\csname LT8\endcsname{\color[rgb]{0.5,0.5,0.5}}% + \else + % gray + \def\colorrgb#1{\color{black}}% + \def\colorgray#1{\color[gray]{#1}}% + \expandafter\def\csname LTw\endcsname{\color{white}}% + \expandafter\def\csname LTb\endcsname{\color{black}}% + \expandafter\def\csname LTa\endcsname{\color{black}}% + \expandafter\def\csname LT0\endcsname{\color{black}}% + \expandafter\def\csname LT1\endcsname{\color{black}}% + \expandafter\def\csname LT2\endcsname{\color{black}}% + \expandafter\def\csname LT3\endcsname{\color{black}}% + \expandafter\def\csname LT4\endcsname{\color{black}}% + \expandafter\def\csname LT5\endcsname{\color{black}}% + \expandafter\def\csname LT6\endcsname{\color{black}}% + \expandafter\def\csname LT7\endcsname{\color{black}}% + \expandafter\def\csname LT8\endcsname{\color{black}}% + \fi + \fi + \setlength{\unitlength}{0.0500bp}% + \ifx\gptboxheight\undefined% + \newlength{\gptboxheight}% + \newlength{\gptboxwidth}% + \newsavebox{\gptboxtext}% + \fi% + \setlength{\fboxrule}{0.5pt}% + \setlength{\fboxsep}{1pt}% + \definecolor{tbcol}{rgb}{1,1,1}% +\begin{picture}(7200.00,3600.00)% + \gplgaddtomacro\gplbacktext{% + \csname LTb\endcsname%% + \put(820,865){\makebox(0,0)[r]{\strut{}$10^{-6}$}}% + \csname 
LTb\endcsname%% + \put(820,1285){\makebox(0,0)[r]{\strut{}$10^{-4}$}}% + \csname LTb\endcsname%% + \put(820,1705){\makebox(0,0)[r]{\strut{}$10^{-2}$}}% + \csname LTb\endcsname%% + \put(820,2125){\makebox(0,0)[r]{\strut{}$10^{0}$}}% + \csname LTb\endcsname%% + \put(820,2545){\makebox(0,0)[r]{\strut{}$10^{2}$}}% + \csname LTb\endcsname%% + \put(820,2965){\makebox(0,0)[r]{\strut{}$10^{4}$}}% + \csname LTb\endcsname%% + \put(1323,450){\makebox(0,0){\strut{}$100$}}% + \csname LTb\endcsname%% + \put(3843,450){\makebox(0,0){\strut{}$1000$}}% + \csname LTb\endcsname%% + \put(6364,450){\makebox(0,0){\strut{}$10000$}}% + }% + \gplgaddtomacro\gplfronttext{% + \csname LTb\endcsname%% + \put(3134,3395){\makebox(0,0)[r]{\strut{}\texttt{gfortran}: \texttt{matmul}}}% + \csname LTb\endcsname%% + \put(3134,3190){\makebox(0,0)[r]{\strut{}\texttt{gfortran}: OpenBLAS}}% + \csname LTb\endcsname%% + \put(6016,3395){\makebox(0,0)[r]{\strut{}\texttt{ifx}: \texttt{matmul}}}% + \csname LTb\endcsname%% + \put(6016,3190){\makebox(0,0)[r]{\strut{}\texttt{ifx}: MKL BLAS}}% + \csname LTb\endcsname%% + \put(186,1810){\rotatebox{-270.00}{\makebox(0,0){\strut{}Wall Time [s]}}}% + \csname LTb\endcsname%% + \put(3888,143){\makebox(0,0){\strut{}Size [$N \times N$]}}% + }% + \gplbacktext + \put(0,0){\includegraphics[width={360.00bp},height={180.00bp}]{f5_compilers_scaling}}% + \gplfronttext + \end{picture}% +\endgroup diff --git a/report/figures/f6_optflags_scaling.pdf b/report/figures/f6_optflags_scaling.pdf new file mode 100644 index 0000000..d90f1ac Binary files /dev/null and b/report/figures/f6_optflags_scaling.pdf differ diff --git a/report/figures/f6_optflags_scaling.tex b/report/figures/f6_optflags_scaling.tex new file mode 100644 index 0000000..54ceb56 --- /dev/null +++ b/report/figures/f6_optflags_scaling.tex @@ -0,0 +1,122 @@ +% GNUPLOT: LaTeX picture with Postscript +\begingroup + \makeatletter + \providecommand\color[2][]{% + \GenericError{(gnuplot) \space\space\space\@spaces}{% + Package 
color not loaded in conjunction with + terminal option `colourtext'% + }{See the gnuplot documentation for explanation.% + }{Either use 'blacktext' in gnuplot or load the package + color.sty in LaTeX.}% + \renewcommand\color[2][]{}% + }% + \providecommand\includegraphics[2][]{% + \GenericError{(gnuplot) \space\space\space\@spaces}{% + Package graphicx or graphics not loaded% + }{See the gnuplot documentation for explanation.% + }{The gnuplot epslatex terminal needs graphicx.sty or graphics.sty.}% + \renewcommand\includegraphics[2][]{}% + }% + \providecommand\rotatebox[2]{#2}% + \@ifundefined{ifGPcolor}{% + \newif\ifGPcolor + \GPcolortrue + }{}% + \@ifundefined{ifGPblacktext}{% + \newif\ifGPblacktext + \GPblacktexttrue + }{}% + % define a \g@addto@macro without @ in the name: + \let\gplgaddtomacro\g@addto@macro + % define empty templates for all commands taking text: + \gdef\gplbacktext{}% + \gdef\gplfronttext{}% + \makeatother + \ifGPblacktext + % no textcolor at all + \def\colorrgb#1{}% + \def\colorgray#1{}% + \else + % gray or color? 
+ \ifGPcolor + \def\colorrgb#1{\color[rgb]{#1}}% + \def\colorgray#1{\color[gray]{#1}}% + \expandafter\def\csname LTw\endcsname{\color{white}}% + \expandafter\def\csname LTb\endcsname{\color{black}}% + \expandafter\def\csname LTa\endcsname{\color{black}}% + \expandafter\def\csname LT0\endcsname{\color[rgb]{1,0,0}}% + \expandafter\def\csname LT1\endcsname{\color[rgb]{0,1,0}}% + \expandafter\def\csname LT2\endcsname{\color[rgb]{0,0,1}}% + \expandafter\def\csname LT3\endcsname{\color[rgb]{1,0,1}}% + \expandafter\def\csname LT4\endcsname{\color[rgb]{0,1,1}}% + \expandafter\def\csname LT5\endcsname{\color[rgb]{1,1,0}}% + \expandafter\def\csname LT6\endcsname{\color[rgb]{0,0,0}}% + \expandafter\def\csname LT7\endcsname{\color[rgb]{1,0.3,0}}% + \expandafter\def\csname LT8\endcsname{\color[rgb]{0.5,0.5,0.5}}% + \else + % gray + \def\colorrgb#1{\color{black}}% + \def\colorgray#1{\color[gray]{#1}}% + \expandafter\def\csname LTw\endcsname{\color{white}}% + \expandafter\def\csname LTb\endcsname{\color{black}}% + \expandafter\def\csname LTa\endcsname{\color{black}}% + \expandafter\def\csname LT0\endcsname{\color{black}}% + \expandafter\def\csname LT1\endcsname{\color{black}}% + \expandafter\def\csname LT2\endcsname{\color{black}}% + \expandafter\def\csname LT3\endcsname{\color{black}}% + \expandafter\def\csname LT4\endcsname{\color{black}}% + \expandafter\def\csname LT5\endcsname{\color{black}}% + \expandafter\def\csname LT6\endcsname{\color{black}}% + \expandafter\def\csname LT7\endcsname{\color{black}}% + \expandafter\def\csname LT8\endcsname{\color{black}}% + \fi + \fi + \setlength{\unitlength}{0.0500bp}% + \ifx\gptboxheight\undefined% + \newlength{\gptboxheight}% + \newlength{\gptboxwidth}% + \newsavebox{\gptboxtext}% + \fi% + \setlength{\fboxrule}{0.5pt}% + \setlength{\fboxsep}{1pt}% + \definecolor{tbcol}{rgb}{1,1,1}% +\begin{picture}(7200.00,3600.00)% + \gplgaddtomacro\gplbacktext{% + \csname LTb\endcsname%% + \put(820,865){\makebox(0,0)[r]{\strut{}$10^{-6}$}}% + \csname 
LTb\endcsname%% + \put(820,1285){\makebox(0,0)[r]{\strut{}$10^{-4}$}}% + \csname LTb\endcsname%% + \put(820,1705){\makebox(0,0)[r]{\strut{}$10^{-2}$}}% + \csname LTb\endcsname%% + \put(820,2125){\makebox(0,0)[r]{\strut{}$10^{0}$}}% + \csname LTb\endcsname%% + \put(820,2545){\makebox(0,0)[r]{\strut{}$10^{2}$}}% + \csname LTb\endcsname%% + \put(820,2965){\makebox(0,0)[r]{\strut{}$10^{4}$}}% + \csname LTb\endcsname%% + \put(1913,450){\makebox(0,0){\strut{}$100$}}% + \csname LTb\endcsname%% + \put(4378,450){\makebox(0,0){\strut{}$1000$}}% + \csname LTb\endcsname%% + \put(6843,450){\makebox(0,0){\strut{}$10000$}}% + }% + \gplgaddtomacro\gplfronttext{% + \csname LTb\endcsname%% + \put(3134,3395){\makebox(0,0)[r]{\strut{}\texttt{gfortran}: O1}}% + \csname LTb\endcsname%% + \put(3134,3190){\makebox(0,0)[r]{\strut{}\texttt{gfortran}: O2}}% + \csname LTb\endcsname%% + \put(5680,3395){\makebox(0,0)[r]{\strut{}\texttt{gfortran}: O3}}% + \csname LTb\endcsname%% + \put(5680,3190){\makebox(0,0)[r]{\strut{}\texttt{gfortran}: Ofast}}% + \csname LTb\endcsname%% + \put(186,1810){\rotatebox{-270.00}{\makebox(0,0){\strut{}Wall Time [s]}}}% + \csname LTb\endcsname%% + \put(3888,143){\makebox(0,0){\strut{}Size [$N \times N$]}}% + }% + \gplbacktext + \put(0,0){\includegraphics[width={360.00bp},height={180.00bp}]{f6_optflags_scaling}}% + \gplfronttext + \end{picture}% +\endgroup diff --git a/report/figures/f7_optflags_scaling.pdf b/report/figures/f7_optflags_scaling.pdf new file mode 100644 index 0000000..8b608b7 Binary files /dev/null and b/report/figures/f7_optflags_scaling.pdf differ diff --git a/report/figures/f7_optflags_scaling.tex b/report/figures/f7_optflags_scaling.tex new file mode 100644 index 0000000..7f9fae6 --- /dev/null +++ b/report/figures/f7_optflags_scaling.tex @@ -0,0 +1,124 @@ +% GNUPLOT: LaTeX picture with Postscript +\begingroup + \makeatletter + \providecommand\color[2][]{% + \GenericError{(gnuplot) \space\space\space\@spaces}{% + Package color not loaded in 
conjunction with + terminal option `colourtext'% + }{See the gnuplot documentation for explanation.% + }{Either use 'blacktext' in gnuplot or load the package + color.sty in LaTeX.}% + \renewcommand\color[2][]{}% + }% + \providecommand\includegraphics[2][]{% + \GenericError{(gnuplot) \space\space\space\@spaces}{% + Package graphicx or graphics not loaded% + }{See the gnuplot documentation for explanation.% + }{The gnuplot epslatex terminal needs graphicx.sty or graphics.sty.}% + \renewcommand\includegraphics[2][]{}% + }% + \providecommand\rotatebox[2]{#2}% + \@ifundefined{ifGPcolor}{% + \newif\ifGPcolor + \GPcolortrue + }{}% + \@ifundefined{ifGPblacktext}{% + \newif\ifGPblacktext + \GPblacktexttrue + }{}% + % define a \g@addto@macro without @ in the name: + \let\gplgaddtomacro\g@addto@macro + % define empty templates for all commands taking text: + \gdef\gplbacktext{}% + \gdef\gplfronttext{}% + \makeatother + \ifGPblacktext + % no textcolor at all + \def\colorrgb#1{}% + \def\colorgray#1{}% + \else + % gray or color? 
+ \ifGPcolor + \def\colorrgb#1{\color[rgb]{#1}}% + \def\colorgray#1{\color[gray]{#1}}% + \expandafter\def\csname LTw\endcsname{\color{white}}% + \expandafter\def\csname LTb\endcsname{\color{black}}% + \expandafter\def\csname LTa\endcsname{\color{black}}% + \expandafter\def\csname LT0\endcsname{\color[rgb]{1,0,0}}% + \expandafter\def\csname LT1\endcsname{\color[rgb]{0,1,0}}% + \expandafter\def\csname LT2\endcsname{\color[rgb]{0,0,1}}% + \expandafter\def\csname LT3\endcsname{\color[rgb]{1,0,1}}% + \expandafter\def\csname LT4\endcsname{\color[rgb]{0,1,1}}% + \expandafter\def\csname LT5\endcsname{\color[rgb]{1,1,0}}% + \expandafter\def\csname LT6\endcsname{\color[rgb]{0,0,0}}% + \expandafter\def\csname LT7\endcsname{\color[rgb]{1,0.3,0}}% + \expandafter\def\csname LT8\endcsname{\color[rgb]{0.5,0.5,0.5}}% + \else + % gray + \def\colorrgb#1{\color{black}}% + \def\colorgray#1{\color[gray]{#1}}% + \expandafter\def\csname LTw\endcsname{\color{white}}% + \expandafter\def\csname LTb\endcsname{\color{black}}% + \expandafter\def\csname LTa\endcsname{\color{black}}% + \expandafter\def\csname LT0\endcsname{\color{black}}% + \expandafter\def\csname LT1\endcsname{\color{black}}% + \expandafter\def\csname LT2\endcsname{\color{black}}% + \expandafter\def\csname LT3\endcsname{\color{black}}% + \expandafter\def\csname LT4\endcsname{\color{black}}% + \expandafter\def\csname LT5\endcsname{\color{black}}% + \expandafter\def\csname LT6\endcsname{\color{black}}% + \expandafter\def\csname LT7\endcsname{\color{black}}% + \expandafter\def\csname LT8\endcsname{\color{black}}% + \fi + \fi + \setlength{\unitlength}{0.0500bp}% + \ifx\gptboxheight\undefined% + \newlength{\gptboxheight}% + \newlength{\gptboxwidth}% + \newsavebox{\gptboxtext}% + \fi% + \setlength{\fboxrule}{0.5pt}% + \setlength{\fboxsep}{1pt}% + \definecolor{tbcol}{rgb}{1,1,1}% +\begin{picture}(7200.00,3600.00)% + \gplgaddtomacro\gplbacktext{% + \csname LTb\endcsname%% + \put(820,655){\makebox(0,0)[r]{\strut{}$10^{-8}$}}% + \csname 
LTb\endcsname%% + \put(820,1040){\makebox(0,0)[r]{\strut{}$10^{-6}$}}% + \csname LTb\endcsname%% + \put(820,1425){\makebox(0,0)[r]{\strut{}$10^{-4}$}}% + \csname LTb\endcsname%% + \put(820,1810){\makebox(0,0)[r]{\strut{}$10^{-2}$}}% + \csname LTb\endcsname%% + \put(820,2195){\makebox(0,0)[r]{\strut{}$10^{0}$}}% + \csname LTb\endcsname%% + \put(820,2580){\makebox(0,0)[r]{\strut{}$10^{2}$}}% + \csname LTb\endcsname%% + \put(820,2965){\makebox(0,0)[r]{\strut{}$10^{4}$}}% + \csname LTb\endcsname%% + \put(1913,450){\makebox(0,0){\strut{}$100$}}% + \csname LTb\endcsname%% + \put(4378,450){\makebox(0,0){\strut{}$1000$}}% + \csname LTb\endcsname%% + \put(6843,450){\makebox(0,0){\strut{}$10000$}}% + }% + \gplgaddtomacro\gplfronttext{% + \csname LTb\endcsname%% + \put(3134,3395){\makebox(0,0)[r]{\strut{}\texttt{ifx}: O1}}% + \csname LTb\endcsname%% + \put(3134,3190){\makebox(0,0)[r]{\strut{}\texttt{ifx}: O2}}% + \csname LTb\endcsname%% + \put(5120,3395){\makebox(0,0)[r]{\strut{}\texttt{ifx}: O3}}% + \csname LTb\endcsname%% + \put(5120,3190){\makebox(0,0)[r]{\strut{}\texttt{ifx}: Ofast}}% + \csname LTb\endcsname%% + \put(186,1810){\rotatebox{-270.00}{\makebox(0,0){\strut{}Wall Time [s]}}}% + \csname LTb\endcsname%% + \put(3888,143){\makebox(0,0){\strut{}Size [$N \times N$]}}% + }% + \gplbacktext + \put(0,0){\includegraphics[width={360.00bp},height={180.00bp}]{f7_optflags_scaling}}% + \gplfronttext + \end{picture}% +\endgroup diff --git a/report/figures/gfortran_O3_serial.csv b/report/figures/gfortran_O3_serial.csv new file mode 100644 index 0000000..5686747 --- /dev/null +++ b/report/figures/gfortran_O3_serial.csv @@ -0,0 +1,52 @@ +100,0.83196300E-03,0.82436000E-03,0.82171000E-04,0.40903000E-04 +200,0.84310250E-02,0.81942280E-02,0.52900100E-03,0.35716000E-03 +300,0.30393838E-01,0.29753641E-01,0.13883800E-02,0.11548400E-02 +400,0.75706575E-01,0.72053057E-01,0.26542930E-02,0.26334740E-02 +500,0.14779813E+00,0.13896792E+00,0.50301090E-02,0.48926140E-02 
+600,0.25050676E+00,0.23771815E+00,0.86409790E-02,0.84664220E-02 +700,0.40370530E+00,0.38789537E+00,0.13572686E-01,0.13392029E-01 +800,0.62435679E+00,0.69020772E+00,0.20599722E-01,0.20583156E-01 +900,0.92557958E+00,0.97868840E+00,0.29087199E-01,0.29092604E-01 +1000,0.12971958E+01,0.13472624E+01,0.40578720E-01,0.40631869E-01 +1100,0.17403942E+01,0.19294426E+01,0.53757086E-01,0.54524503E-01 +1200,0.22731768E+01,0.26668477E+01,0.68460332E-01,0.69950589E-01 +1300,0.29280082E+01,0.33949951E+01,0.88916825E-01,0.91294859E-01 +1400,0.35930989E+01,0.41113147E+01,0.11034260E+00,0.11363157E+00 +1500,0.44426296E+01,0.53547077E+01,0.13540845E+00,0.14067237E+00 +1600,0.54982263E+01,0.79132809E+01,0.17527097E+00,0.17639820E+00 +1700,0.68705292E+01,0.85675598E+01,0.20611171E+00,0.21453854E+00 +1800,0.85638411E+01,0.10256766E+02,0.24548081E+00,0.25602355E+00 +1900,0.97956918E+01,0.12504037E+02,0.29145721E+00,0.29859006E+00 +2000,0.19977299E+02,0.22947921E+02,0.31671464E+00,0.33806302E+00 +2100,0.21728356E+02,0.24098549E+02,0.37766086E+00,0.40404478E+00 +2200,0.30368333E+02,0.31722219E+02,0.42580020E+00,0.45154765E+00 +2300,0.38040478E+02,0.39322543E+02,0.49845491E+00,0.52755086E+00 +2400,0.49238694E+02,0.53578220E+02,0.57475876E+00,0.60260881E+00 +2500,0.60229746E+02,0.60307600E+02,0.65482310E+00,0.69371856E+00 +2600,0.72275943E+02,0.75698785E+02,0.72118898E+00,0.76456032E+00 +2700,0.88066671E+02,0.85564199E+02,0.81734604E+00,0.86148218E+00 +2800,0.10227876E+03,0.10637486E+03,0.89947522E+00,0.95027684E+00 +2900,0.11620340E+03,0.11244430E+03,0.10111145E+01,0.10586032E+01 +3000,0.13147382E+03,0.13369315E+03,0.11102709E+01,0.11684749E+01 +3100,0.14999620E+03,0.14414675E+03,0.12802729E+01,0.13289489E+01 +3200,0.18354226E+03,0.19611960E+03,0.14315322E+01,0.14602543E+01 +3300,0.18601760E+03,0.18076827E+03,0.15415264E+01,0.15960495E+01 +3400,0.20476938E+03,0.21299748E+03,0.16521923E+01,0.16990593E+01 +3500,0.22834303E+03,0.22285553E+03,0.18681888E+01,0.19161202E+01 
+4000,-1.00000000E+00,-1.00000000E+00,0.28359602E+01,0.28575599E+01 +4500,-1.00000000E+00,-1.00000000E+00,0.40505999E+01,0.40985922E+01 +5000,-1.00000000E+00,-1.00000000E+00,0.55805927E+01,0.56317293E+01 +5500,-1.00000000E+00,-1.00000000E+00,0.74133843E+01,0.74104958E+01 +6000,-1.00000000E+00,-1.00000000E+00,0.95258379E+01,0.95492209E+01 +6500,-1.00000000E+00,-1.00000000E+00,0.12021052E+02,0.12031542E+02 +7000,-1.00000000E+00,-1.00000000E+00,0.14963398E+02,0.15090944E+02 +7500,-1.00000000E+00,-1.00000000E+00,0.18778133E+02,0.18914046E+02 +8000,-1.00000000E+00,-1.00000000E+00,0.22653876E+02,0.22470571E+02 +8500,-1.00000000E+00,-1.00000000E+00,0.26873721E+02,0.27407130E+02 +9000,-1.00000000E+00,-1.00000000E+00,0.32200993E+02,0.31895406E+02 +9500,-1.00000000E+00,-1.00000000E+00,0.37974351E+02,0.38280771E+02 +10000,-1.00000000E+00,-1.00000000E+00,0.43953310E+02,0.44048979E+02 +10500,-1.00000000E+00,-1.00000000E+00,0.51627049E+02,0.50738458E+02 +11000,-1.00000000E+00,-1.00000000E+00,0.59155068E+02,0.58639799E+02 +11500,-1.00000000E+00,-1.00000000E+00,0.67404317E+02,0.66714712E+02 +12000,-1.00000000E+00,-1.00000000E+00,0.76974160E+02,0.75930372E+02 diff --git a/report/figures/gfortran_rowloop_opt.csv b/report/figures/gfortran_rowloop_opt.csv new file mode 100644 index 0000000..b412bd8 --- /dev/null +++ b/report/figures/gfortran_rowloop_opt.csv @@ -0,0 +1,141 @@ +opt,size,matmul +O1,100,0.15843390E-02 +O2,100,0.91776000E-03 +O3,100,0.83196300E-03 +Ofast,100,0.30917400E-03 +O1,200,0.15226468E-01 +O2,200,0.88798160E-02 +O3,200,0.84310250E-02 +Ofast,200,0.35476020E-02 +O1,300,0.50955954E-01 +O2,300,0.31395742E-01 +O3,300,0.30393838E-01 +Ofast,300,0.12742578E-01 +O1,400,0.12773344E+00 +O2,400,0.78643620E-01 +O3,400,0.75706575E-01 +Ofast,400,0.42815258E-01 +O1,500,0.24604570E+00 +O2,500,0.15303675E+00 +O3,500,0.14779813E+00 +Ofast,500,0.61111429E-01 +O1,600,0.43114100E+00 +O2,600,0.25507298E+00 +O3,600,0.25050676E+00 +Ofast,600,0.10847798E+00 +O1,700,0.69199010E+00 
+O2,700,0.40859331E+00 +O3,700,0.40370530E+00 +Ofast,700,0.20581741E+00 +O1,800,0.10717053E+01 +O2,800,0.63825526E+00 +O3,800,0.62435679E+00 +Ofast,800,0.52888689E+00 +O1,900,0.15404577E+01 +O2,900,0.93850974E+00 +O3,900,0.92557958E+00 +Ofast,900,0.54681181E+00 +O1,1000,0.27305068E+01 +O2,1000,0.13441181E+01 +O3,1000,0.12971958E+01 +Ofast,1000,0.78722030E+00 +O1,1100,0.36062488E+01 +O2,1100,0.17628016E+01 +O3,1100,0.17403942E+01 +Ofast,1100,0.10706449E+01 +O1,1200,0.46450021E+01 +O2,1200,0.23031509E+01 +O3,1200,0.22731768E+01 +Ofast,1200,0.14552126E+01 +O1,1300,0.59029006E+01 +O2,1300,0.29607831E+01 +O3,1300,0.29280082E+01 +Ofast,1300,0.19152277E+01 +O1,1400,0.74960709E+01 +O2,1400,0.36552327E+01 +O3,1400,0.35930989E+01 +Ofast,1400,0.22676895E+01 +O1,1500,0.93026917E+01 +O2,1500,0.45110176E+01 +O3,1500,0.44426296E+01 +Ofast,1500,0.28225538E+01 +O1,1600,0.11342043E+02 +O2,1600,0.55577301E+01 +O3,1600,0.54982263E+01 +Ofast,1600,0.44651484E+01 +O1,1700,0.13274264E+02 +O2,1700,0.69197675E+01 +O3,1700,0.68705292E+01 +Ofast,1700,0.55033843E+01 +O1,1800,0.15669101E+02 +O2,1800,0.84757305E+01 +O3,1800,0.85638411E+01 +Ofast,1800,0.82615895E+01 +O1,1900,0.18839968E+02 +O2,1900,0.97958641E+01 +O3,1900,0.97956918E+01 +Ofast,1900,0.83408876E+01 +O1,2000,0.23471672E+02 +O2,2000,0.17688268E+02 +O3,2000,0.19977299E+02 +Ofast,2000,0.20366439E+02 +O1,2100,0.25537293E+02 +O2,2100,0.18367017E+02 +O3,2100,0.21728356E+02 +Ofast,2100,0.24215233E+02 +O1,2200,0.30945931E+02 +O2,2200,0.25050362E+02 +O3,2200,0.30368333E+02 +Ofast,2200,0.33078015E+02 +O1,2300,0.37129506E+02 +O2,2300,0.33096253E+02 +O3,2300,0.38040478E+02 +Ofast,2300,0.42665518E+02 +O1,2400,0.46662185E+02 +O2,2400,0.42657981E+02 +O3,2400,0.49238694E+02 +Ofast,2400,0.54617642E+02 +O1,2500,0.56352622E+02 +O2,2500,0.50056533E+02 +O3,2500,0.60229746E+02 +Ofast,2500,0.66109200E+02 +O1,2600,0.68959785E+02 +O2,2600,0.59790048E+02 +O3,2600,0.72275943E+02 +Ofast,2600,0.79140537E+02 +O1,2700,0.81912480E+02 +O2,2700,0.71778559E+02 
+O3,2700,0.88066671E+02 +Ofast,2700,0.93871874E+02 +O1,2800,0.95063966E+02 +O2,2800,0.84949950E+02 +O3,2800,0.10227876E+03 +Ofast,2800,0.11033462E+03 +O1,2900,0.11009257E+03 +O2,2900,0.95040378E+02 +O3,2900,0.11620340E+03 +Ofast,2900,0.12442431E+03 +O1,3000,0.12441803E+03 +O2,3000,0.10697283E+03 +O3,3000,0.13147382E+03 +Ofast,3000,0.14033719E+03 +O1,3100,0.14058953E+03 +O2,3100,0.12264525E+03 +O3,3100,0.14999620E+03 +Ofast,3100,0.15929938E+03 +O1,3200,0.17324665E+03 +O2,3200,0.15985753E+03 +O3,3200,0.18354226E+03 +Ofast,3200,0.20479539E+03 +O1,3300,0.17757750E+03 +O2,3300,0.15501507E+03 +O3,3300,0.18601760E+03 +Ofast,3300,0.19725137E+03 +O1,3400,0.19650695E+03 +O2,3400,0.17226114E+03 +O3,3400,0.20476938E+03 +Ofast,3400,0.21640871E+03 +O1,3500,0.21871626E+03 +O2,3500,0.19217208E+03 +O3,3500,0.22834303E+03 +Ofast,3500,0.24214705E+03 diff --git a/report/figures/gfortran_rowloop_optflags.csv b/report/figures/gfortran_rowloop_optflags.csv new file mode 100644 index 0000000..c2ce3b5 --- /dev/null +++ b/report/figures/gfortran_rowloop_optflags.csv @@ -0,0 +1,35 @@ +100,0.15843390E-02,0.91776000E-03,0.83196300E-03,0.30917400E-03 +200,0.15226468E-01,0.88798160E-02,0.84310250E-02,0.35476020E-02 +300,0.50955954E-01,0.31395742E-01,0.30393838E-01,0.12742578E-01 +400,0.12773344E+00,0.78643620E-01,0.75706575E-01,0.42815258E-01 +500,0.24604570E+00,0.15303675E+00,0.14779813E+00,0.61111429E-01 +600,0.43114100E+00,0.25507298E+00,0.25050676E+00,0.10847798E+00 +700,0.69199010E+00,0.40859331E+00,0.40370530E+00,0.20581741E+00 +800,0.10717053E+01,0.63825526E+00,0.62435679E+00,0.52888689E+00 +900,0.15404577E+01,0.93850974E+00,0.92557958E+00,0.54681181E+00 +1000,0.27305068E+01,0.13441181E+01,0.12971958E+01,0.78722030E+00 +1100,0.36062488E+01,0.17628016E+01,0.17403942E+01,0.10706449E+01 +1200,0.46450021E+01,0.23031509E+01,0.22731768E+01,0.14552126E+01 +1300,0.59029006E+01,0.29607831E+01,0.29280082E+01,0.19152277E+01 +1400,0.74960709E+01,0.36552327E+01,0.35930989E+01,0.22676895E+01 
+1500,0.93026917E+01,0.45110176E+01,0.44426296E+01,0.28225538E+01 +1600,0.11342043E+02,0.55577301E+01,0.54982263E+01,0.44651484E+01 +1700,0.13274264E+02,0.69197675E+01,0.68705292E+01,0.55033843E+01 +1800,0.15669101E+02,0.84757305E+01,0.85638411E+01,0.82615895E+01 +1900,0.18839968E+02,0.97958641E+01,0.97956918E+01,0.83408876E+01 +2000,0.23471672E+02,0.17688268E+02,0.19977299E+02,0.20366439E+02 +2100,0.25537293E+02,0.18367017E+02,0.21728356E+02,0.24215233E+02 +2200,0.30945931E+02,0.25050362E+02,0.30368333E+02,0.33078015E+02 +2300,0.37129506E+02,0.33096253E+02,0.38040478E+02,0.42665518E+02 +2400,0.46662185E+02,0.42657981E+02,0.49238694E+02,0.54617642E+02 +2500,0.56352622E+02,0.50056533E+02,0.60229746E+02,0.66109200E+02 +2600,0.68959785E+02,0.59790048E+02,0.72275943E+02,0.79140537E+02 +2700,0.81912480E+02,0.71778559E+02,0.88066671E+02,0.93871874E+02 +2800,0.95063966E+02,0.84949950E+02,0.10227876E+03,0.11033462E+03 +2900,0.11009257E+03,0.95040378E+02,0.11620340E+03,0.12442431E+03 +3000,0.12441803E+03,0.10697283E+03,0.13147382E+03,0.14033719E+03 +3100,0.14058953E+03,0.12264525E+03,0.14999620E+03,0.15929938E+03 +3200,0.17324665E+03,0.15985753E+03,0.18354226E+03,0.20479539E+03 +3300,0.17757750E+03,0.15501507E+03,0.18601760E+03,0.19725137E+03 +3400,0.19650695E+03,0.17226114E+03,0.20476938E+03,0.21640871E+03 +3500,0.21871626E+03,0.19217208E+03,0.22834303E+03,0.24214705E+03 diff --git a/report/figures/gfortran_serial_perflags.csv b/report/figures/gfortran_serial_perflags.csv new file mode 100644 index 0000000..9d33af7 --- /dev/null +++ b/report/figures/gfortran_serial_perflags.csv @@ -0,0 +1,141 @@ +,,,,rowloop,,, +gfortran,O1,serial,100,0.00,0.00,0.00,0.00 +gfortran,O1,serial,200,0.02,0.01,0.00,0.00 +gfortran,O1,serial,300,0.05,0.05,0.00,0.00 +gfortran,O1,serial,400,0.13,0.13,0.00,0.00 +gfortran,O1,serial,500,0.25,0.24,0.00,0.00 +gfortran,O1,serial,600,0.43,0.43,0.01,0.01 +gfortran,O1,serial,700,0.69,0.75,0.01,0.01 +gfortran,O1,serial,800,1.07,1.09,0.02,0.02 
+gfortran,O1,serial,900,1.54,1.64,0.03,0.03 +gfortran,O1,serial,1000,2.73,2.71,0.04,0.04 +gfortran,O1,serial,1100,3.61,3.65,0.05,0.05 +gfortran,O1,serial,1200,4.65,4.79,0.07,0.07 +gfortran,O1,serial,1300,5.90,6.18,0.08,0.09 +gfortran,O1,serial,1400,7.50,7.85,0.11,0.11 +gfortran,O1,serial,1500,9.30,9.86,0.13,0.14 +gfortran,O1,serial,1600,11.34,12.61,0.16,0.17 +gfortran,O1,serial,1700,13.27,14.33,0.19,0.20 +gfortran,O1,serial,1800,15.67,17.25,0.23,0.25 +gfortran,O1,serial,1900,18.84,20.42,0.28,0.30 +gfortran,O1,serial,2000,23.47,25.75,0.32,0.34 +gfortran,O1,serial,2100,25.54,27.92,0.38,0.40 +gfortran,O1,serial,2200,30.95,33.21,0.43,0.46 +gfortran,O1,serial,2300,37.13,37.82,0.51,0.54 +gfortran,O1,serial,2400,46.66,49.52,0.57,0.60 +gfortran,O1,serial,2500,56.35,56.58,0.64,0.68 +gfortran,O1,serial,2600,68.96,70.45,0.74,0.77 +gfortran,O1,serial,2700,81.91,81.13,0.84,0.93 +gfortran,O1,serial,2800,95.06,100.52,0.91,0.95 +gfortran,O1,serial,2900,110.09,107.58,1.02,1.06 +gfortran,O1,serial,3000,124.42,127.72,1.13,1.17 +gfortran,O1,serial,3100,140.59,138.38,1.25,1.30 +gfortran,O1,serial,3200,173.25,186.00,1.43,1.45 +gfortran,O1,serial,3300,177.58,172.30,1.53,1.59 +gfortran,O1,serial,3400,196.51,202.47,1.71,1.75 +gfortran,O1,serial,3500,218.72,212.36,1.82,1.88 +gfortran,O2,serial,100,0.00,0.00,0.00,0.00 +gfortran,O2,serial,200,0.01,0.01,0.00,0.00 +gfortran,O2,serial,300,0.03,0.03,0.00,0.00 +gfortran,O2,serial,400,0.08,0.07,0.00,0.00 +gfortran,O2,serial,500,0.15,0.14,0.01,0.00 +gfortran,O2,serial,600,0.26,0.25,0.01,0.01 +gfortran,O2,serial,700,0.41,0.40,0.01,0.01 +gfortran,O2,serial,800,0.64,0.70,0.02,0.02 +gfortran,O2,serial,900,0.94,0.97,0.03,0.03 +gfortran,O2,serial,1000,1.34,1.33,0.04,0.04 +gfortran,O2,serial,1100,1.76,1.97,0.05,0.05 +gfortran,O2,serial,1200,2.30,2.67,0.07,0.07 +gfortran,O2,serial,1300,2.96,3.44,0.09,0.09 +gfortran,O2,serial,1400,3.66,4.14,0.11,0.11 +gfortran,O2,serial,1500,4.51,5.49,0.13,0.14 +gfortran,O2,serial,1600,5.56,7.94,0.18,0.18 
+gfortran,O2,serial,1700,6.92,8.84,0.21,0.22 +gfortran,O2,serial,1800,8.48,9.99,0.25,0.26 +gfortran,O2,serial,1900,9.80,12.54,0.29,0.30 +gfortran,O2,serial,2000,17.69,20.82,0.32,0.34 +gfortran,O2,serial,2100,18.37,20.93,0.37,0.40 +gfortran,O2,serial,2200,25.05,27.80,0.43,0.47 +gfortran,O2,serial,2300,33.10,33.80,0.50,0.54 +gfortran,O2,serial,2400,42.66,45.89,0.55,0.60 +gfortran,O2,serial,2500,50.06,51.56,0.63,0.68 +gfortran,O2,serial,2600,59.79,62.89,0.71,0.76 +gfortran,O2,serial,2700,71.78,72.21,0.80,0.86 +gfortran,O2,serial,2800,84.95,90.52,0.91,0.98 +gfortran,O2,serial,2900,95.04,95.72,1.02,1.10 +gfortran,O2,serial,3000,106.97,111.61,1.10,1.17 +gfortran,O2,serial,3100,122.65,122.44,1.26,1.32 +gfortran,O2,serial,3200,159.86,173.04,1.38,1.41 +gfortran,O2,serial,3300,155.02,154.27,1.53,1.59 +gfortran,O2,serial,3400,172.26,178.85,1.68,1.75 +gfortran,O2,serial,3500,192.17,190.19,1.84,1.91 +gfortran,O3,serial,100,0.00,0.00,0.00,0.00 +gfortran,O3,serial,200,0.01,0.01,0.00,0.00 +gfortran,O3,serial,300,0.03,0.03,0.00,0.00 +gfortran,O3,serial,400,0.08,0.07,0.00,0.00 +gfortran,O3,serial,500,0.15,0.14,0.01,0.00 +gfortran,O3,serial,600,0.25,0.24,0.01,0.01 +gfortran,O3,serial,700,0.40,0.39,0.01,0.01 +gfortran,O3,serial,800,0.62,0.69,0.02,0.02 +gfortran,O3,serial,900,0.93,0.98,0.03,0.03 +gfortran,O3,serial,1000,1.30,1.35,0.04,0.04 +gfortran,O3,serial,1100,1.74,1.93,0.05,0.05 +gfortran,O3,serial,1200,2.27,2.67,0.07,0.07 +gfortran,O3,serial,1300,2.93,3.39,0.09,0.09 +gfortran,O3,serial,1400,3.59,4.11,0.11,0.11 +gfortran,O3,serial,1500,4.44,5.35,0.14,0.14 +gfortran,O3,serial,1600,5.50,7.91,0.18,0.18 +gfortran,O3,serial,1700,6.87,8.57,0.21,0.21 +gfortran,O3,serial,1800,8.56,10.26,0.25,0.26 +gfortran,O3,serial,1900,9.80,12.50,0.29,0.30 +gfortran,O3,serial,2000,19.98,22.95,0.32,0.34 +gfortran,O3,serial,2100,21.73,24.10,0.38,0.40 +gfortran,O3,serial,2200,30.37,31.72,0.43,0.45 +gfortran,O3,serial,2300,38.04,39.32,0.50,0.53 +gfortran,O3,serial,2400,49.24,53.58,0.57,0.60 
+gfortran,O3,serial,2500,60.23,60.31,0.65,0.69 +gfortran,O3,serial,2600,72.28,75.70,0.72,0.76 +gfortran,O3,serial,2700,88.07,85.56,0.82,0.86 +gfortran,O3,serial,2800,102.28,106.37,0.90,0.95 +gfortran,O3,serial,2900,116.20,112.44,1.01,1.06 +gfortran,O3,serial,3000,131.47,133.69,1.11,1.17 +gfortran,O3,serial,3100,150.00,144.15,1.28,1.33 +gfortran,O3,serial,3200,183.54,196.12,1.43,1.46 +gfortran,O3,serial,3300,186.02,180.77,1.54,1.60 +gfortran,O3,serial,3400,204.77,213.00,1.65,1.70 +gfortran,O3,serial,3500,228.34,222.86,1.87,1.92 +gfortran,Ofast,serial,100,0.00,0.00,0.00,0.00 +gfortran,Ofast,serial,200,0.00,0.00,0.00,0.00 +gfortran,Ofast,serial,300,0.01,0.01,0.00,0.00 +gfortran,Ofast,serial,400,0.04,0.04,0.00,0.00 +gfortran,Ofast,serial,500,0.06,0.07,0.01,0.01 +gfortran,Ofast,serial,600,0.11,0.12,0.01,0.01 +gfortran,Ofast,serial,700,0.21,0.22,0.01,0.01 +gfortran,Ofast,serial,800,0.53,0.61,0.02,0.02 +gfortran,Ofast,serial,900,0.55,0.62,0.03,0.03 +gfortran,Ofast,serial,1000,0.79,0.87,0.04,0.04 +gfortran,Ofast,serial,1100,1.07,1.29,0.06,0.06 +gfortran,Ofast,serial,1200,1.46,2.03,0.08,0.08 +gfortran,Ofast,serial,1300,1.92,2.48,0.10,0.10 +gfortran,Ofast,serial,1400,2.27,2.94,0.13,0.13 +gfortran,Ofast,serial,1500,2.82,3.92,0.16,0.16 +gfortran,Ofast,serial,1600,4.47,7.26,0.18,0.18 +gfortran,Ofast,serial,1700,5.50,7.21,0.22,0.22 +gfortran,Ofast,serial,1800,8.26,9.90,0.25,0.25 +gfortran,Ofast,serial,1900,8.34,10.84,0.30,0.30 +gfortran,Ofast,serial,2000,20.37,24.08,0.33,0.35 +gfortran,Ofast,serial,2100,24.22,24.76,0.38,0.40 +gfortran,Ofast,serial,2200,33.08,34.51,0.45,0.47 +gfortran,Ofast,serial,2300,42.67,41.87,0.50,0.53 +gfortran,Ofast,serial,2400,54.62,57.49,0.56,0.60 +gfortran,Ofast,serial,2500,66.11,64.53,0.65,0.69 +gfortran,Ofast,serial,2600,79.14,79.93,0.74,0.79 +gfortran,Ofast,serial,2700,93.87,93.81,0.81,0.86 +gfortran,Ofast,serial,2800,110.33,114.95,0.91,0.95 +gfortran,Ofast,serial,2900,124.42,124.24,1.02,1.07 +gfortran,Ofast,serial,3000,140.34,144.50,1.15,1.20 
+gfortran,Ofast,serial,3100,159.30,158.88,1.25,1.31 +gfortran,Ofast,serial,3200,204.80,211.06,1.42,1.45 +gfortran,Ofast,serial,3300,197.25,197.69,1.57,1.61 +gfortran,Ofast,serial,3400,216.41,225.48,1.66,1.70 +gfortran,Ofast,serial,3500,242.15,244.41,1.81,1.87 diff --git a/report/figures/ifx_rowloop_opt.csv b/report/figures/ifx_rowloop_opt.csv new file mode 100644 index 0000000..a30edb3 --- /dev/null +++ b/report/figures/ifx_rowloop_opt.csv @@ -0,0 +1,141 @@ +opt,size,matmul +O1,100,0.87400000E-03 +O1,200,0.85290000E-02 +O1,300,0.31776000E-01 +O1,400,0.76352000E-01 +O1,500,0.14845400E+00 +O1,600,0.25019100E+00 +O1,700,0.41009400E+00 +O1,800,0.63952200E+00 +O1,900,0.93205100E+00 +O1,1000,0.13031930E+01 +O1,1100,0.17408600E+01 +O1,1200,0.22755160E+01 +O1,1300,0.29508160E+01 +O1,1400,0.36393460E+01 +O1,1500,0.44860030E+01 +O1,1600,0.54553380E+01 +O1,1700,0.66324260E+01 +O1,1800,0.83380020E+01 +O1,1900,0.94449070E+01 +O1,2000,0.16506140E+02 +O1,2100,0.19062231E+02 +O1,2200,0.26409338E+02 +O1,2300,0.32798385E+02 +O1,2400,0.42770344E+02 +O1,2500,0.51294565E+02 +O1,2600,0.61256019E+02 +O1,2700,0.72455728E+02 +O1,2800,0.85004594E+02 +O1,2900,0.96607561E+02 +O1,3000,0.10970506E+03 +O1,3100,0.12403605E+03 +O1,3200,0.16208840E+03 +O1,3300,0.15700769E+03 +O1,3400,0.17293530E+03 +O1,3500,0.19277203E+03 +O2,100,0.69000000E-04 +O2,200,0.46400000E-03 +O2,300,0.14940000E-02 +O2,400,0.36100000E-02 +O2,500,0.73180000E-02 +O2,600,0.11930000E-01 +O2,700,0.18818000E-01 +O2,800,0.28678000E-01 +O2,900,0.41686000E-01 +O2,1000,0.58162000E-01 +O2,1100,0.80023000E-01 +O2,1200,0.10370700E+00 +O2,1300,0.22824500E+00 +O2,1400,0.16092100E+00 +O2,1500,0.19796700E+00 +O2,1600,0.24094500E+00 +O2,1700,0.34717000E+00 +O2,1800,0.34645400E+00 +O2,1900,0.42644300E+00 +O2,2000,0.49293000E+00 +O2,2100,0.54097800E+00 +O2,2200,0.83217700E+00 +O2,2300,0.80164600E+00 +O2,2400,0.80474400E+00 +O2,2500,0.91444900E+00 +O2,2600,0.10868780E+01 +O2,2700,0.11443750E+01 +O2,2800,0.14138060E+01 +O2,2900,0.15019830E+01 
+O2,3000,0.15233760E+01 +O2,3100,0.16917410E+01 +O2,3200,0.19101330E+01 +O2,3300,0.20891040E+01 +O2,3400,0.22203300E+01 +O2,3500,0.24048120E+01 +O3,100,0.58000000E-04 +O3,200,0.44300000E-03 +O3,300,0.14680000E-02 +O3,400,0.36640000E-02 +O3,500,0.71830000E-02 +O3,600,0.11946000E-01 +O3,700,0.18771000E-01 +O3,800,0.29006000E-01 +O3,900,0.41680000E-01 +O3,1000,0.66717000E-01 +O3,1100,0.77178000E-01 +O3,1200,0.10297700E+00 +O3,1300,0.16374000E+00 +O3,1400,0.16045300E+00 +O3,1500,0.20290800E+00 +O3,1600,0.23383900E+00 +O3,1700,0.28733400E+00 +O3,1800,0.34376400E+00 +O3,1900,0.40683300E+00 +O3,2000,0.48620900E+00 +O3,2100,0.53323000E+00 +O3,2200,0.60910100E+00 +O3,2300,0.73816700E+00 +O3,2400,0.85756900E+00 +O3,2500,0.11705600E+01 +O3,2600,0.10060130E+01 +O3,2700,0.11340300E+01 +O3,2800,0.12724890E+01 +O3,2900,0.15094350E+01 +O3,3000,0.15846610E+01 +O3,3100,0.17252340E+01 +O3,3200,0.19596070E+01 +O3,3300,0.21563500E+01 +O3,3400,0.23250370E+01 +O3,3500,0.25408590E+01 +Ofast,100,0.56000000E-04 +Ofast,200,0.45200000E-03 +Ofast,300,0.14910000E-02 +Ofast,400,0.35090000E-02 +Ofast,500,0.70130000E-02 +Ofast,600,0.11894000E-01 +Ofast,700,0.20238000E-01 +Ofast,800,0.29047000E-01 +Ofast,900,0.41890000E-01 +Ofast,1000,0.60054000E-01 +Ofast,1100,0.77388000E-01 +Ofast,1200,0.10083800E+00 +Ofast,1300,0.12631200E+00 +Ofast,1400,0.15809900E+00 +Ofast,1500,0.19154500E+00 +Ofast,1600,0.23460400E+00 +Ofast,1700,0.27811300E+00 +Ofast,1800,0.33408400E+00 +Ofast,1900,0.38401600E+00 +Ofast,2000,0.45196200E+00 +Ofast,2100,0.81503500E+00 +Ofast,2200,0.60132200E+00 +Ofast,2300,0.14056800E+01 +Ofast,2400,0.79103900E+00 +Ofast,2500,0.89177100E+00 +Ofast,2600,0.10486280E+01 +Ofast,2700,0.11373380E+01 +Ofast,2800,0.12624200E+01 +Ofast,2900,0.14467200E+01 +Ofast,3000,0.15409600E+01 +Ofast,3100,0.17920540E+01 +Ofast,3200,0.19401520E+01 +Ofast,3300,0.20774270E+01 +Ofast,3400,0.23692760E+01 +Ofast,3500,0.24388450E+01 diff --git a/report/figures/ifx_rowloop_optflags.csv 
b/report/figures/ifx_rowloop_optflags.csv new file mode 100644 index 0000000..a43eafe --- /dev/null +++ b/report/figures/ifx_rowloop_optflags.csv @@ -0,0 +1,35 @@ +100,0.87400000E-03,0.69000000E-04,0.58000000E-04,0.56000000E-04 +200,0.85290000E-02,0.46400000E-03,0.44300000E-03,0.45200000E-03 +300,0.31776000E-01,0.14940000E-02,0.14680000E-02,0.14910000E-02 +400,0.76352000E-01,0.36100000E-02,0.36640000E-02,0.35090000E-02 +500,0.14845400E+00,0.73180000E-02,0.71830000E-02,0.70130000E-02 +600,0.25019100E+00,0.11930000E-01,0.11946000E-01,0.11894000E-01 +700,0.41009400E+00,0.18818000E-01,0.18771000E-01,0.20238000E-01 +800,0.63952200E+00,0.28678000E-01,0.29006000E-01,0.29047000E-01 +900,0.93205100E+00,0.41686000E-01,0.41680000E-01,0.41890000E-01 +1000,0.13031930E+01,0.58162000E-01,0.66717000E-01,0.60054000E-01 +1100,0.17408600E+01,0.80023000E-01,0.77178000E-01,0.77388000E-01 +1200,0.22755160E+01,0.10370700E+00,0.10297700E+00,0.10083800E+00 +1300,0.29508160E+01,0.22824500E+00,0.16374000E+00,0.12631200E+00 +1400,0.36393460E+01,0.16092100E+00,0.16045300E+00,0.15809900E+00 +1500,0.44860030E+01,0.19796700E+00,0.20290800E+00,0.19154500E+00 +1600,0.54553380E+01,0.24094500E+00,0.23383900E+00,0.23460400E+00 +1700,0.66324260E+01,0.34717000E+00,0.28733400E+00,0.27811300E+00 +1800,0.83380020E+01,0.34645400E+00,0.34376400E+00,0.33408400E+00 +1900,0.94449070E+01,0.42644300E+00,0.40683300E+00,0.38401600E+00 +2000,0.16506140E+02,0.49293000E+00,0.48620900E+00,0.45196200E+00 +2100,0.19062231E+02,0.54097800E+00,0.53323000E+00,0.81503500E+00 +2200,0.26409338E+02,0.83217700E+00,0.60910100E+00,0.60132200E+00 +2300,0.32798385E+02,0.80164600E+00,0.73816700E+00,0.14056800E+01 +2400,0.42770344E+02,0.80474400E+00,0.85756900E+00,0.79103900E+00 +2500,0.51294565E+02,0.91444900E+00,0.11705600E+01,0.89177100E+00 +2600,0.61256019E+02,0.10868780E+01,0.10060130E+01,0.10486280E+01 +2700,0.72455728E+02,0.11443750E+01,0.11340300E+01,0.11373380E+01 
+2800,0.85004594E+02,0.14138060E+01,0.12724890E+01,0.12624200E+01 +2900,0.96607561E+02,0.15019830E+01,0.15094350E+01,0.14467200E+01 +3000,0.10970506E+03,0.15233760E+01,0.15846610E+01,0.15409600E+01 +3100,0.12403605E+03,0.16917410E+01,0.17252340E+01,0.17920540E+01 +3200,0.16208840E+03,0.19101330E+01,0.19596070E+01,0.19401520E+01 +3300,0.15700769E+03,0.20891040E+01,0.21563500E+01,0.20774270E+01 +3400,0.17293530E+03,0.22203300E+01,0.23250370E+01,0.23692760E+01 +3500,0.19277203E+03,0.24048120E+01,0.25408590E+01,0.24388450E+01 diff --git a/report/figures/ifx_serial_perflags.csv b/report/figures/ifx_serial_perflags.csv new file mode 100644 index 0000000..45af162 --- /dev/null +++ b/report/figures/ifx_serial_perflags.csv @@ -0,0 +1,141 @@ +,,,,rowloop,,, +ifx,O1,serial,100,0.00,0.00,0.00,0.01 +ifx,O1,serial,200,0.01,0.01,0.01,0.00 +ifx,O1,serial,300,0.03,0.03,0.02,0.00 +ifx,O1,serial,400,0.08,0.07,0.04,0.00 +ifx,O1,serial,500,0.15,0.14,0.08,0.01 +ifx,O1,serial,600,0.25,0.25,0.13,0.01 +ifx,O1,serial,700,0.41,0.40,0.21,0.01 +ifx,O1,serial,800,0.64,0.68,0.32,0.02 +ifx,O1,serial,900,0.93,0.95,0.51,0.03 +ifx,O1,serial,1000,1.30,1.32,0.76,0.04 +ifx,O1,serial,1100,1.74,1.86,1.15,0.06 +ifx,O1,serial,1200,2.28,2.65,1.44,0.07 +ifx,O1,serial,1300,2.95,3.32,1.91,0.09 +ifx,O1,serial,1400,3.64,4.03,2.41,0.12 +ifx,O1,serial,1500,4.49,5.22,2.98,0.14 +ifx,O1,serial,1600,5.46,7.88,3.59,0.17 +ifx,O1,serial,1700,6.63,8.11,4.32,0.21 +ifx,O1,serial,1800,8.34,9.64,5.11,0.25 +ifx,O1,serial,1900,9.44,11.79,6.07,0.29 +ifx,O1,serial,2000,16.51,19.91,7.06,0.34 +ifx,O1,serial,2100,19.06,20.83,8.15,0.39 +ifx,O1,serial,2200,26.41,28.43,9.40,0.45 +ifx,O1,serial,2300,32.80,34.34,10.80,0.52 +ifx,O1,serial,2400,42.77,47.20,12.22,0.60 +ifx,O1,serial,2500,51.29,51.70,13.87,0.68 +ifx,O1,serial,2600,61.26,63.91,15.54,0.75 +ifx,O1,serial,2700,72.46,73.90,17.32,0.84 +ifx,O1,serial,2800,85.00,91.17,19.15,0.94 +ifx,O1,serial,2900,96.61,96.74,21.26,1.04 +ifx,O1,serial,3000,109.71,113.47,23.53,1.14 
+ifx,O1,serial,3100,124.04,123.18,26.10,1.30 +ifx,O1,serial,3200,162.09,177.53,28.64,1.44 +ifx,O1,serial,3300,157.01,154.57,31.45,1.53 +ifx,O1,serial,3400,172.94,178.52,37.46,1.70 +ifx,O1,serial,3500,192.77,189.33,38.28,1.85 +ifx,O2,serial,100,0.00,0.00,0.00,0.00 +ifx,O2,serial,200,0.00,0.00,0.00,0.00 +ifx,O2,serial,300,0.00,0.00,0.00,0.00 +ifx,O2,serial,400,0.00,0.00,0.00,0.00 +ifx,O2,serial,500,0.01,0.02,0.01,0.01 +ifx,O2,serial,600,0.01,0.01,0.01,0.01 +ifx,O2,serial,700,0.02,0.02,0.02,0.02 +ifx,O2,serial,800,0.03,0.03,0.03,0.02 +ifx,O2,serial,900,0.04,0.04,0.05,0.04 +ifx,O2,serial,1000,0.06,0.06,0.07,0.05 +ifx,O2,serial,1100,0.08,0.08,0.09,0.06 +ifx,O2,serial,1200,0.10,0.10,0.11,0.08 +ifx,O2,serial,1300,0.23,0.13,0.14,0.10 +ifx,O2,serial,1400,0.16,0.17,0.19,0.13 +ifx,O2,serial,1500,0.20,0.20,0.22,0.16 +ifx,O2,serial,1600,0.24,0.25,0.27,0.19 +ifx,O2,serial,1700,0.35,0.37,0.31,0.23 +ifx,O2,serial,1800,0.35,0.36,0.38,0.27 +ifx,O2,serial,1900,0.43,0.57,0.42,0.32 +ifx,O2,serial,2000,0.49,0.49,0.51,0.38 +ifx,O2,serial,2100,0.54,0.56,0.59,0.44 +ifx,O2,serial,2200,0.83,0.97,0.66,0.50 +ifx,O2,serial,2300,0.80,0.75,0.82,0.56 +ifx,O2,serial,2400,0.80,0.84,0.87,0.64 +ifx,O2,serial,2500,0.91,0.96,1.51,0.70 +ifx,O2,serial,2600,1.09,1.82,1.13,0.80 +ifx,O2,serial,2700,1.14,1.19,1.22,0.89 +ifx,O2,serial,2800,1.41,1.37,1.33,0.99 +ifx,O2,serial,2900,1.50,1.48,1.50,1.08 +ifx,O2,serial,3000,1.52,1.57,1.60,1.18 +ifx,O2,serial,3100,1.69,1.75,1.77,1.30 +ifx,O2,serial,3200,1.91,1.97,2.10,1.43 +ifx,O2,serial,3300,2.09,2.10,2.12,1.54 +ifx,O2,serial,3400,2.22,2.28,2.31,1.68 +ifx,O2,serial,3500,2.40,2.47,2.49,1.84 +ifx,O3,serial,100,0.00,0.00,0.00,0.00 +ifx,O3,serial,200,0.00,0.00,0.00,0.00 +ifx,O3,serial,300,0.00,0.00,0.00,0.00 +ifx,O3,serial,400,0.00,0.01,0.00,0.00 +ifx,O3,serial,500,0.01,0.01,0.01,0.01 +ifx,O3,serial,600,0.01,0.01,0.01,0.01 +ifx,O3,serial,700,0.02,0.02,0.02,0.02 +ifx,O3,serial,800,0.03,0.03,0.03,0.02 +ifx,O3,serial,900,0.04,0.04,0.05,0.04 
+ifx,O3,serial,1000,0.07,0.06,0.06,0.05 +ifx,O3,serial,1100,0.08,0.08,0.08,0.06 +ifx,O3,serial,1200,0.10,0.10,0.11,0.08 +ifx,O3,serial,1300,0.16,0.20,0.14,0.10 +ifx,O3,serial,1400,0.16,0.16,0.17,0.13 +ifx,O3,serial,1500,0.20,0.53,0.36,0.15 +ifx,O3,serial,1600,0.23,0.25,0.26,0.19 +ifx,O3,serial,1700,0.29,0.30,0.34,0.23 +ifx,O3,serial,1800,0.34,0.36,0.37,0.27 +ifx,O3,serial,1900,0.41,0.53,0.92,0.30 +ifx,O3,serial,2000,0.49,0.48,0.50,0.37 +ifx,O3,serial,2100,0.53,0.58,0.57,0.43 +ifx,O3,serial,2200,0.61,0.64,0.67,0.49 +ifx,O3,serial,2300,0.74,0.74,0.78,0.56 +ifx,O3,serial,2400,0.86,1.09,0.88,0.63 +ifx,O3,serial,2500,1.17,1.04,0.96,0.71 +ifx,O3,serial,2600,1.01,1.05,1.06,0.79 +ifx,O3,serial,2700,1.13,1.20,1.29,0.90 +ifx,O3,serial,2800,1.27,1.32,1.40,0.99 +ifx,O3,serial,2900,1.51,1.66,1.54,1.09 +ifx,O3,serial,3000,1.58,1.63,1.63,1.20 +ifx,O3,serial,3100,1.73,1.79,1.90,1.33 +ifx,O3,serial,3200,1.96,2.05,2.05,1.45 +ifx,O3,serial,3300,2.16,2.48,2.20,1.59 +ifx,O3,serial,3400,2.33,2.38,2.40,1.73 +ifx,O3,serial,3500,2.54,2.60,2.61,1.91 +ifx,Ofast,serial,100,0.00,0.00,0.00,0.00 +ifx,Ofast,serial,200,0.00,0.00,0.00,0.00 +ifx,Ofast,serial,300,0.00,0.00,0.00,0.00 +ifx,Ofast,serial,400,0.00,0.00,0.00,0.00 +ifx,Ofast,serial,500,0.01,0.01,0.01,0.01 +ifx,Ofast,serial,600,0.01,0.01,0.01,0.01 +ifx,Ofast,serial,700,0.02,0.02,0.02,0.02 +ifx,Ofast,serial,800,0.03,0.03,0.03,0.03 +ifx,Ofast,serial,900,0.04,0.04,0.05,0.03 +ifx,Ofast,serial,1000,0.06,0.06,0.06,0.05 +ifx,Ofast,serial,1100,0.08,0.08,0.09,0.06 +ifx,Ofast,serial,1200,0.10,0.10,0.11,0.08 +ifx,Ofast,serial,1300,0.13,0.13,0.13,0.10 +ifx,Ofast,serial,1400,0.16,0.16,0.17,0.13 +ifx,Ofast,serial,1500,0.19,0.19,0.21,0.16 +ifx,Ofast,serial,1600,0.23,0.24,0.25,0.19 +ifx,Ofast,serial,1700,0.28,0.28,0.30,0.23 +ifx,Ofast,serial,1800,0.33,0.34,0.36,0.27 +ifx,Ofast,serial,1900,0.38,0.40,0.41,0.32 +ifx,Ofast,serial,2000,0.45,0.49,0.53,0.37 +ifx,Ofast,serial,2100,0.82,0.54,0.56,0.42 +ifx,Ofast,serial,2200,0.60,0.63,0.65,0.49 
+ifx,Ofast,serial,2300,1.41,0.71,0.75,0.55 +ifx,Ofast,serial,2400,0.79,0.83,0.85,0.63 +ifx,Ofast,serial,2500,0.89,0.93,0.96,0.71 +ifx,Ofast,serial,2600,1.05,1.93,1.13,0.79 +ifx,Ofast,serial,2700,1.14,1.19,1.21,0.89 +ifx,Ofast,serial,2800,1.26,1.31,1.33,0.99 +ifx,Ofast,serial,2900,1.45,1.50,1.58,1.09 +ifx,Ofast,serial,3000,1.54,1.60,1.62,1.19 +ifx,Ofast,serial,3100,1.79,1.77,1.79,1.32 +ifx,Ofast,serial,3200,1.94,2.02,2.23,1.44 +ifx,Ofast,serial,3300,2.08,2.13,2.19,1.56 +ifx,Ofast,serial,3400,2.37,2.30,2.49,1.70 +ifx,Ofast,serial,3500,2.44,2.49,2.51,1.86 diff --git a/report/figures/ifx_vs_gfortran_O3_serial_results.csv b/report/figures/ifx_vs_gfortran_O3_serial_results.csv new file mode 100644 index 0000000..8271650 --- /dev/null +++ b/report/figures/ifx_vs_gfortran_O3_serial_results.csv @@ -0,0 +1,106 @@ +gfortran,100,0.83196300E-03,0.82436000E-03,0.82171000E-04,0.40903000E-04 +gfortran,200,0.84310250E-02,0.81942280E-02,0.52900100E-03,0.35716000E-03 +gfortran,300,0.30393838E-01,0.29753641E-01,0.13883800E-02,0.11548400E-02 +gfortran,400,0.75706575E-01,0.72053057E-01,0.26542930E-02,0.26334740E-02 +gfortran,500,0.14779813E+00,0.13896792E+00,0.50301090E-02,0.48926140E-02 +gfortran,600,0.25050676E+00,0.23771815E+00,0.86409790E-02,0.84664220E-02 +gfortran,700,0.40370530E+00,0.38789537E+00,0.13572686E-01,0.13392029E-01 +gfortran,800,0.62435679E+00,0.69020772E+00,0.20599722E-01,0.20583156E-01 +gfortran,900,0.92557958E+00,0.97868840E+00,0.29087199E-01,0.29092604E-01 +gfortran,1000,0.12971958E+01,0.13472624E+01,0.40578720E-01,0.40631869E-01 +gfortran,1100,0.17403942E+01,0.19294426E+01,0.53757086E-01,0.54524503E-01 +gfortran,1200,0.22731768E+01,0.26668477E+01,0.68460332E-01,0.69950589E-01 +gfortran,1300,0.29280082E+01,0.33949951E+01,0.88916825E-01,0.91294859E-01 +gfortran,1400,0.35930989E+01,0.41113147E+01,0.11034260E+00,0.11363157E+00 +gfortran,1500,0.44426296E+01,0.53547077E+01,0.13540845E+00,0.14067237E+00 
+gfortran,1600,0.54982263E+01,0.79132809E+01,0.17527097E+00,0.17639820E+00 +gfortran,1700,0.68705292E+01,0.85675598E+01,0.20611171E+00,0.21453854E+00 +gfortran,1800,0.85638411E+01,0.10256766E+02,0.24548081E+00,0.25602355E+00 +gfortran,1900,0.97956918E+01,0.12504037E+02,0.29145721E+00,0.29859006E+00 +gfortran,2000,0.19977299E+02,0.22947921E+02,0.31671464E+00,0.33806302E+00 +gfortran,2100,0.21728356E+02,0.24098549E+02,0.37766086E+00,0.40404478E+00 +gfortran,2200,0.30368333E+02,0.31722219E+02,0.42580020E+00,0.45154765E+00 +gfortran,2300,0.38040478E+02,0.39322543E+02,0.49845491E+00,0.52755086E+00 +gfortran,2400,0.49238694E+02,0.53578220E+02,0.57475876E+00,0.60260881E+00 +gfortran,2500,0.60229746E+02,0.60307600E+02,0.65482310E+00,0.69371856E+00 +gfortran,2600,0.72275943E+02,0.75698785E+02,0.72118898E+00,0.76456032E+00 +gfortran,2700,0.88066671E+02,0.85564199E+02,0.81734604E+00,0.86148218E+00 +gfortran,2800,0.10227876E+03,0.10637486E+03,0.89947522E+00,0.95027684E+00 +gfortran,2900,0.11620340E+03,0.11244430E+03,0.10111145E+01,0.10586032E+01 +gfortran,3000,0.13147382E+03,0.13369315E+03,0.11102709E+01,0.11684749E+01 +gfortran,3100,0.14999620E+03,0.14414675E+03,0.12802729E+01,0.13289489E+01 +gfortran,3200,0.18354226E+03,0.19611960E+03,0.14315322E+01,0.14602543E+01 +gfortran,3300,0.18601760E+03,0.18076827E+03,0.15415264E+01,0.15960495E+01 +gfortran,3400,0.20476938E+03,0.21299748E+03,0.16521923E+01,0.16990593E+01 +gfortran,3500,0.22834303E+03,0.22285553E+03,0.18681888E+01,0.19161202E+01 +gfortran,4000,-1.00000000E+00,-1.00000000E+00,0.28359602E+01,0.28575599E+01 +gfortran,4500,-1.00000000E+00,-1.00000000E+00,0.40505999E+01,0.40985922E+01 +gfortran,5000,-1.00000000E+00,-1.00000000E+00,0.55805927E+01,0.56317293E+01 +gfortran,5500,-1.00000000E+00,-1.00000000E+00,0.74133843E+01,0.74104958E+01 +gfortran,6000,-1.00000000E+00,-1.00000000E+00,0.95258379E+01,0.95492209E+01 +gfortran,6500,-1.00000000E+00,-1.00000000E+00,0.12021052E+02,0.12031542E+02 
+gfortran,7000,-1.00000000E+00,-1.00000000E+00,0.14963398E+02,0.15090944E+02 +gfortran,7500,-1.00000000E+00,-1.00000000E+00,0.18778133E+02,0.18914046E+02 +gfortran,8000,-1.00000000E+00,-1.00000000E+00,0.22653876E+02,0.22470571E+02 +gfortran,8500,-1.00000000E+00,-1.00000000E+00,0.26873721E+02,0.27407130E+02 +gfortran,9000,-1.00000000E+00,-1.00000000E+00,0.32200993E+02,0.31895406E+02 +gfortran,9500,-1.00000000E+00,-1.00000000E+00,0.37974351E+02,0.38280771E+02 +gfortran,10000,-1.00000000E+00,-1.00000000E+00,0.43953310E+02,0.44048979E+02 +gfortran,10500,-1.00000000E+00,-1.00000000E+00,0.51627049E+02,0.50738458E+02 +gfortran,11000,-1.00000000E+00,-1.00000000E+00,0.59155068E+02,0.58639799E+02 +gfortran,11500,-1.00000000E+00,-1.00000000E+00,0.67404317E+02,0.66714712E+02 +gfortran,12000,-1.00000000E+00,-1.00000000E+00,0.76974160E+02,0.75930372E+02 + + +ifx,100,0.58000000E-04,0.56000000E-04,0.90000000E-04,0.16070000E-02 +ifx,200,0.44300000E-03,0.42700000E-03,0.58000000E-03,0.65500000E-03 +ifx,300,0.14680000E-02,0.14470000E-02,0.18500000E-02,0.15920000E-02 +ifx,400,0.36640000E-02,0.50940000E-02,0.45920000E-02,0.29600000E-02 +ifx,500,0.71830000E-02,0.68410000E-02,0.80890000E-02,0.62120000E-02 +ifx,600,0.11946000E-01,0.11672000E-01,0.13309000E-01,0.10467000E-01 +ifx,700,0.18771000E-01,0.18607000E-01,0.20932000E-01,0.16487000E-01 +ifx,800,0.29006000E-01,0.28898000E-01,0.31436000E-01,0.24879000E-01 +ifx,900,0.41680000E-01,0.42791000E-01,0.46396000E-01,0.35810000E-01 +ifx,1000,0.66717000E-01,0.58368000E-01,0.61858000E-01,0.47731000E-01 +ifx,1100,0.77178000E-01,0.79497000E-01,0.84205000E-01,0.62863000E-01 +ifx,1200,0.10297700E+00,0.10426600E+00,0.10948500E+00,0.82169000E-01 +ifx,1300,0.16374000E+00,0.19606600E+00,0.13635600E+00,0.10359600E+00 +ifx,1400,0.16045300E+00,0.16332400E+00,0.17264000E+00,0.13045600E+00 +ifx,1500,0.20290800E+00,0.52553500E+00,0.36230500E+00,0.14967300E+00 +ifx,1600,0.23383900E+00,0.25316200E+00,0.25683400E+00,0.19188600E+00 
+ifx,1700,0.28733400E+00,0.30492900E+00,0.33555100E+00,0.22984600E+00 +ifx,1800,0.34376400E+00,0.36431600E+00,0.37293700E+00,0.27164500E+00 +ifx,1900,0.40683300E+00,0.53130200E+00,0.92085100E+00,0.30233300E+00 +ifx,2000,0.48620900E+00,0.48303600E+00,0.49906700E+00,0.37369900E+00 +ifx,2100,0.53323000E+00,0.57921900E+00,0.57168700E+00,0.43273500E+00 +ifx,2200,0.60910100E+00,0.64498000E+00,0.67022300E+00,0.49184600E+00 +ifx,2300,0.73816700E+00,0.74163200E+00,0.77880200E+00,0.55604000E+00 +ifx,2400,0.85756900E+00,0.10932640E+01,0.88045900E+00,0.63325300E+00 +ifx,2500,0.11705600E+01,0.10359310E+01,0.95508900E+00,0.71130200E+00 +ifx,2600,0.10060130E+01,0.10533570E+01,0.10641200E+01,0.79390000E+00 +ifx,2700,0.11340300E+01,0.12003210E+01,0.12853780E+01,0.89655500E+00 +ifx,2800,0.12724890E+01,0.13156040E+01,0.13962350E+01,0.99175300E+00 +ifx,2900,0.15094350E+01,0.16560390E+01,0.15350060E+01,0.10929730E+01 +ifx,3000,0.15846610E+01,0.16258430E+01,0.16260140E+01,0.12001770E+01 +ifx,3100,0.17252340E+01,0.17900380E+01,0.19004570E+01,0.13292810E+01 +ifx,3200,0.19596070E+01,0.20458520E+01,0.20495750E+01,0.14506500E+01 +ifx,3300,0.21563500E+01,0.24776340E+01,0.21986880E+01,0.15850810E+01 +ifx,3400,0.23250370E+01,0.23764170E+01,0.23972010E+01,0.17294670E+01 +ifx,3500,0.25408590E+01,0.25972350E+01,0.26123750E+01,0.19139550E+01 +ifx,4000,-1.00000000E+00,-1.00000000E+00,0.38908200E+01,0.27883030E+01 +ifx,4500,-1.00000000E+00,-1.00000000E+00,0.53457480E+01,0.39658190E+01 +ifx,5000,-1.00000000E+00,-1.00000000E+00,0.74345050E+01,0.53927840E+01 +ifx,5500,-1.00000000E+00,-1.00000000E+00,0.96502170E+01,0.70565910E+01 +ifx,6000,-1.00000000E+00,-1.00000000E+00,0.12845179E+02,0.91233900E+01 +ifx,6500,-1.00000000E+00,-1.00000000E+00,0.15827001E+02,0.11524623E+02 +ifx,7000,-1.00000000E+00,-1.00000000E+00,0.20801332E+02,0.15038738E+02 +ifx,7500,-1.00000000E+00,-1.00000000E+00,0.26094525E+02,0.18208950E+02 +ifx,8000,-1.00000000E+00,-1.00000000E+00,0.31587575E+02,0.22169725E+02 
+ifx,8500,-1.00000000E+00,-1.00000000E+00,0.37538095E+02,0.26493652E+02 +ifx,9000,-1.00000000E+00,-1.00000000E+00,0.44269599E+02,0.31840563E+02 +ifx,9500,-1.00000000E+00,-1.00000000E+00,0.52284059E+02,0.36582329E+02 +ifx,10000,-1.00000000E+00,-1.00000000E+00,0.61311028E+02,0.42846245E+02 +ifx,10500,-1.00000000E+00,-1.00000000E+00,0.72325632E+02,0.49676041E+02 +ifx,11000,-1.00000000E+00,-1.00000000E+00,0.83070796E+02,0.56988766E+02 +ifx,11500,-1.00000000E+00,-1.00000000E+00,0.93397373E+02,0.65669082E+02 +ifx,12000,-1.00000000E+00,-1.00000000E+00,0.10839523E+03,0.75117033E+02 diff --git a/report/figures/ifx_vs_gfortran_parallel_O3_results.csv b/report/figures/ifx_vs_gfortran_parallel_O3_results.csv new file mode 100644 index 0000000..11841df --- /dev/null +++ b/report/figures/ifx_vs_gfortran_parallel_O3_results.csv @@ -0,0 +1,106 @@ +gfortran,100,0.65345500E-02,0.59900040E-02,0.86181000E-04,0.42291000E-04 +gfortran,200,0.50174390E-02,0.59791200E-02,0.31170300E-03,0.13245500E-03 +gfortran,300,0.61210580E-02,0.44460850E-02,0.41295800E-03,0.33808100E-03 +gfortran,400,0.12667475E-01,0.13372949E-01,0.81521200E-03,0.77869500E-03 +gfortran,500,0.27877839E-01,0.26661508E-01,0.18042120E-02,0.16926660E-02 +gfortran,600,0.54333166E-01,0.55224388E-01,0.37276290E-02,0.35771950E-02 +gfortran,700,0.10559272E+00,0.12442592E+00,0.75477630E-02,0.73882030E-02 +gfortran,800,0.23475954E+00,0.25548130E+00,0.12989441E-01,0.12708304E-01 +gfortran,900,0.40482514E+00,0.39620421E+00,0.19103187E-01,0.19337220E-01 +gfortran,1000,0.92502131E+00,0.10805587E+01,0.19845650E-01,0.20756266E-01 +gfortran,1100,0.12325956E+01,0.13278188E+01,0.27864950E-01,0.28942730E-01 +gfortran,1200,0.17618679E+01,0.18503020E+01,0.32694492E-01,0.34112697E-01 +gfortran,1300,0.28281348E+01,0.31864547E+01,0.46746962E-01,0.45713662E-01 +gfortran,1400,0.32992088E+01,0.44739595E+01,0.51730821E-01,0.55246729E-01 +gfortran,1500,0.58974233E+01,0.63987345E+01,0.65677651E-01,0.71260921E-01 
+gfortran,1600,0.74397705E+01,0.81612424E+01,0.85752173E-01,0.94684527E-01 +gfortran,1700,0.94707658E+01,0.95308664E+01,0.91766590E-01,0.10326883E+00 +gfortran,1800,0.10808945E+02,0.11711298E+02,0.11737023E+00,0.13288688E+00 +gfortran,1900,0.12854598E+02,0.14062292E+02,0.13853528E+00,0.15903134E+00 +gfortran,2000,0.15319408E+02,0.16280139E+02,0.16020828E+00,0.19086416E+00 +gfortran,2100,0.18984555E+02,0.20680869E+02,0.17921946E+00,0.22096635E+00 +gfortran,2200,0.21225083E+02,0.22401707E+02,0.21741163E+00,0.26642611E+00 +gfortran,2300,0.24340594E+02,0.27298272E+02,0.25116208E+00,0.32690401E+00 +gfortran,2400,0.29539821E+02,0.31200585E+02,0.27621742E+00,0.35614406E+00 +gfortran,2500,0.33012333E+02,0.34869524E+02,0.29833450E+00,0.41418427E+00 +gfortran,2600,0.37653487E+02,0.38693223E+02,0.37339042E+00,0.48488226E+00 +gfortran,2700,0.43775129E+02,0.44011717E+02,0.42273598E+00,0.55674638E+00 +gfortran,2800,0.46865910E+02,0.51751799E+02,0.42849244E+00,0.61609360E+00 +gfortran,2900,0.53416371E+02,0.57667004E+02,0.50689343E+00,0.73876719E+00 +gfortran,3000,0.59658597E+02,0.63521616E+02,0.53852453E+00,0.80783996E+00 +gfortran,3100,0.64912150E+02,0.70354467E+02,0.66474030E+00,0.89399829E+00 +gfortran,3200,0.90602590E+02,0.10027437E+03,0.85063715E+00,0.10578788E+01 +gfortran,3300,0.81809889E+02,0.84734370E+02,0.79015186E+00,0.11065690E+01 +gfortran,3400,0.88535837E+02,0.95473385E+02,0.86069586E+00,0.12151891E+01 +gfortran,3500,0.98416554E+02,0.10100206E+03,0.95841599E+00,0.13262034E+01 +gfortran,4000,-1.00000000E+00,-1.00000000E+00,0.16826234E+01,0.20811888E+01 +gfortran,4500,-1.00000000E+00,-1.00000000E+00,0.25307609E+01,0.30088221E+01 +gfortran,5000,-1.00000000E+00,-1.00000000E+00,0.35788683E+01,0.40577505E+01 +gfortran,5500,-1.00000000E+00,-1.00000000E+00,0.48177959E+01,0.52263592E+01 +gfortran,6000,-1.00000000E+00,-1.00000000E+00,0.62184667E+01,0.66499992E+01 +gfortran,6500,-1.00000000E+00,-1.00000000E+00,0.79128923E+01,0.83428266E+01 
+gfortran,7000,-1.00000000E+00,-1.00000000E+00,0.99424035E+01,0.10330868E+02 +gfortran,7500,-1.00000000E+00,-1.00000000E+00,0.12193222E+02,0.12621387E+02 +gfortran,8000,-1.00000000E+00,-1.00000000E+00,0.15541630E+02,0.16425930E+02 +gfortran,8500,-1.00000000E+00,-1.00000000E+00,0.19036642E+02,0.18838578E+02 +gfortran,9000,-1.00000000E+00,-1.00000000E+00,0.21588447E+02,0.21810834E+02 +gfortran,9500,-1.00000000E+00,-1.00000000E+00,0.26831378E+02,0.27189868E+02 +gfortran,10000,-1.00000000E+00,-1.00000000E+00,0.30144515E+02,0.30040566E+02 +gfortran,10500,-1.00000000E+00,-1.00000000E+00,0.36579010E+02,0.36216507E+02 +gfortran,11000,-1.00000000E+00,-1.00000000E+00,0.39791483E+02,0.40647974E+02 +gfortran,11500,-1.00000000E+00,-1.00000000E+00,0.48409088E+02,0.46128549E+02 +gfortran,12000,-1.00000000E+00,-1.00000000E+00,0.53845028E+02,0.52554446E+02 + + +ifx,100,0.13360000E-02,0.25300000E-03,0.28400000E-03,0.62280000E-02 +ifx,200,0.94300000E-03,0.70300000E-03,0.17500000E-02,0.53200000E-03 +ifx,300,0.19540000E-02,0.98800000E-03,0.56620000E-02,0.11900000E-02 +ifx,400,0.41050000E-02,0.20040000E-02,0.12329000E-01,0.18200000E-02 +ifx,500,0.67680000E-02,0.40920000E-02,0.23081000E-01,0.37860000E-02 +ifx,600,0.10042000E-01,0.64440000E-02,0.35787000E-01,0.58940000E-02 +ifx,700,0.12868000E-01,0.94340000E-02,0.52539000E-01,0.86270000E-02 +ifx,800,0.16007000E-01,0.13084000E-01,0.79775000E-01,0.13380000E-01 +ifx,900,0.23096000E-01,0.18096000E-01,0.10751300E+00,0.17598000E-01 +ifx,1000,0.33346000E-01,0.24033000E-01,0.14744800E+00,0.22746000E-01 +ifx,1100,0.42964000E-01,0.33314000E-01,0.19822200E+00,0.29080000E-01 +ifx,1200,0.55479000E-01,0.42391000E-01,0.23895200E+00,0.35114000E-01 +ifx,1300,0.68742000E-01,0.55721000E-01,0.28449800E+00,0.42838000E-01 +ifx,1400,0.85410000E-01,0.69581000E-01,0.33305000E+00,0.51189000E-01 +ifx,1500,0.92537000E-01,0.87938000E-01,0.39305200E+00,0.61710000E-01 +ifx,1600,0.97579000E-01,0.10292500E+00,0.45614300E+00,0.72555000E-01 
+ifx,1700,0.13226000E+00,0.13129200E+00,0.53266300E+00,0.85557000E-01 +ifx,1800,0.17739500E+00,0.15892500E+00,0.61273400E+00,0.95487000E-01 +ifx,1900,0.19851200E+00,0.20065300E+00,0.69702400E+00,0.11089200E+00 +ifx,2000,0.23342300E+00,0.23405400E+00,0.79726200E+00,0.12518300E+00 +ifx,2100,0.27690300E+00,0.29127200E+00,0.88808500E+00,0.14490200E+00 +ifx,2200,0.32643700E+00,0.34764600E+00,0.98091000E+00,0.16227200E+00 +ifx,2300,0.34848900E+00,0.43037800E+00,0.11075950E+01,0.18454700E+00 +ifx,2400,0.35825000E+00,0.50075100E+00,0.12508380E+01,0.20945700E+00 +ifx,2500,0.43318300E+00,0.57629600E+00,0.14015760E+01,0.24338300E+00 +ifx,2600,0.57317000E+00,0.65597400E+00,0.14842900E+01,0.27745400E+00 +ifx,2700,0.65872800E+00,0.81337300E+00,0.15621860E+01,0.32211200E+00 +ifx,2800,0.76228100E+00,0.84309800E+00,0.16839030E+01,0.35929700E+00 +ifx,2900,0.89145000E+00,0.10103540E+01,0.18771880E+01,0.41419000E+00 +ifx,3000,0.97091300E+00,0.11404110E+01,0.20041990E+01,0.45558600E+00 +ifx,3100,0.10147800E+01,0.12432690E+01,0.22279590E+01,0.49801900E+00 +ifx,3200,0.99914000E+00,0.14452240E+01,0.24975040E+01,0.57101400E+00 +ifx,3300,0.13023230E+01,0.15406600E+01,0.25502840E+01,0.65513700E+00 +ifx,3400,0.16021900E+01,0.16822170E+01,0.27196720E+01,0.73279200E+00 +ifx,3500,0.18083680E+01,0.19370000E+01,0.30889160E+01,0.82299700E+00 +ifx,4000,-1.00000000E+00,-1.00000000E+00,0.37374140E+01,0.13459400E+01 +ifx,4500,-1.00000000E+00,-1.00000000E+00,0.52909560E+01,0.20961750E+01 +ifx,5000,-1.00000000E+00,-1.00000000E+00,0.72129850E+01,0.30744000E+01 +ifx,5500,-1.00000000E+00,-1.00000000E+00,0.98952170E+01,0.44634310E+01 +ifx,6000,-1.00000000E+00,-1.00000000E+00,0.12723331E+02,0.56981020E+01 +ifx,6500,-1.00000000E+00,-1.00000000E+00,0.16173005E+02,0.71214460E+01 +ifx,7000,-1.00000000E+00,-1.00000000E+00,0.20182348E+02,0.88443290E+01 +ifx,7500,-1.00000000E+00,-1.00000000E+00,0.24834025E+02,0.11663073E+02 +ifx,8000,-1.00000000E+00,-1.00000000E+00,0.31287529E+02,0.13548773E+02 
+ifx,8500,-1.00000000E+00,-1.00000000E+00,0.35770167E+02,0.16096941E+02 +ifx,9000,-1.00000000E+00,-1.00000000E+00,0.42917785E+02,0.19461302E+02 +ifx,9500,-1.00000000E+00,-1.00000000E+00,0.51301884E+02,0.24265284E+02 +ifx,10000,-1.00000000E+00,-1.00000000E+00,0.59026402E+02,0.26132817E+02 +ifx,10500,-1.00000000E+00,-1.00000000E+00,0.71054785E+02,0.30471835E+02 +ifx,11000,-1.00000000E+00,-1.00000000E+00,0.80024689E+02,0.35037184E+02 +ifx,11500,-1.00000000E+00,-1.00000000E+00,0.91333416E+02,0.39988416E+02 +ifx,12000,-1.00000000E+00,-1.00000000E+00,0.10576859E+03,0.45397994E+02 diff --git a/report/figures/plots.gnu b/report/figures/plots.gnu index 3f64e8c..3342372 100644 --- a/report/figures/plots.gnu +++ b/report/figures/plots.gnu @@ -1,172 +1,97 @@ +# Global settings set datafile separator "," -set xtics 2000 -set xtics rotate by -90 +# Borrowing the ColorBrewer set 1 theme from R for colours +set linetype 1 lc rgb '#E41A1C' pt 7 ps 0.3 +set linetype 2 lc rgb '#377EB8' pt 7 ps 0.3 +set linetype 3 lc rgb '#4DAF4A' pt 7 ps 0.3 +set linetype 4 lc rgb '#984EA3' pt 7 ps 0.3 + +# Logscale and tics for cairolatex +set logscale xy 10 +set format y '$10^{%T}$' -# SERIAL, O3, GFORTRAN-SPECIFIC RESULTS (FIGURE 1) +# Make them evenly spaced this time +set xtics autofreq +set mxtics 10 +set mytics 10 -#set terminal x11 0 title "Fig. 1 N-scaling" persist -set terminal cairolatex pdf size 5in,3in -set output "f1_n_scaling.tex" -set logscale y 10 -set logscale x 10 +# And look good as well +set grid xtics ytics # Log-grid +set offsets graph 0.05, graph 0.05, graph 0.05, graph 0.05 +set key above center horizontal +# === FIGURE 1: SERIAL GFORTRAN === +set terminal cairolatex pdf size 5in,2.5in +set output "f1_n_scaling.tex" set xlabel "Size [$N \\times N$]" set ylabel "Wall Time [s]" - -set format y '$10^{%T}$' -set offsets graph 0.05, graph 0.05, graph 0.05, graph 0.05 -set key bottom right -set grid set xrange[70:15500] -plot 'gfortran_O3_serial.csv' using 1:($2 > 0 ? 
$2 : 1/0) with linespoints pt 7 ps 0.2 title "Row loop", \ - 'gfortran_O3_serial.csv' using 1:($3 > 0 ? $3 : 1/0) with linespoints pt 7 ps 0.2 title "Col loop",\ - 'gfortran_O3_serial.csv' using 1:4 with linespoints pt 7 ps 0.2 title "Matmul", \ - 'gfortran_O3_serial.csv' using 1:5 with linespoints pt 7 ps 0.2 title "DGEMM" +plot 'gfortran_O3_serial.csv' using 1:($2 > 0 ? $2 : 1/0) with linespoints title "Row-major loop", \ + 'gfortran_O3_serial.csv' using 1:($3 > 0 ? $3 : 1/0) with linespoints title "Col.-major loop", \ + 'gfortran_O3_serial.csv' using 1:4 with linespoints title "\\texttt{Matmul}", \ + 'gfortran_O3_serial.csv' using 1:5 with linespoints title "DGEMM", \ + 1e-11*x**3 with line lc rgb 'black' dt 2 notitle - -# SERIAL, O3, COMPILER-DEPENDENT WALL TIMES (LOOPS ONLY) (FIGURE 2) - -set xtics 1000 -#set terminal x11 1 title "Fig.2 Compiler" persist -set terminal cairolatex pdf size 5in,3in +# === FIGURE 2: COMPILER COMPARISON (LOOPS) === +#set xtics (100,150,200,300,400,500,700,1000,1500,2100,3000) set output "f2_compilers_scaling.tex" - -set logscale y 10 -set logscale x 10 - -set xlabel "Size [$N \\times N$]" -set ylabel "Wall Time [s]" - -set format y '$10^{%T}$' -set offsets graph 0.05, graph 0.05, graph 0.05, graph 0.05 -set key bottom right -set grid -set xrange[70:5000] - -plot 'ifx_vs_gfortran_O3_serial_results.csv' index 0 using 2:($3 > 0 ? $3 : 1/0) with linespoints pt 7 ps 0.2 title "GCC: Row loop", \ - 'ifx_vs_gfortran_O3_serial_results.csv' index 0 using 2:($4 > 0 ? $4 : 1/0) with linespoints pt 7 ps 0.2 title "GCC: Col loop", \ - 'ifx_vs_gfortran_O3_serial_results.csv' index 1 using 2:($3 > 0 ? $3 : 1/0) with linespoints pt 7 ps 0.2 title "IFX: Row loop", \ - 'ifx_vs_gfortran_O3_serial_results.csv' index 1 using 2:($4 > 0 ? $4 : 1/0) with linespoints pt 7 ps 0.2 title "IFX: Col loop", \ +set xrange[40:10000] +plot 'ifx_vs_gfortran_O3_serial_results.csv' index 0 using 2:($3 > 0 ? 
$3 : 1/0) with linespoints title "\\texttt{gfortran}: Row-major", \ + 'ifx_vs_gfortran_O3_serial_results.csv' index 0 using 2:($4 > 0 ? $4 : 1/0) with linespoints title "\\texttt{gfortran}: Col.-major", \ + 'ifx_vs_gfortran_O3_serial_results.csv' index 1 using 2:($3 > 0 ? $3 : 1/0) with linespoints title "\\texttt{ifx}: Row-major", \ + 'ifx_vs_gfortran_O3_serial_results.csv' index 1 using 2:($4 > 0 ? $4 : 1/0) with linespoints title "\\texttt{ifx}: Col.-major", \ + 1e-11*x**3 with line lc rgb 'black' dt 2 notitle -# SERIAL, O3, COMPILER-DEPENDENT WALL TIMES (MATMUL/BLAS ONLY) (FIGURE 3) - -set xtics 2000 -#set terminal x11 2 title "Fig.3 Compiler" persist -set terminal cairolatex pdf size 5in,3in +# === FIGURE 3: COMPILER COMPARISON (BLAS) === +#set xtics (100,150,200,300,400,500,700,1000,1500,2100,3000,4500,7000,11000) set output "f3_compilers_scaling.tex" - -set logscale y 10 -set logscale x 10 - -set xlabel "Size [$N \\times N$]" -set ylabel "Wall Time [s]" - -set format y '$10^{%T}$' -set offsets graph 0.05, graph 0.05, graph 0.05, graph 0.05 -set key bottom right -set grid set xrange[70:15500] -plot 'ifx_vs_gfortran_O3_serial_results.csv' index 0 using 2:($5 > 0 ? $5 : 1/0) with linespoints pt 7 ps 0.2 title 'GCC: \texttt{matmul}', \ - 'ifx_vs_gfortran_O3_serial_results.csv' index 0 using 2:($6 > 0 ? $6 : 1/0) with linespoints pt 7 ps 0.2 title 'GCC: OpenBLAS', \ - 'ifx_vs_gfortran_O3_serial_results.csv' index 1 using 2:($5 > 0 ? $5 : 1/0) with linespoints pt 7 ps 0.2 title 'IFX: \texttt{matmul}', \ - 'ifx_vs_gfortran_O3_serial_results.csv' index 1 using 2:($6 > 0 ? $6 : 1/0) with linespoints pt 7 ps 0.2 title 'IFX: MKL BLAS', \ - +plot "ifx_vs_gfortran_O3_serial_results.csv" index 0 using 2:($5 > 0 ? $5 : 1/0) with linespoints title "\\texttt{gfortran}: \\texttt{matmul}", \ + "ifx_vs_gfortran_O3_serial_results.csv" index 0 using 2:($6 > 0 ? 
$6 : 1/0) with linespoints title "\\texttt{gfortran}: OpenBLAS", \ + "ifx_vs_gfortran_O3_serial_results.csv" index 1 using 2:($5 > 0 ? $5 : 1/0) with linespoints title "\\texttt{ifx}: \\texttt{matmul}", \ + "ifx_vs_gfortran_O3_serial_results.csv" index 1 using 2:($6 > 0 ? $6 : 1/0) with linespoints title "\\texttt{ifx}: MKL BLAS", \ + 1e-11*x**3 with line lc rgb "black" dt 2 notitle -# PARALLEL, O3, COMPILER-DEPEDENT WALL TIMES. LOOPS ONLY (FIGURE 4) - -set xtics 1000 -set terminal cairolatex pdf size 5in,3in +# === FIGURE 4: PARALLEL LOOPS === set output "f4_compilers_scaling.tex" - -set logscale y 10 -set logscale x 10 - -set xlabel "Size [$N \\times N$]" -set ylabel "Wall Time [s]" - -set format y '$10^{%T}$' -set offsets graph 0.05, graph 0.05, graph 0.05, graph 0.05 -set key bottom right -set grid -set xrange[70:5000] +set xrange[40:10000] -plot 'ifx_vs_gfortran_parallel_O3_results.csv' index 0 using 2:($3 > 0 ? $3 : 1/0) with linespoints pt 7 ps 0.2 title "GCC: Row loop", \ - 'ifx_vs_gfortran_parallel_O3_results.csv' index 0 using 2:($4 > 0 ? $4 : 1/0) with linespoints pt 7 ps 0.2 title "GCC: Col loop", \ - 'ifx_vs_gfortran_parallel_O3_results.csv' index 1 using 2:($3 > 0 ? $3 : 1/0) with linespoints pt 7 ps 0.2 title "IFX: Row loop", \ - 'ifx_vs_gfortran_parallel_O3_results.csv' index 1 using 2:($4 > 0 ? $4 : 1/0) with linespoints pt 7 ps 0.2 title "IFX: Col loop", \ +plot "ifx_vs_gfortran_parallel_O3_results.csv" index 0 using 2:($3 > 0 ? $3 : 1/0) with linespoints title "\\texttt{gfortran}: Row-major", \ + "ifx_vs_gfortran_parallel_O3_results.csv" index 0 using 2:($4 > 0 ? $4 : 1/0) with linespoints title "\\texttt{gfortran}: Col.-major", \ + "ifx_vs_gfortran_parallel_O3_results.csv" index 1 using 2:($3 > 0 ? $3 : 1/0) with linespoints title "\\texttt{ifx}: Row-major", \ + "ifx_vs_gfortran_parallel_O3_results.csv" index 1 using 2:($4 > 0 ? 
$4 : 1/0) with linespoints title "\\texttt{ifx}: Col.-major", \ + 1e-11*x**3 with line lc rgb 'black' dt 2 notitle -# PARALLEL, O3, COMPILER-DEPENDENT WALL TIMES. MATMUL/BLAS ONLY (FIGURE 5) - -set terminal cairolatex pdf size 5in,3in +# === FIGURE 5: PARALLEL BLAS === set output "f5_compilers_scaling.tex" - -set logscale y 10 -set logscale x 10 -set xtics 2000 - -set xlabel "Size [$N \\times N$]" -set ylabel "Wall Time [s]" - -set format y '$10^{%T}$' -set offsets graph 0.05, graph 0.05, graph 0.05, graph 0.05 -set key bottom right -set grid set xrange[70:15500] -plot 'ifx_vs_gfortran_parallel_O3_results.csv' index 0 using 2:($5 > 0 ? $5 : 1/0) with linespoints pt 7 ps 0.2 title 'GCC: \texttt{matmul}', \ - 'ifx_vs_gfortran_parallel_O3_results.csv' index 0 using 2:($6 > 0 ? $6 : 1/0) with linespoints pt 7 ps 0.2 title 'GCC: OpenBLAS', \ - 'ifx_vs_gfortran_parallel_O3_results.csv' index 1 using 2:($5 > 0 ? $5 : 1/0) with linespoints pt 7 ps 0.2 title 'IFX: \texttt{matmul}', \ - 'ifx_vs_gfortran_parallel_O3_results.csv' index 1 using 2:($6 > 0 ? $6 : 1/0) with linespoints pt 7 ps 0.2 title 'IFX: MKL BLAS', \ - - -# COMPILER FLAGS COMPARISON. GFORTRAN ONLY. LOOP ONLY. (FIGURE 6) +plot "ifx_vs_gfortran_parallel_O3_results.csv" index 0 using 2:($5 > 0 ? $5 : 1/0) with linespoints title "\\texttt{gfortran}: \\texttt{matmul}", \ + "ifx_vs_gfortran_parallel_O3_results.csv" index 0 using 2:($6 > 0 ? $6 : 1/0) with linespoints title "\\texttt{gfortran}: OpenBLAS", \ + "ifx_vs_gfortran_parallel_O3_results.csv" index 1 using 2:($5 > 0 ? $5 : 1/0) with linespoints title "\\texttt{ifx}: \\texttt{matmul}", \ + "ifx_vs_gfortran_parallel_O3_results.csv" index 1 using 2:($6 > 0 ? 
$6 : 1/0) with linespoints title "\\texttt{ifx}: MKL BLAS", \ + 1e-11*x**3 with line lc rgb 'black' dt 2 notitle -#set terminal x11 persist -set terminal cairolatex pdf size 5in,3in +# === FIGURE 6: GFORTRAN FLAGS === set output "f6_optflags_scaling.tex" +set xrange[40:10000] -set logscale y 10 -set logscale x 10 -set xtics 1000 +plot "gfortran_rowloop_optflags.csv" using 1:2 with linespoints title "\\texttt{gfortran}: O1", \ + "gfortran_rowloop_optflags.csv" using 1:3 with linespoints title "\\texttt{gfortran}: O2", \ + "gfortran_rowloop_optflags.csv" using 1:4 with linespoints title "\\texttt{gfortran}: O3", \ + "gfortran_rowloop_optflags.csv" using 1:5 with linespoints title "\\texttt{gfortran}: Ofast", \ + 1e-10*x**3 with line lc rgb 'black' dt 2 notitle -set xlabel "Size [$N \\times N$]" -set ylabel "Wall Time [s]" - -set format y '$10^{%T}$' -set offsets graph 0.05, graph 0.05, graph 0.05, graph 0.05 -set key bottom right -set grid -set xrange[70:5000] - -plot 'gfortran_rowloop_optflags.csv' using 1:2 with linespoints pt 7 ps 0.2 title 'GCC: O1', \ - 'gfortran_rowloop_optflags.csv' using 1:3 with linespoints pt 7 ps 0.2 title 'GCC: O2', \ - 'gfortran_rowloop_optflags.csv' using 1:4 with linespoints pt 7 ps 0.2 title 'GCC: O3', \ - 'gfortran_rowloop_optflags.csv' using 1:5 with linespoints pt 7 ps 0.2 title 'GCC: Ofast', \ - - -# COMPILER FLAGS COMPARISON. IFX ONLY. LOOP ONLY. 
(FIGURE 7) - -#set terminal x11 persist -set terminal cairolatex pdf size 5in,3in +# === FIGURE 7: IFX FLAGS === set output "f7_optflags_scaling.tex" +set xrange[40:10000] -set logscale y 10 -set logscale x 10 -set xtics 1000 +plot "ifx_rowloop_optflags.csv" using 1:2 with linespoints title "\\texttt{ifx}: O1", \ + "ifx_rowloop_optflags.csv" using 1:3 with linespoints title "\\texttt{ifx}: O2", \ + "ifx_rowloop_optflags.csv" using 1:4 with linespoints title "\\texttt{ifx}: O3", \ + "ifx_rowloop_optflags.csv" using 1:5 with linespoints title "\\texttt{ifx}: Ofast", \ + 1e-11*x**3 with line lc rgb 'black' dt 2 notitle -set xlabel "Size [$N \\times N$]" -set ylabel "Wall Time [s]" - -set format y '$10^{%T}$' -set offsets graph 0.05, graph 0.05, graph 0.05, graph 0.05 -set key bottom right -set grid -set xrange[70:5000] - -plot 'ifx_rowloop_optflags.csv' using 1:2 with linespoints pt 7 ps 0.2 title 'IFX: O1', \ - 'ifx_rowloop_optflags.csv' using 1:3 with linespoints pt 7 ps 0.2 title 'IFX: O2', \ - 'ifx_rowloop_optflags.csv' using 1:4 with linespoints pt 7 ps 0.2 title 'IFX: O3', \ - 'ifx_rowloop_optflags.csv' using 1:5 with linespoints pt 7 ps 0.2 title 'IFX: Ofast', \ -- cgit v1.2.3