Merge branch 'master' of github.com:cwpearson/cem17
This commit is contained in:
194
main.tex
194
main.tex
@@ -12,6 +12,8 @@
|
||||
\documentclass[10pt,conference,a4paper]{IEEEtran}
|
||||
\usepackage{times,amsmath,epsfig}
|
||||
\usepackage{makecell}
|
||||
\usepackage{todonotes}
|
||||
\usepackage{verbatim}
|
||||
|
||||
\title{Solving Problems Involving Inhomogeneous Media with MLFMA on GPU Clusters}
|
||||
\author{
|
||||
@@ -40,24 +42,22 @@ In order to achieve an efficient implementation on multiple graphics processing
|
||||
\section{Inverse-Scattering Formulation and Application Architecture}
|
||||
\label{sec:application}
|
||||
|
||||
Table~\ref{tab:components} shows the breakdown of application component execution times on the Blue Waters supercomputer.
|
||||
Fig.~\ref{fig:app_breakdown} shows the amount of time the full inverse-solver application spends on MLFMM in two parallelized CPU executions.
|
||||
|
||||
\begin{table}{}
|
||||
\centering \caption{Breakdown of Application Component Time} \label{tab:components}
|
||||
\begin{tabular}{|c|c|}
|
||||
\hline \textbf{Component} & \textbf{Wall Time (s)} \\
|
||||
\hline
|
||||
\hline Preprocessing & 0 \\
|
||||
\hline Setup & 0 \\
|
||||
\hline Solution & 0 \\
|
||||
\hline Matvec & 0 \\
|
||||
\hline Solver & 0 \\
|
||||
\hline Postprocessing & 0 \\
|
||||
\hline Other & 0 \\
|
||||
\hline Total & 0 \\
|
||||
\hline
|
||||
``BW (32T)'' corresponds to a 32-thread OpenMP parallel run on a single XE node, and S822LC corresponds to a 160-thread OpenMP parallel run on the S822LC node.
|
||||
Non-MLFMM operations are a minority of the time, and become an even smaller proportion of the time as the object reconstructions grow larger.
|
||||
|
||||
\begin{figure}[b]
|
||||
\begin{center}
|
||||
\begin{tabular}{c}
|
||||
\mbox{\psfig{figure=figures/cpu_matvec.pdf,width=8cm}}
|
||||
\end{tabular}
|
||||
\end{table}
|
||||
\end{center}
|
||||
\caption{A three-dimensional plot with gray-scale format.}
|
||||
\label{fig:app_breakdown}
|
||||
\end{figure}
|
||||
|
||||
|
||||
|
||||
\section{MLFMM Results}
|
||||
|
||||
@@ -97,85 +97,100 @@ The P100s are connected to the Power8 CPUs via $80$~GB/s NVLink connections.
|
||||
|
||||
\subsection{MLFMM Performance}
|
||||
|
||||
\subsection{GPU Kernel Performance}
|
||||
All evaluations are done on a problem with these parameters. \todo{get from mert}
|
||||
|
||||
Table~\ref{tab:mlfmm_breakdown} shows the breakdown of MLFMM kernel times in different execution environments.
|
||||
|
||||
Fig.~\ref{fig:kernel_breakdown} shows the amount of MLFMM execution time spent in computational kernels.
|
||||
|
||||
\begin{figure}[b]
|
||||
\begin{center}
|
||||
\begin{tabular}{c}
|
||||
\mbox{\psfig{figure=figures/example_fig0.pdf,width=8cm}}
|
||||
\mbox{\psfig{figure=figures/mlfmm_bw.pdf,width=8cm}}
|
||||
\end{tabular}
|
||||
\end{center}
|
||||
\caption{A three-dimensional plot with gray-scale
|
||||
format.}\label{fig1}
|
||||
\caption{BW.}
|
||||
\label{fig:kernel_breakdown}
|
||||
\end{figure}
|
||||
|
||||
Fig.~\ref{fig:kernel_breakdown} shows the amount of MLFMM execution time spent in computational kernels.
|
||||
|
||||
\begin{figure}[b]
|
||||
\begin{center}
|
||||
\begin{tabular}{c}
|
||||
\mbox{\psfig{figure=figures/mlfmm_minsky.pdf,width=8cm}}
|
||||
\end{tabular}
|
||||
\end{center}
|
||||
\caption{A three-dimensional plot with gray-scale format.}
|
||||
\label{fig:kernel_breakdown}
|
||||
\end{figure}
|
||||
|
||||
|
||||
|
||||
\subsection{Computation Kernel Breakdown}
|
||||
|
||||
Fig.~\ref{fig:kernel_breakdown} shows the amount of MLFMM execution time spent in computational kernels.
|
||||
|
||||
\begin{figure}[b]
|
||||
\begin{center}
|
||||
\begin{tabular}{c}
|
||||
\mbox{\psfig{figure=figures/kernels.pdf,width=8cm}}
|
||||
\end{tabular}
|
||||
\end{center}
|
||||
\caption{A three-dimensional plot with gray-scale format.}
|
||||
\label{fig:kernel_breakdown}
|
||||
\end{figure}
|
||||
|
||||
|
||||
|
||||
This document is a template for authors preparing papers for the
|
||||
CEM'17 Computing and Electromagnetics Workshop in Barcelona, Spain.
|
||||
The papers are required to use the IEEE style by following the
|
||||
instructions provided in this document. The language is English.
|
||||
The papers are expected to be two-pages long.
|
||||
\begin{figure}[b]
|
||||
\begin{center}
|
||||
\begin{tabular}{c}
|
||||
\mbox{\psfig{figure=example_fig0.pdf,width=8cm}}
|
||||
\end{tabular}
|
||||
\end{center}
|
||||
\caption{A three-dimensional plot with gray-scale
|
||||
format.}\label{fig1}
|
||||
\end{figure}
|
||||
|
||||
\section{Text Format} Page size is A4, which is 210 mm (8.27 in) wide and 297 mm
|
||||
(11.69 in) long. The margins are as follows:
|
||||
\begin{itemize}
|
||||
\item Top: 19 mm (0.75 in) \item Bottom: 43 mm (1.69 in) \item
|
||||
Left-Right: 14.32 mm (0.56 in)
|
||||
\end{itemize}
|
||||
The paper is in two column format with a space of 4.22 mm (0.17 in)
|
||||
between columns. All title and author details must be in
|
||||
single-column format and must be centered. All paragraphs are
|
||||
indented. The entire document should be in Times New Roman or
|
||||
Times font. Recommended font size is 10~pt for the main text.
|
||||
Headings of the subsections are as follows, if required:
|
||||
\subsection{This is First-Level Subsection}
|
||||
You may use 1st level subsections, if required.
|
||||
\\
|
||||
\subsubsection{This is Second-Level Subsection}
|
||||
You may use 2nd level subsections, if required.
|
||||
\\
|
||||
\\
|
||||
\indent Page numbers, headers and footers should not be used. All
|
||||
hypertext links and bookmarks should be removed from papers. If
|
||||
you need to refer to an Internet email address or URL in your
|
||||
paper, you should type out the address or URL fully in regular
|
||||
font.
|
||||
|
||||
\begin{figure}[t]
|
||||
\begin{center}
|
||||
\begin{tabular}{c}
|
||||
\mbox{\psfig{figure=example_fig1.pdf,width=8cm}}\\
|
||||
{(a)}\\\\ \mbox{\psfig{figure=example_fig2.pdf,width=8cm}}\\{(b)}
|
||||
\end{tabular}
|
||||
\end{center}
|
||||
\caption{Three-dimensional plots with colors. Using (a)
|
||||
inappropriate and (b) appropriate colors for gray-scale
|
||||
prints.}\label{fig2}
|
||||
\end{figure}
|
||||
\section{Text Format}
|
||||
%Page size is A4, which is 210 mm (8.27 in) wide and 297 mm
|
||||
%(11.69 in) long. The margins are as follows:
|
||||
%\begin{itemize}
|
||||
%\item Top: 19 mm (0.75 in) \item Bottom: 43 mm (1.69 in) \item
|
||||
%Left-Right: 14.32 mm (0.56 in)
|
||||
%\end{itemize}
|
||||
%The paper is in two column format with a space of 4.22 mm (0.17 in)
|
||||
%between columns. All title and author details must be in
|
||||
%single-column format and must be centered. All paragraphs are
|
||||
%indented. The entire document should be in Times New Roman or
|
||||
%Times font. Recommended font size is 10~pt for the main text.
|
||||
%Headings of the subsections are as follows, if required:
|
||||
%\subsection{This is First-Level Subsection}
|
||||
%You may use 1st level subsections, if required.
|
||||
%\\
|
||||
%\subsubsection{This is Second-Level Subsection}
|
||||
%You may use 2nd level subsections, if required.
|
||||
%\\
|
||||
%\\
|
||||
%\indent Page numbers, headers and footers should not be used. All
|
||||
%hypertext links and bookmarks should be removed from papers. If
|
||||
%you need to refer to an Internet email address or URL in your
|
||||
%paper, you should type out the address or URL fully in regular
|
||||
%font.
|
||||
|
||||
\section{Figures and Tables}
|
||||
Figures should be centered in the column, but large figures may
|
||||
span across both columns, if they are positioned either at the top
|
||||
or at the bottom of the page. Graphics should have an adequate
|
||||
resolution. Fig.~\ref{fig1} presents an example plot in gray-scale
|
||||
format. Colors can be used; however, it is recommended that the
|
||||
graphics are checked to reproduce the required details in
|
||||
gray-scale copy. For example, the colors in Fig.~\ref{fig2}(a) are
|
||||
not appropriate for a gray-scale print. For the same plot,
|
||||
Fig.~\ref{fig2}(b) is more preferable. Figures are numbered using
|
||||
Arabic numerals and the captions are in 8~pt regular font. Tables
|
||||
should be numbered using uppercase Roman numerals and their
|
||||
captions are centered as in Table~\ref{table1}.
|
||||
|
||||
|
||||
|
||||
%\section{Figures and Tables}
|
||||
%Figures should be centered in the column, but large figures may
|
||||
%span across both columns, if they are positioned either at the top
|
||||
%or at the bottom of the page. Graphics should have an adequate
|
||||
%resolution. Fig.~\ref{fig1} presents an example plot in gray-scale
|
||||
%format. Colors can be used; however, it is recommended that the
|
||||
%graphics are checked to reproduce the required details in
|
||||
%gray-scale copy. For example, the colors in Fig.~\ref{fig2}(a) are
|
||||
%not appropriate for a gray-scale print. For the same plot,
|
||||
%Fig.~\ref{fig2}(b) is more preferable. Figures are numbered using
|
||||
%Arabic numerals and the captions are in 8~pt regular font. Tables
|
||||
%should be numbered using uppercase Roman numerals and their
|
||||
%captions are centered as in Table~\ref{table1}.
|
||||
|
||||
|
||||
|
||||
@@ -194,24 +209,25 @@ captions are centered as in Table~\ref{table1}.
|
||||
|
||||
|
||||
|
||||
\section{References} The heading of the references section is
|
||||
not numbered and all reference items are in 8~pt font.
|
||||
References are required to be in IEEE style. Please refer to the
|
||||
examples for journals~\cite{journal}, for
|
||||
books~\cite{book1},~\cite{book2}, and for conference
|
||||
papers~\cite{conf1},~\cite{conf2}.
|
||||
\section{References}
|
||||
%The heading of the references section is
|
||||
%not numbered and all reference items are in 8~pt font.
|
||||
%References are required to be in IEEE style. Please refer to the
|
||||
%examples for journals~\cite{journal}, for
|
||||
%books~\cite{book1},~\cite{book2}, and for conference
|
||||
%papers~\cite{conf1},~\cite{conf2}.
|
||||
|
||||
% the following vfill coursely balances the columns on the last page
|
||||
% the following vfill coarsely balances the columns on the last page
|
||||
\vfill \pagebreak
|
||||
|
||||
\section{Conclusions}
|
||||
This template uses IEEE style and provides necessary information
|
||||
to prepare papers for CEM'17 Workshop. Thank you for your
|
||||
contributions.
|
||||
%This template uses IEEE style and provides necessary information
|
||||
%to prepare papers for CEM'17 Workshop. Thank you for your
|
||||
%contributions.
|
||||
|
||||
|
||||
\section*{Acknowledgment}
|
||||
Acknowledgments should be here.
|
||||
%Acknowledgments should be here.
|
||||
|
||||
\bibliographystyle{IEEEtran}
|
||||
\begin{thebibliography}{99}
|
||||
|
Reference in New Issue
Block a user