Updates from ShareLaTeX
This commit is contained in:
@@ -12,6 +12,8 @@
|
|||||||
\documentclass[10pt,conference,a4paper]{IEEEtran}
|
\documentclass[10pt,conference,a4paper]{IEEEtran}
|
||||||
\usepackage{times,amsmath,epsfig}
|
\usepackage{times,amsmath,epsfig}
|
||||||
\usepackage{makecell}
|
\usepackage{makecell}
|
||||||
|
\usepackage{todonotes}
|
||||||
|
\usepackage{verbatim}
|
||||||
|
|
||||||
\title{Solving Problems Involving Inhomogeneous Media with MLFMA on GPU Clusters}
|
\title{Solving Problems Involving Inhomogeneous Media with MLFMA on GPU Clusters}
|
||||||
\author{
|
\author{
|
||||||
@@ -40,24 +42,22 @@ In order to achieve an efficient implementation on multiple graphics processing
|
|||||||
\section{Inverse-Scattering Formulation and Application Architecture}
|
\section{Inverse-Scattering Formulation and Application Architecture}
|
||||||
\label{sec:application}
|
\label{sec:application}
|
||||||
|
|
||||||
Table \ref{tab:components} shows the breakdown of application component execution times on the Blue Waters supercomputer.
|
Fig.~\ref{fig:app_breakdown} shows the amount of time the full inverse-solver application spends on MLFMM in two parallelized CPU executions.
|
||||||
|
|
||||||
\begin{table}{}
|
``BW (32T)'' corresponds to a 32-thread OpenMP parallel run on a single XE node, and S822LC corresponds to a 160-thread OpenMP parallel run on the S822LC node.
|
||||||
\centering \caption{Breakdown of Application Component Time} \label{tab:components}
|
Non-MLFMM operations account for a minority of the execution time, and that share shrinks further as the object reconstructions grow larger.
|
||||||
\begin{tabular}{|c|c|}
|
|
||||||
\hline \textbf{Component} & \textbf{Wall Time (s)} \\
|
\begin{figure}[b]
|
||||||
\hline
|
\begin{center}
|
||||||
\hline Preprocessing & 0 \\
|
\begin{tabular}{c}
|
||||||
\hline Setup & 0 \\
|
\mbox{\psfig{figure=figures/cpu_matvec.pdf,width=8cm}}
|
||||||
\hline Solution & 0 \\
|
|
||||||
\hline Matvec & 0 \\
|
|
||||||
\hline Solver & 0 \\
|
|
||||||
\hline Postprocessing & 0 \\
|
|
||||||
\hline Other & 0 \\
|
|
||||||
\hline Total & 0 \\
|
|
||||||
\hline
|
|
||||||
\end{tabular}
|
\end{tabular}
|
||||||
\end{table}
|
\end{center}
|
||||||
|
\caption{A three-dimensional plot with gray-scale format.}
|
||||||
|
\label{fig:app_breakdown}
|
||||||
|
\end{figure}
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
\section{MLFMM Results}
|
\section{MLFMM Results}
|
||||||
|
|
||||||
@@ -97,85 +97,100 @@ The P100s are connected to the Power8 CPUs via $80$~GB/s NVLink connections.
|
|||||||
|
|
||||||
\subsection{MLFMM Performance}
|
\subsection{MLFMM Performance}
|
||||||
|
|
||||||
\subsection{GPU Kernel Performance}
|
All evaluations are done on a problem with these parameters. \todo{get from mert}
|
||||||
|
|
||||||
Table \ref{tab:mlfmm_breakdown} shows the breakdown of MLFMM kernel times in different execution environments.
|
|
||||||
|
Fig.~\ref{fig:kernel_breakdown} shows the amount of MLFMM execution time spent in computational kernels.
|
||||||
|
|
||||||
\begin{figure}[b]
|
\begin{figure}[b]
|
||||||
\begin{center}
|
\begin{center}
|
||||||
\begin{tabular}{c}
|
\begin{tabular}{c}
|
||||||
\mbox{\psfig{figure=figures/example_fig0.pdf,width=8cm}}
|
\mbox{\psfig{figure=figures/mlfmm_bw.pdf,width=8cm}}
|
||||||
\end{tabular}
|
\end{tabular}
|
||||||
\end{center}
|
\end{center}
|
||||||
\caption{A three-dimensional plot with gray-scale
|
\caption{BW.}
|
||||||
format.}\label{fig1}
|
\label{fig:kernel_breakdown}
|
||||||
\end{figure}
|
\end{figure}
|
||||||
|
|
||||||
|
Fig.~\ref{fig:kernel_breakdown} shows the amount of MLFMM execution time spent in computational kernels.
|
||||||
|
|
||||||
|
\begin{figure}[b]
|
||||||
|
\begin{center}
|
||||||
|
\begin{tabular}{c}
|
||||||
|
\mbox{\psfig{figure=figures/mlfmm_minsky.pdf,width=8cm}}
|
||||||
|
\end{tabular}
|
||||||
|
\end{center}
|
||||||
|
\caption{A three-dimensional plot with gray-scale format.}
|
||||||
|
\label{fig:kernel_breakdown}
|
||||||
|
\end{figure}
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
\subsection{Computation Kernel Breakdown}
|
||||||
|
|
||||||
|
Fig.~\ref{fig:kernel_breakdown} shows the amount of MLFMM execution time spent in computational kernels.
|
||||||
|
|
||||||
|
\begin{figure}[b]
|
||||||
|
\begin{center}
|
||||||
|
\begin{tabular}{c}
|
||||||
|
\mbox{\psfig{figure=figures/kernels.pdf,width=8cm}}
|
||||||
|
\end{tabular}
|
||||||
|
\end{center}
|
||||||
|
\caption{A three-dimensional plot with gray-scale format.}
|
||||||
|
\label{fig:kernel_breakdown}
|
||||||
|
\end{figure}
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
This document is a template for authors preparing papers for the
|
This document is a template for authors preparing papers for the
|
||||||
CEM'17 Computing and Electromagnetics Workshop in Barcelona, Spain.
|
CEM'17 Computing and Electromagnetics Workshop in Barcelona, Spain.
|
||||||
The papers are required to use the IEEE style by following the
|
The papers are required to use the IEEE style by following the
|
||||||
instructions provided in this document. The language is English.
|
instructions provided in this document. The language is English.
|
||||||
The papers are expected to be two-pages long.
|
The papers are expected to be two-pages long.
|
||||||
\begin{figure}[b]
|
|
||||||
\begin{center}
|
|
||||||
\begin{tabular}{c}
|
|
||||||
\mbox{\psfig{figure=example_fig0.pdf,width=8cm}}
|
|
||||||
\end{tabular}
|
|
||||||
\end{center}
|
|
||||||
\caption{A three-dimensional plot with gray-scale
|
|
||||||
format.}\label{fig1}
|
|
||||||
\end{figure}
|
|
||||||
|
|
||||||
\section{Text Format} Page size is A4, which is 210 mm (8.27 in) wide and 297 mm
|
|
||||||
(11.69 in) long. The margins are as follows:
|
|
||||||
\begin{itemize}
|
|
||||||
\item Top: 19 mm (0.75 in) \item Bottom: 43 mm (1.69 in) \item
|
|
||||||
Left-Right: 14.32 mm (0.56 in)
|
|
||||||
\end{itemize}
|
|
||||||
The paper is in two column format with a space of 4.22 mm (0.17 in)
|
|
||||||
between columns. All title and author details must be in
|
|
||||||
single-column format and must be centered. All paragraphs are
|
|
||||||
indented. The entire document should be in Times New Roman or
|
|
||||||
Times font. Recommended font size is 10~pt for the main text.
|
|
||||||
Headings of the subsections are as follows, if required:
|
|
||||||
\subsection{This is First-Level Subsection}
|
|
||||||
You may use 1st level subsections, if required.
|
|
||||||
\\
|
|
||||||
\subsubsection{This is Second-Level Subsection}
|
|
||||||
You may use 2nd level subsections, if required.
|
|
||||||
\\
|
|
||||||
\\
|
|
||||||
\indent Page numbers, headers and footers should not be used. All
|
|
||||||
hypertext links and bookmarks should be removed from papers. If
|
|
||||||
you need to refer to an Internet email address or URL in your
|
|
||||||
paper, you should type out the address or URL fully in regular
|
|
||||||
font.
|
|
||||||
|
|
||||||
\begin{figure}[t]
|
\section{Text Format}
|
||||||
\begin{center}
|
%Page size is A4, which is 210 mm (8.27 in) wide and 297 mm
|
||||||
\begin{tabular}{c}
|
%(11.69 in) long. The margins are as follows:
|
||||||
\mbox{\psfig{figure=example_fig1.pdf,width=8cm}}\\
|
%\begin{itemize}
|
||||||
{(a)}\\\\ \mbox{\psfig{figure=example_fig2.pdf,width=8cm}}\\{(b)}
|
%\item Top: 19 mm (0.75 in) \item Bottom: 43 mm (1.69 in) \item
|
||||||
\end{tabular}
|
%Left-Right: 14.32 mm (0.56 in)
|
||||||
\end{center}
|
%\end{itemize}
|
||||||
\caption{Three-dimensional plots with colors. Using (a)
|
%The paper is in two column format with a space of 4.22 mm (0.17 in)
|
||||||
inappropriate and (b) appropriate colors for gray-scale
|
%between columns. All title and author details must be in
|
||||||
prints.}\label{fig2}
|
%single-column format and must be centered. All paragraphs are
|
||||||
\end{figure}
|
%indented. The entire document should be in Times New Roman or
|
||||||
|
%Times font. Recommended font size is 10~pt for the main text.
|
||||||
|
%Headings of the subsections are as follows, if required:
|
||||||
|
%\subsection{This is First-Level Subsection}
|
||||||
|
%You may use 1st level subsections, if required.
|
||||||
|
%\\
|
||||||
|
%\subsubsection{This is Second-Level Subsection}
|
||||||
|
%You may use 2nd level subsections, if required.
|
||||||
|
%\\
|
||||||
|
%\\
|
||||||
|
%\indent Page numbers, headers and footers should not be used. All
|
||||||
|
%hypertext links and bookmarks should be removed from papers. If
|
||||||
|
%you need to refer to an Internet email address or URL in your
|
||||||
|
%paper, you should type out the address or URL fully in regular
|
||||||
|
%font.
|
||||||
|
|
||||||
\section{Figures and Tables}
|
|
||||||
Figures should be centered in the column, but large figures may
|
|
||||||
span across both columns, if they are positioned either at the top
|
|
||||||
or at the bottom of the page. Graphics should have an adequate
|
%\section{Figures and Tables}
|
||||||
resolution. Fig.~\ref{fig1} presents an example plot in gray-scale
|
%Figures should be centered in the column, but large figures may
|
||||||
format. Colors can be used; however, it is recommended that the
|
%span across both columns, if they are positioned either at the top
|
||||||
graphics are checked to reproduce the required details in
|
%or at the bottom of the page. Graphics should have an adequate
|
||||||
gray-scale copy. For example, the colors in Fig.~\ref{fig2}(a) are
|
%resolution. Fig.~\ref{fig1} presents an example plot in gray-scale
|
||||||
not appropriate for a gray-scale print. For the same plot,
|
%format. Colors can be used; however, it is recommended that the
|
||||||
Fig.~\ref{fig2}(b) is more preferable. Figures are numbered using
|
%graphics are checked to reproduce the required details in
|
||||||
Arabic numerals and the captions are in 8~pt regular font. Tables
|
%gray-scale copy. For example, the colors in Fig.~\ref{fig2}(a) are
|
||||||
should be numbered using uppercase Roman numerals and their
|
%not appropriate for a gray-scale print. For the same plot,
|
||||||
captions are centered as in Table~\ref{table1}.
|
%Fig.~\ref{fig2}(b) is more preferable. Figures are numbered using
|
||||||
|
%Arabic numerals and the captions are in 8~pt regular font. Tables
|
||||||
|
%should be numbered using uppercase Roman numerals and their
|
||||||
|
%captions are centered as in Table~\ref{table1}.
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
@@ -194,24 +209,25 @@ captions are centered as in Table~\ref{table1}.
|
|||||||
|
|
||||||
|
|
||||||
|
|
||||||
\section{References} The heading of the references section is
|
\section{References}
|
||||||
not be numbered and all reference items are in 8~pt font.
|
%The heading of the references section is
|
||||||
References are required to be in IEEE style. Please refer to the
|
%not be numbered and all reference items are in 8~pt font.
|
||||||
examples for journals~\cite{journal}, for
|
%References are required to be in IEEE style. Please refer to the
|
||||||
books~\cite{book1},~\cite{book2}, and for conference
|
%examples for journals~\cite{journal}, for
|
||||||
papers~\cite{conf1},~\cite{conf2}.
|
%books~\cite{book1},~\cite{book2}, and for conference
|
||||||
|
%papers~\cite{conf1},~\cite{conf2}.
|
||||||
|
|
||||||
% the following vfill coursely balances the columns on the last page
|
% the following vfill coarsely balances the columns on the last page
|
||||||
\vfill \pagebreak
|
\vfill \pagebreak
|
||||||
|
|
||||||
\section{Conclusions}
|
\section{Conclusions}
|
||||||
This template uses IEEE style and provides necessary information
|
%This template uses IEEE style and provides necessary information
|
||||||
to prepare papers for CEM'17 Workshop. Thank you for your
|
%to prepare papers for CEM'17 Workshop. Thank you for your
|
||||||
contributions.
|
%contributions.
|
||||||
|
|
||||||
|
|
||||||
\section*{Acknowledgment}
|
\section*{Acknowledgment}
|
||||||
Acknowledgments should be here.
|
%Acknowledgments should be here.
|
||||||
|
|
||||||
\bibliographystyle{IEEEtran}
|
\bibliographystyle{IEEEtran}
|
||||||
\begin{thebibliography}{99}
|
\begin{thebibliography}{99}
|
||||||
|
Reference in New Issue
Block a user