diff --git a/cs677/hw7/hw.tex b/cs677/hw7/hw.tex index b79e1e4..5416898 100644 --- a/cs677/hw7/hw.tex +++ b/cs677/hw7/hw.tex @@ -54,6 +54,23 @@ array. } +\vskip 2em +\item[3.]{ + My OpenMP solution to Floyd's algorithm was implemented by + using a \texttt{\#pragma omp parallel for} on the second \texttt{for} + loop of the algorithm. + Thus, for each $k$ value, the rows are broken up for different + threads to process. + The same thread computes an entire row of the matrix. + + The run times grow roughly cubically as $n$ grows linearly, as expected for a $\Theta(n^3)$ algorithm. + On eos24, with $n \geq 400$, the speedup was $\approx 3.6$. + + As the number of threads increased, the run time decreased + roughly in inverse proportion to the thread count until $t > 4$, where more threads did not gain + anything since there were only 4 processing cores. +} + \end{enumerate} \end{document}