numpex · prudhomm · Oct 14, 2024 · Oct 11, 2024 · Oct 14, 2024
diff --git a/software/composyx/WP3/WP3.tex b/software/composyx/WP3/WP3.tex
@@ -57,6 +57,7 @@ \subsection{Software Overview}
 \rowcolor{white}    "singular value decomposition (SVD) and eigenvalue solver" & Provide randomized EVD and SVD partial decomposition \\
 \rowcolor{numpexlightergray}    direct solver & provide interface to MUMPS, PaStiX and qr\_mumps \\
 \rowcolor{white}    krylov solver & provide interface to Fabulous that implement various subspace methods and their block-counterpart \\
+        \bottomrule
 \end{tabular}
         }
     }
@@ -70,8 +71,8 @@ \subsection{Parallel Capabilities}
 
 
 \begin{itemize}
-    \item describe the parallel programming  environment : MPI+ threads and MPI+StarPU for heterogeneous manycores.
-    \item describe the parallel computation environment: distributed manycores
+    \item \textbf{Parallel Environment :} MPI+ threads and not fully assess MPI+StarPU for heterogeneous manycores.
+    \item \textbf{Computation environment :} Distributed manycores (GENCI platforms, BSC)
     %\item describe the parallel capabilities of the software
     \item \textbf{Scalability:} weak scalability on up-to $\approx$ 20~000 cores for the solution of a $\approx 10^9$ linear system. 
     \item \textbf{Integration with Other Systems:} No integration into other Exa-Ma software yet.
@@ -84,35 +85,30 @@ \subsection{Initial Performance Metrics}
 This section provides a summary of initial performance benchmarks performed in the context of WP3. It ensures reproducibility by detailing input/output datasets, benchmarking tools, and the results. All data should be publicly available, ideally with a DOI for future reference.
 
 \begin{itemize}
-    \item \textbf{Overall Performance:} Summarize the software's computational performance, energy efficiency, and scalability results across different architectures (e.g., CPU, GPU, hybrid systems).
-    \item \textbf{Input/Output Dataset:} we do not have I/O as we generate at runtime the local matrices used for the  benchmark
-    \item \textbf{open-data Access:} Indicate whether the datasets used for the benchmark are open access, and provide a DOI or a direct link for download. Where applicable, highlight any licensing constraints.
-    \item \textbf{Challenges:} Identify any significant bottlenecks or challenges observed during the benchmarking process, including data handling and computational performance.
+    \item \textbf{Overall Performance:} weak scalability on up-to $\approx$ 20~000 cores for the solution of a $\approx 10^9$ linear system. 
+    \item \textbf{Input/Output Dataset:} not applicable.
+    \item \textbf{open-data Access:} Benchmark on matrix generator distributed on the gitlab of the package.
+%    \item \textbf{Challenges:} Identify any significant bottlenecks or challenges observed during the benchmarking process, including data handling and computational performance.
     \item \textbf{Future Improvements:} perform more exhaustive experiments on heteroneous nodes, that is using the MPI+StarPU option.
 \end{itemize}
 
-\subsubsection{Benchmark \#1}
+\subsubsection{Benchmark \#1: heterogeneous diffusion }
 \begin{itemize}
-    \item \textbf{Description:} Briefly describe the benchmark case, including the problem size, target architecture (e.g., CPU, GPU), and the input data. Mention the specific goals of the benchmark (e.g., testing scalability, energy efficiency).
-    \item \textbf{Benchmarking Tools Used:} List the tools used for performance analysis, such as Extrae, Score-P, TAU, Vampir, or Nsight, and specify what metrics were measured (e.g., execution time, FLOPS, energy consumption).
-    \item \textbf{Input/Output Dataset Description:}
-        \begin{itemize}
-            \item \textbf{Input Data:} Describe the input dataset (size, format, data type) and provide a DOI or link to access it.
-            \item \textbf{Output Data:} Specify the structure of the results (e.g., memory usage, runtime logs) and how they can be accessed or replicated.
-            \item \textbf{Data Repository:} Indicate where the data is stored (e.g., Zenodo, institutional repository) and provide a DOI or URL for accessing the data.
-        \end{itemize}
-    \item \textbf{Results Summary:} Include a summary of key metrics (execution time, memory usage, FLOPS) and their comparison across architectures (e.g., CPU, GPU).
-    \item \textbf{Challenges Identified:} Describe any bottlenecks encountered (e.g., memory usage, parallelization inefficiencies) and how they impacted the benchmark.
+    \item \textbf{Description:} Solution of a 3D heterogenous diffusion équations in a cube to enable a parallel generation of the benchmark.
+    \item \textbf{Benchmarking Tools Used:} Metrics are memory consumption and elapsed time to solution.
+    \item \textbf{Input/Output Dataset Description:} internal processing of the output to perform 
+    \item \textbf{Results Summary:} Speedups
+    \item \textbf{Challenges Identified:} scalability at extreme scale.
 \end{itemize}
 
 \subsection{12-Month Roadmap}
 \label{sec:WP3:Composyx:roadmap}
 
 In this section, describe the roadmap for improving benchmarks and addressing the challenges identified. This should include:
 \begin{itemize}
-    \item \textbf{Data Improvements:} Plans for improving input/output data management, including making datasets more accessible and ensuring reproducibility through open-data initiatives.
+    \item \textbf{Data Improvements:} Use other matrix generator using some of the packages developped within Ex-Ma such as FreeFEM++ and/or Feel++.
     \item \textbf{Methodology Application:} Implementation of the benchmarking methodology proposed in this deliverable to streamline reproducibility and dataset management.
-    \item \textbf{Results Retention:} Plans to maintain benchmark results in a publicly accessible repository with appropriate metadata and documentation, ensuring long-term usability.
+    \item \textbf{Results Retention:} We will consider to publish  on the gitlab of the packages the performance results produced by the CI.
 \end{itemize}
 
 In~\cref{tab:WP3:Composyx:bottlenecks}, we briefly discuss the bottleneck roadmap associated to the software and relevant to the work package.
@@ -130,13 +126,13 @@ \subsection{12-Month Roadmap}
 
     \rowcolor{numpexgray}{\rule{0pt}{2.5ex}\color{white}\bf Bottlenecks} &  {\rule{0pt}{2.5ex}\color{white}\bf Short Description }\\ 
 
-\rowcolor{white}    B10 - Scientific Productivity & provide short description here \\
+\rowcolor{white}    B10 - Scientific Productivity & Guix-HPC \\
 \rowcolor{numpexlightergray}    B11 - Reproducibility and Replicability of Computation & Guix-HPC \\
 \rowcolor{white}    B6 - Data Management & not applicable \\
-\rowcolor{numpexlightergray}    B7 - Exascale Algorithms & Tune CPU and GPU features - Possibly add numerical resiliency \\
+\rowcolor{numpexlightergray}    B7 - Exascale Algorithms & Tune CPU and GPU features - Possibly add numerical resiliency eventhough we still believe that the resilincy should be addressed in an hollistic fashion as advocated in~\cite{agullo_resiliency_2022}. \\
 \end{tabular}
         }
     }
     \caption{WP3: Composyx plan with Respect to Relevant Bottlenecks}
     \label{tab:WP3:Composyx:bottlenecks}
-\end{table}
+\end{table}
diff --git a/software/composyx/composyx.tex b/software/composyx/composyx.tex
@@ -51,7 +51,7 @@ \subsection{Software summary}
 
 \subsection{Purpose}
 \label{sec:Composyx:purpose}
-Solution of large sparse linear systems using preconditioned subspace methods. For that purpose it relies on the Fabulous packages that implements various techniques including block variants for multiple right-hand sides~\cite{giraud_block_2022}
+Solution of large sparse linear systems using preconditioned subspace methods. For that purpose it relies on the Fabulous packages that implements various techniques including block variants for multiple right-hand sides~\cite{giraud_block_2022}.
 
 \subsection{Programming and Computational Environment}
 \label{sec::Composyx:environment_capabilities}
@@ -70,7 +70,7 @@ \subsection{Programming and Computational Environment}
         \rowcolor{numpexgray}{\rule{0pt}{2.5ex}\color{white}\bf Category}  & {\rule{0pt}{2.5ex}\color{white}\bf Details} & {\rule{0pt}{2.5ex}\color{white}\bf Description}\\
         \rowcolor{white}Languages  & \begin{tabular}{l}
 C\\
-C++\\
+C++20\\
 Fortran\\
 \end{tabular} & Programming languages and language standards supported by the software \\
         \rowcolor{numpexlightergray}Parallelism  & \begin{tabular}{l}