├── .gitignore ├── .latexmkrc ├── ConfluenceProductDictionaryExample.png ├── Deliverables-Overview.tex ├── DependencyDashboard-EditPanel.png ├── Design.tex ├── E4S-AWS-public-image.png ├── E4S-Build-Cache-Binaries-2020.pdf ├── E4S-Build-Tree.png ├── E4S-Community-Policies-V1.png ├── E4S-GCP.png ├── E4S-Hierarchy-old.png ├── E4S-Hierarchy.pdf ├── E4S-Lifecycle-old.png ├── E4S-Lifecycle.pdf ├── E4S-Summary.png ├── ECP-ST-CAR-V30-FINAL.pdf ├── ECP-ST-CAR-V30-Submitted.pdf ├── ECP-ST-CAR.tex ├── ECP-ST-Leads.pdf ├── ECP-ST-Leads_orig.jpeg ├── ECP-ST-Leads_v2.jpeg ├── ECP-ST-Leads_v3.png ├── ECP-ST-Leads_v4.png ├── ECP20.png ├── ECP21.png ├── ECP22.pdf ├── ECPSTV1.jpeg ├── ECPSTV2.jpeg ├── ECPSTV3.png ├── ECP_ST_CAR_PUBLIC 20220818.pdf ├── IntegratedML.png ├── Introduction.tex ├── KPP-Definitions-old.png ├── KPP-Definitions.pdf ├── L3-Overview-old.png ├── L3-Overview.pdf ├── LICENSE ├── Makefile ├── PETSc-TAO-Dependencies.png ├── Planning-Process.png ├── ProductDictionary.tex ├── ProductDictionaryOverview.png ├── ProductDocumentationGitHub.png ├── ProductDocumentationGoals.png ├── ProductsOverview.jpeg ├── Project-Management.tex ├── Projects.tex ├── README.md ├── SDKs.pptx ├── ST-HI-Interplay.jpeg ├── STFY20WBS.png ├── STFY20WBS_v1.png ├── STFY22WBS.png ├── STFY22WBS.pptx ├── SoftwareStack.jpeg ├── Standards.tex ├── StandardsInvolvement.jpeg ├── abstract.tex ├── cover.pdf ├── ecp-small.png ├── ecp.png ├── ecpreport-publicv1.cls ├── ecpreportv2.cls ├── projects ├── 2.3.1-PMR │ ├── 2.3.1-PMR.bib │ ├── 2.3.1-PMR.tex │ ├── 2.3.1.01-PMR-SDKs │ │ ├── 2.3.1.01-PMR-SDKs.bib │ │ └── 2.3.1.01-PMR-SDKs.tex │ ├── 2.3.1.07-Exascale-MPI │ │ ├── 2.3.1.07-Exascale-MPI.bib │ │ ├── 2.3.1.07-Exascale-MPI.tex │ │ ├── MPICH-recent-milestones.pdf │ │ └── MS-figure-raw.pptx │ ├── 2.3.1.08-Legion │ │ ├── 2.3.1.08-Legion.bib │ │ └── 2.3.1.08-Legion.tex │ ├── 2.3.1.09-ParSEC │ │ ├── 2.3.1.09-ParSEC.bib │ │ ├── 2.3.1.09-ParSEC.tex │ │ ├── PaRSEC-diagram.png │ │ ├── cc_abcd.csv │ │ ├── cc_abcd.pdf 
│ │ ├── dpotrf-ttg │ │ │ ├── dpotrf_1403612-page3.pdf │ │ │ └── dpotrf_1403612.pdf │ │ ├── gemm_summit_mean.pdf │ │ ├── irr-bs-gemm-combined.pdf │ │ ├── irr-bs-gemm-v3-perf.dat │ │ ├── irr-bs-gemm-v3-time.dat │ │ ├── irr-bs-gemm.gnp │ │ ├── irr-bs-gemm.pdf │ │ ├── make.plt │ │ ├── project-1e-13.pdf │ │ ├── rwalk-10.pdf │ │ ├── scalapack_GEMM.pdf │ │ ├── scalapack_POTRF.pdf │ │ ├── scalapack_cpu_GEMM.pdf │ │ ├── scalapack_cpu_POTRF.pdf │ │ ├── scalapack_gpu_GEMM.pdf │ │ ├── scalapack_gpu_POTRF.pdf │ │ ├── slate_updated_nacl.pdf │ │ ├── spock-gemm-pbscal1.pdf │ │ ├── spock-mqpc-density1.pdf │ │ ├── spock-po-pbscal1.pdf │ │ └── spock-po-pbscal4.pdf │ ├── 2.3.1.14-UPCxx-GASNet │ │ ├── 2.3.1.14-GASNet-EX.bib │ │ ├── 2.3.1.14-GASNet-EX.tex │ │ ├── 2.3.1.14-UPCxx.bib │ │ ├── 2.3.1.14-UPCxx.tex │ │ ├── Summit-slide-BW.pdf │ │ ├── all-cori-haswell-out-inserts-wait.png │ │ ├── all-cori-knl-out-inserts-wait.png │ │ ├── latency_bars.pdf │ │ ├── paw21_interop_strong_scaling1.pdf │ │ ├── ss_Flan_1565_complex.pdf │ │ ├── ss_boneS10_comm.pdf │ │ └── upcxx-spock.pdf │ ├── 2.3.1.16-SICM │ │ ├── 2.3.1.16-SICM.bib │ │ ├── 2.3.1.16-SICM.tex │ │ ├── mike-excelent.pdf │ │ └── sicm-online-diagram.pdf │ ├── 2.3.1.17-OMPI-X │ │ ├── 2.3.1.17-OMPI-X.bib │ │ ├── 2.3.1.17-OMPI-X.tex │ │ ├── p2p-threading-performance.png │ │ ├── partitioned-comms-code.jpg │ │ ├── partitioned-communications-early-receive.png │ │ ├── partitioned-communications-partial-sends.png │ │ ├── reinit-performance.jpg │ │ ├── reinit.png │ │ ├── rma-threading-performance.png │ │ └── ult-performance.png │ ├── 2.3.1.18-RAJA-Kokkos │ │ ├── 2.3.1.18-RAJA-Kokkos.bib │ │ ├── 2.3.1.18-RAJA-Kokkos.tex │ │ └── ecp-small.png │ └── 2.3.1.19-Argo-PowerSteering │ │ ├── 2.3.1.19-Argo-PowerSteering.bib │ │ ├── 2.3.1.19-Argo-PowerSteering.tex │ │ ├── PowerStack_v2.png │ │ ├── aml-components.pdf │ │ ├── aml-xsbench.pdf │ │ ├── aml.tex │ │ ├── argo-global.pdf │ │ ├── argo-node.pdf │ │ ├── cpd.png │ │ ├── nrm-energy.png │ │ ├── nrm-loop.pdf │ 
│ ├── nrm-runtime.png │ │ ├── nrm.tex │ │ ├── power_model.png │ │ ├── powerstack.tex │ │ ├── sensors.jpg │ │ ├── umap-arch.pdf │ │ └── umap.tex ├── 2.3.2-Tools │ ├── 2.3.2-Tools.bib │ ├── 2.3.2-Tools.tex │ ├── 2.3.2.01-Tools-SDKs │ │ ├── 2.3.2.01-Tools-SDKs.bib │ │ └── 2.3.2.01-Tools-SDKs.tex │ ├── 2.3.2.06-EXA-PAPI │ │ ├── 2.3.2.06-EXA-PAPI.bib │ │ ├── 2.3.2.06-EXA-PAPI.tex │ │ ├── 2.3.2.06-EXA-PAPI_old.tex │ │ ├── Exa-PAPI_sde_magma.pdf │ │ ├── Exa-PAPI_sde_parsec.pdf │ │ ├── cat-DP-flops-arch-comparison-1.pdf │ │ └── papi_sde.pdf │ ├── 2.3.2.08-HPCToolkit │ │ ├── 2.3.2.08-HPCToolkit.bib │ │ ├── 2.3.2.08-HPCToolkit.tex │ │ ├── hpctoolkit-lammps-traces.pdf │ │ ├── hpctoolkit-many-threads.pdf │ │ ├── hpctoolkit-nyx-trace.pdf │ │ ├── hpctoolkit-pelec-profiles.pdf │ │ ├── hpctoolkit-qs.pdf │ │ ├── hpctoolkit-raja-perf.pdf │ │ └── hpctoolkit-vec-add-ompt.pdf │ ├── 2.3.2.10-PROTEAS-YTUNE │ │ ├── 2.3.2.10-Autotuning.bib │ │ ├── 2.3.2.10-Autotuning.tex │ │ ├── 2.3.2.10-Bricks.bib │ │ ├── 2.3.2.10-Bricks.tex │ │ ├── 2.3.2.10-CLACC.bib │ │ ├── 2.3.2.10-CLACC.tex │ │ ├── 2.3.2.10-FLACC-MLIR.tex │ │ ├── 2.3.2.10-LLVM-DOE.tex │ │ ├── 2.3.2.10-LLVM.bib │ │ ├── 2.3.2.10-LLVM.tex │ │ ├── 2.3.2.10-PAPYRUS.bib │ │ ├── 2.3.2.10-PAPYRUS.tex │ │ ├── 2.3.2.10-PROTEAS.bib │ │ ├── 2.3.2.10-PROTEAS.tex │ │ ├── 2.3.2.10-SYCL.bib │ │ ├── 2.3.2.10-SYCL.tex │ │ ├── 2.3.2.10-TAU.bib │ │ ├── 2.3.2.10-TAU.tex │ │ ├── Bricks-mpi-parts.pdf │ │ ├── YTune-searchtree.pdf │ │ ├── YTune-solution.jpg │ │ ├── YTune-solution.png │ │ ├── clacc.png │ │ ├── clacc_tau.png │ │ ├── miniFE_openmp_tau.png │ │ ├── papyrus-fig.jpg │ │ ├── papyrus-fig_orig.pdf │ │ ├── papyrus-meraculous-eval.pdf │ │ ├── papyrus-meraculous.pdf │ │ ├── tau-3d-candle.png │ │ ├── tau-3d.jpg │ │ ├── tau-3d_orig.pdf │ │ └── tau-papyruskv.png │ ├── 2.3.2.11-SOLLVE │ │ ├── 2.3.2.11-SOLLVE-ARGOBOTS.bib │ │ ├── 2.3.2.11-SOLLVE-ARGOBOTS.tex │ │ ├── 2.3.2.11-SOLLVE-BOLT.bib │ │ ├── 2.3.2.11-SOLLVE-BOLT.tex │ │ ├── 
2.3.2.11-SOLLVE-HeteroLoopSchedRTS.tex │ │ ├── 2.3.2.11-SOLLVE-LLVM.tex │ │ ├── 2.3.2.11-SOLLVE-LLVM_enhancement.bib │ │ ├── 2.3.2.11-SOLLVE-LLVM_enhancement.tex │ │ ├── 2.3.2.11-SOLLVE-VV.bib │ │ ├── 2.3.2.11-SOLLVE-VV.tex │ │ ├── 2.3.2.11-SOLLVE-training.tex │ │ ├── 2.3.2.11-SOLLVE.bib │ │ ├── 2.3.2.11-SOLLVE.tex │ │ ├── LLVM-Implementation-Figures │ │ │ ├── LLVM-opt-kernel-times.jpg │ │ │ ├── openmc.tex │ │ │ ├── t_1024.tex │ │ │ └── t_256.tex │ │ ├── LLVM-opt-kernel-times.jpg │ │ ├── SOLLVE-ARGOBOTS.pdf │ │ ├── SOLLVE-BOLT.pdf │ │ ├── SOLLVE-progress.pdf │ │ ├── mgpu-Spock.pdf │ │ ├── multi_gpu_spock.png │ │ ├── multi_gpu_spock2.png │ │ ├── one_gpu_spock.png │ │ ├── onegpu-Spock.pdf │ │ ├── sollve-figure-ecp-car-source-empty.pptx │ │ ├── text-for-sollve-progress-diagram.txt │ │ ├── tiling.pdf │ │ └── unroll.pdf │ └── 2.3.2.12-Flang │ │ ├── 2.3.2.12-Flang.bib │ │ ├── 2.3.2.12-Flang.tex │ │ └── flang-performance.png ├── 2.3.3-MathLibs │ ├── 2.3.3-MathLibs.bib │ ├── 2.3.3-MathLibs.tex │ ├── 2.3.3.01-xSDK │ │ ├── 2.3.3.01-xSDK.bib │ │ ├── 2.3.3.01-xSDK.tex │ │ ├── 2.3.3.01-xsdk-batchsprsla.tex │ │ ├── 2.3.3.01-xsdk-multiprecision.tex │ │ ├── xsdk-0.6.0.png │ │ ├── xsdk-examples-diagram.png │ │ └── xsdk-machinebalance.pdf │ ├── 2.3.3.06-PETSc-TAO │ │ ├── 2.3.3.06-PETSc-TAO.bib │ │ ├── 2.3.3.06-PETSc-TAO.tex │ │ ├── petsc_arch.png │ │ └── petsc_perf.pdf │ ├── 2.3.3.07-STRUMPACK-SuperLU │ │ ├── 2.3.3.07-STRUMPACK-SuperLU.bib │ │ ├── 2.3.3.07-STRUMPACK-SuperLU.tex │ │ ├── P3_V100.pdf │ │ ├── periodic-cube-scaling-strumpack.pdf │ │ ├── periodic-cube-scaling-strumpack_metis.pdf │ │ ├── speedup_SOA.jpg │ │ ├── strumpack-Summit.pdf │ │ ├── strumpack-scaling.jpg │ │ ├── strumpack-scaling.pdf │ │ ├── superlu-solve-Summit.pdf │ │ └── superlu-trisolve-scaling.pdf │ ├── 2.3.3.12-SUNDIALS-hypre │ │ ├── 2.3.3.12-SUNDIALS.bib │ │ ├── 2.3.3.12-SUNDIALS.tex │ │ ├── 2.3.3.12-hypre.bib │ │ ├── 2.3.3.12-hypre.tex │ │ ├── AMReX_CVODE_OpenMP_GPU-Streams-2.png │ │ ├── AMS-PCG.png │ │ ├── 
PeleC_fig.pdf │ │ ├── Spock-AMG-PCG.png │ │ ├── SpockResults-Dec2021.png │ │ ├── crusher-AMG-PCG.png │ │ ├── crusher-spock-1e7-Feb2022.png │ │ ├── hypre-mixed-int.png │ │ ├── hypre-rap-1gpu.png │ │ ├── manyvector_v2.pdf │ │ └── sunorg1.pdf │ ├── 2.3.3.13-CLOVER │ │ ├── 2.3.3.13-CLOVER.tex │ │ ├── 2.3.3.13-FFT-ECP.tex │ │ ├── 2.3.3.13-FFT.bib │ │ ├── 2.3.3.13-GINKGO.bib │ │ ├── 2.3.3.13-GINKGO.tex │ │ ├── 2.3.3.13-SLATE.bib │ │ ├── 2.3.3.13-SLATE.tex │ │ ├── SLATE-architecture.jpg │ │ ├── batchedFFT-Spock.pdf │ │ ├── ffttransormations.pdf │ │ ├── ginkgo_eas │ │ │ ├── bw_cg_solver.pdf │ │ │ ├── bw_csr_spmv.pdf │ │ │ ├── bw_ell_spmv.pdf │ │ │ └── bw_gmres_solver.pdf │ │ ├── ginkgo_portability_crop.png │ │ ├── heFFTeAcceleration.png │ │ ├── heFFTeScalability.png │ │ ├── heFFTeStrongScalability.pdf │ │ ├── heffte.png │ │ ├── heffte_conv_dst.pdf │ │ ├── runtime2.pdf │ │ ├── slate-he2hb-1node.pdf │ │ ├── slate-he2hb-4node.pdf │ │ ├── slate-spock-gemm.pdf │ │ └── slate-spock-trf.pdf │ ├── 2.3.3.14-ALExa-ForTrilinos │ │ ├── 2.3.3.14-ALExa.bib │ │ ├── 2.3.3.14-ALExa.tex │ │ ├── 2.3.3.14-ForTrilinos.bib │ │ ├── ForTrilinos_ioc.pdf │ │ ├── arborx_summit.png │ │ ├── dtk-gpu.png │ │ ├── dtk_exaam_pit.png │ │ ├── tasmanian-gpu.png │ │ └── tasmanian_exastar.png │ └── 2.3.3.15-Sake │ │ ├── 2.3.3.15-KokkosKernels.tex │ │ ├── 2.3.3.15-Sake.tex │ │ └── 2.3.3.15-Trilinos.tex ├── 2.3.4-DataViz │ ├── 2.3.4-DataViz.bib │ ├── 2.3.4-DataViz.tex │ ├── 2.3.4.01-DataViz-SDK │ │ ├── 2.3.4.01-DataViz-SDK.bib │ │ ├── 2.3.4.01-DataViz-SDK.tex │ │ ├── HDF5-Arch-small.png │ │ ├── HDF5-Arch.png │ │ └── VOL-improvements.png │ ├── 2.3.4.09-ADIOS │ │ ├── 2.3.4.09-ADIOS.bib │ │ ├── 2.3.4.09-ADIOS.tex │ │ └── ADIOS_in_ECP.png │ ├── 2.3.4.10-DataLib │ │ ├── 2.3.4.10-DataLib.tex │ │ └── pnetcdf-figure.pdf │ ├── 2.3.4.13-ECP-VTK-m │ │ ├── 2.3.4.13-ECP-VTK-m.bib │ │ ├── 2.3.4.13-ECP-VTK-m.tex │ │ ├── VTKm-Bubbles-Components.png │ │ ├── VTKm-Bubbles-Density.png │ │ ├── VTKm-Clip.png │ │ ├── VTKm-FTLE.png │ │ 
├── VTKm-Streamlines.png │ │ ├── VTKm-contour-cell-types.jpg │ │ ├── VTKm-extruded-cell-set.png │ │ ├── VTKm-flying-edges.png │ │ ├── VTKm-particle-density.png │ │ ├── VTKm-particle-spheres.png │ │ ├── VTKm-spock-timing.png │ │ ├── VTKm-warpx-flow.png │ │ ├── VTKm-warpx-in-situ.png │ │ ├── VTKm-wdm-in-situ.png │ │ └── snl-logos.png │ ├── 2.3.4.14-VeloC-SZ │ │ ├── 2.3.4.14-EZ.bib │ │ ├── 2.3.4.14-EZ.tex │ │ ├── 2.3.4.14-VeloC.bib │ │ ├── 2.3.4.14-VeloC.tex │ │ ├── 200718_workflow.pdf │ │ ├── SZ-Huffman.eps │ │ ├── Visual-quality-NYX-SZ.png │ │ ├── qmcpackbig-a.eps │ │ ├── sz-illu.png │ │ ├── time-based-comp-and-random.jpg │ │ ├── veloc-arch.png │ │ ├── veloc-hacc.eps │ │ ├── veloc-lqcd.eps │ │ └── xSDK-diagram.jpeg │ ├── 2.3.4.15-HDF5-UnifyCR │ │ ├── 2.3.4.15-ExaHDF5.tex │ │ ├── 2.3.4.15-UNIFYCR.bib │ │ ├── 2.3.4.15-UNIFYCR.tex │ │ ├── UnifyCR-overview.png │ │ ├── UnifyFS-overview.png │ │ ├── VOL-Overview.pdf │ │ ├── async_io_overview.pdf │ │ ├── milestone2.png │ │ └── usingUnifyFS.png │ ├── 2.3.4.16-ALPINE-ZFP │ │ ├── 2.3.4.16-ALPINE.bib │ │ ├── 2.3.4.16-ALPINE.tex │ │ ├── 2.3.4.16-ZFP.bib │ │ ├── 2.3.4.16-ZFP.tex │ │ ├── ZFP.png │ │ ├── alpine-cinema-mfixexa-workflow.png │ │ ├── alpine_infrastructure.png │ │ ├── alpine_nyxSamplingExample.png │ │ ├── alpine_topology.jpg │ │ ├── alpine_topology_orig.png │ │ ├── zfp-performance.pdf │ │ ├── zfp-sw4-hdf5.png │ │ └── zfp-sw4.png │ ├── DataViz-storage-notional-diagram.pdf │ ├── DataViz-storage-specs-current.pdf │ └── DataViz-storage-specs-next.pdf ├── 2.3.5-Ecosystem │ ├── 2.3.5-Ecosystem.bib │ ├── 2.3.5-Ecosystem.tex │ ├── 2.3.5.01-Ecosystem-SDK │ │ ├── 2.3.5.01-Ecosystem-SDK.bib │ │ ├── 2.3.5.01-Ecosystem-SDK.tex │ │ ├── E4S-policy-comment.png │ │ ├── E4S_Nalu_AWS.png │ │ ├── E4S_Pantheon.png │ │ ├── E4S_Pantheon_small.png │ │ ├── E4S_WDMApp.png │ │ ├── E4S_buildcache_Feb22.png │ │ ├── E4S_buildcache_Jun22.png │ │ ├── E4S_buildcache_Oct21.png │ │ ├── SDKdefinition1.png │ │ ├── SDKdefinition2.png │ │ ├── 
SDKdefinition3.png │ │ ├── SDKdefinitionV2.png │ │ ├── SDKfig.png │ │ └── SpackBuildCacheWDMapp.png │ ├── 2.3.5.09-SW-Packaging │ │ ├── 2.3.5.09-SW-Packaging.bib │ │ └── 2.3.5.09-SW-Packaging.tex │ └── 2.3.5.10-ExaWorks │ │ ├── 2.3.5.10-ExaWorks.bib │ │ ├── 2.3.5.10-ExaWorks.tex │ │ ├── exaworks-circle.png │ │ └── exaworks.png └── 2.3.6-NNSA │ ├── 2.3.6-NNSA.bib │ ├── 2.3.6-NNSA.tex │ ├── 2.3.6.01-LANL-ATDM │ ├── 2.3.6.01-LANL-ATDM-ST.bib │ ├── 2.3.6.01-LANL-ATDM-ST.tex │ ├── ECPReviewScreenshot.png │ ├── cinema-cis-stone-coolwarm.png │ ├── cinema-cis-stone-grayscale.png │ ├── cinema-cis-stone-water.png │ ├── cinema-cis-streamlines.png │ ├── cinema-jnc-nyx-volume.png │ ├── control-replication-performance.png │ ├── hxhim-main.png │ ├── mesh.pdf │ ├── pantheon-workflow.png │ └── tracing-performance.png │ ├── 2.3.6.02-LLNL-ATDM │ ├── 2.3.6.02-LLNL-ATDM-ST.bib │ ├── 2.3.6.02-LLNL-ATDM-ST.tex │ ├── HO-LO.pdf │ ├── New.pdf │ ├── Old.pdf │ ├── ROSE-raja.png │ ├── mfem-amr.jpg │ ├── mfem-gpu.pdf │ ├── mfem-hp-refinement.png │ ├── raja-umpire-chai-support.pdf │ ├── spack-pipelines.pdf │ └── xSDK-diagram.jpeg │ └── 2.3.6.03-SNL-ATDM │ ├── 2.3.6.03-SNL-ATDM-ST.bib │ ├── 2.3.6.03-SNL-ATDM-ST.tex │ └── kokkos-abstractions.jpg ├── references.bib ├── xSDK-Diagram.jpeg └── xSDK-Policies.jpeg /.gitignore: -------------------------------------------------------------------------------- 1 | ## Core latex/pdflatex auxiliary files: 2 | *.aux 3 | *.lof 4 | *.log 5 | *.lot 6 | *.fls 7 | *.out 8 | *.toc 9 | *.fmt 10 | *.fot 11 | *.cb 12 | *.cb2 13 | .*.lb 14 | 15 | ## Intermediate documents: 16 | *.dvi 17 | *.xdv 18 | *-converted-to.* 19 | # these rules might exclude image files for figures etc. 
20 | # *.ps 21 | # *.eps 22 | # *.pdf 23 | 24 | ## Generated if empty string is given at "Please type another file name for output:" 25 | .pdf 26 | 27 | ## Bibliography auxiliary files (bibtex/biblatex/biber): 28 | *.bbl 29 | *.bcf 30 | *.blg 31 | *-blx.aux 32 | *-blx.bib 33 | *.run.xml 34 | 35 | ## Build tool auxiliary files: 36 | *.fdb_latexmk 37 | *.synctex 38 | *.synctex(busy) 39 | *.synctex.gz 40 | *.synctex.gz(busy) 41 | *.pdfsync 42 | 43 | ## Auxiliary and intermediate files from other packages: 44 | # algorithms 45 | *.alg 46 | *.loa 47 | 48 | # achemso 49 | acs-*.bib 50 | 51 | # amsthm 52 | *.thm 53 | 54 | # beamer 55 | *.nav 56 | *.pre 57 | *.snm 58 | *.vrb 59 | 60 | # changes 61 | *.soc 62 | 63 | # cprotect 64 | *.cpt 65 | 66 | # elsarticle (documentclass of Elsevier journals) 67 | *.spl 68 | 69 | # endnotes 70 | *.ent 71 | 72 | # fixme 73 | *.lox 74 | 75 | # feynmf/feynmp 76 | *.mf 77 | *.mp 78 | *.t[1-9] 79 | *.t[1-9][0-9] 80 | *.tfm 81 | 82 | #(r)(e)ledmac/(r)(e)ledpar 83 | *.end 84 | *.?end 85 | *.[1-9] 86 | *.[1-9][0-9] 87 | *.[1-9][0-9][0-9] 88 | *.[1-9]R 89 | *.[1-9][0-9]R 90 | *.[1-9][0-9][0-9]R 91 | *.eledsec[1-9] 92 | *.eledsec[1-9]R 93 | *.eledsec[1-9][0-9] 94 | *.eledsec[1-9][0-9]R 95 | *.eledsec[1-9][0-9][0-9] 96 | *.eledsec[1-9][0-9][0-9]R 97 | 98 | # glossaries 99 | *.acn 100 | *.acr 101 | *.glg 102 | *.glo 103 | *.gls 104 | *.glsdefs 105 | 106 | # gnuplottex 107 | *-gnuplottex-* 108 | 109 | # gregoriotex 110 | *.gaux 111 | *.gtex 112 | 113 | # htlatex 114 | *.4ct 115 | *.4tc 116 | *.idv 117 | *.lg 118 | *.trc 119 | *.xref 120 | 121 | # hyperref 122 | *.brf 123 | 124 | # knitr 125 | *-concordance.tex 126 | # TODO Comment the next line if you want to keep your tikz graphics files 127 | *.tikz 128 | *-tikzDictionary 129 | 130 | # listings 131 | *.lol 132 | 133 | # makeidx 134 | *.idx 135 | *.ilg 136 | *.ind 137 | *.ist 138 | 139 | # minitoc 140 | *.maf 141 | *.mlf 142 | *.mlt 143 | *.mtc[0-9]* 144 | *.slf[0-9]* 145 | *.slt[0-9]* 146 | 
*.stc[0-9]* 147 | 148 | # minted 149 | _minted* 150 | *.pyg 151 | 152 | # morewrites 153 | *.mw 154 | 155 | # nomencl 156 | *.nlg 157 | *.nlo 158 | *.nls 159 | 160 | # pax 161 | *.pax 162 | 163 | # pdfpcnotes 164 | *.pdfpc 165 | 166 | # sagetex 167 | *.sagetex.sage 168 | *.sagetex.py 169 | *.sagetex.scmd 170 | 171 | # scrwfile 172 | *.wrt 173 | 174 | # sympy 175 | *.sout 176 | *.sympy 177 | sympy-plots-for-*.tex/ 178 | 179 | # pdfcomment 180 | *.upa 181 | *.upb 182 | 183 | # pythontex 184 | *.pytxcode 185 | pythontex-files-*/ 186 | 187 | # thmtools 188 | *.loe 189 | 190 | # TikZ & PGF 191 | *.dpth 192 | *.md5 193 | *.auxlock 194 | 195 | # todonotes 196 | *.tdo 197 | 198 | # easy-todo 199 | *.lod 200 | 201 | # xmpincl 202 | *.xmpi 203 | 204 | # xindy 205 | *.xdy 206 | 207 | # xypic precompiled matrices 208 | *.xyc 209 | 210 | # endfloat 211 | *.ttt 212 | *.fff 213 | 214 | # Latexian 215 | TSWLatexianTemp* 216 | 217 | ## Editors: 218 | # WinEdt 219 | *.bak 220 | *.sav 221 | 222 | # Texpad 223 | .texpadtmp 224 | 225 | # Kile 226 | *.backup 227 | 228 | # KBibTeX 229 | *~[0-9]* 230 | 231 | # auto folder when using emacs and auctex 232 | ./auto/* 233 | *.el 234 | 235 | # expex forward references with \gathertags 236 | *-tags.tex 237 | 238 | # standalone packages 239 | *.sta 240 | 241 | # generated if using elsarticle.cls 242 | *.spl 243 | .DS_Store 244 | ECP-ST-CAR.pdf 245 | ECP-ST-CAR.pdf 246 | 247 | # generated file from main Makefile 248 | ECP-ST-CAR.aux.make 249 | ECP-ST-CAR.auxbbl.make 250 | ECP-ST-CAR.auxtarget.make 251 | ECP-ST-CAR.d 252 | ECP-ST-CAR.lof.make 253 | ECP-ST-CAR.lot.make 254 | ECP-ST-CAR.out.make 255 | ECP-ST-CAR.toc.make 256 | ECP-ST-CAR.aux.make 257 | ECP-ST-CAR.auxbbl.make.temp 258 | -------------------------------------------------------------------------------- /.latexmkrc: -------------------------------------------------------------------------------- 1 | add_cus_dep('glo', 'gls', 0, 'makeglo2gls'); 2 | sub makeglo2gls { 3 | system("makeindex 
-s '$_[0]'.ist -t '$_[0]'.glg -o '$_[0]'.gls '$_[0]'.glo"); 4 | } 5 | 6 | add_cus_dep('acn', 'acr', 0, 'makeacn2acr'); 7 | sub makeacn2acr { 8 | system("makeindex -s '$_[0]'.ist -t '$_[0]'.alg -o '$_[0]'.acr '$_[0]'.acn"); 9 | } 10 | 11 | @default_files = ('ECP-ST-CAR.tex'); 12 | 13 | $pdflatex = 'pdflatex %O --shell-escape %S'; 14 | 15 | $clean_ext = "cut glsdefs cut ist xml run.xml ucf ist acn acr alg bbl glo snm nav vrb listing lol"; 16 | -------------------------------------------------------------------------------- /ConfluenceProductDictionaryExample.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ConfluenceProductDictionaryExample.png -------------------------------------------------------------------------------- /Deliverables-Overview.tex: -------------------------------------------------------------------------------- 1 | \begin{wrapfigure}{r}{0.5\textwidth} 2 | \begin{mdframed} 3 | \large{ECP ST contributes to the HPC software ecosystem through direct product development, contributions to industry and de facto standards, and shaping the requirements, design, and prototyping of products delivered by vendors and other third parties.} 4 | \end{mdframed} 5 | \end{wrapfigure} 6 | ECP ST efforts contribute to the HPC software ecosystem in a variety of ways. The most tangible way is through contributions to software products, many of which are already widely deployed and being transformed for use with exascale systems. ECP ST also contributes to industry and de facto standards efforts. Finally, some ECP ST efforts contribute to the upstream processes of requirements, analysis, design, and prototyping that inform the implementation of vendor and other third-party software products. 
Although they do not receive the most attention, these upstream efforts are highly impactful and low cost because there is no product to support. 7 | 8 | %\begin{figure}[htb] 9 | % \begin{center} 10 | % \includegraphics[width=0.7\textwidth]{ProductsOverview} 11 | % 12 | % \caption{\label{fig:productsoverview}{\small{The 33 ECP ST Projects contribute to 70 user-facing software product suites. ECP ST products are delivered to users via many mechanisms. Provides experience we can leverage across projects. Building via Spack is required for participating in ECP ST releases: 50 of the 70 ST product suites are available in the Extreme-scale Scientific Software Stack (E4S) V1.0, released in November 2019.}}} 13 | % \end{center} 14 | %\end{figure} 15 | -------------------------------------------------------------------------------- /DependencyDashboard-EditPanel.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/DependencyDashboard-EditPanel.png -------------------------------------------------------------------------------- /Design.tex: -------------------------------------------------------------------------------- 1 | \subsection{Contributions to External Software Products}\label{subsection:external-contributions} 2 | Although many ECP ST efforts focus on the products that they will develop and support, some of the important work---and certainly some of the most sustainable and highly leveraged work---is done by providing requirements, analysis, design, and prototype capabilities to vendor and other third-party software. Many software studies have shown that 70\%--80\% of the cost of a successful software product goes into post-delivery maintenance. The effort summarized in Table~\ref{table:externalproducts} expressly eliminates this large cost for DOE because the product is developed and supported outside DOE. 
3 | 4 | 5 | \begin{table} 6 | %\begin{tabular}{|L{1.5in}|L{4in}|}\hline 7 | \begin{tabularx}{\textwidth}{|l|X|}\hline 8 | \rowcolor{LightCyan} 9 | \textbf{Product} & \textbf{Contribution}\\\hline 10 | Kokkos and RAJA & ECP efforts to provide portable on-node parallel programming and execution environments have led to new features in C++ standards. \\\hline 11 | MPI Forum & ECP ST staff maintain several chapters of the MPI Forum, an effort that requires constant involvement with the other authors, as well as participation in the online discussions related to the chapter and regular attendance of the MPI Forum's face-to-face activities.\\\hline 12 | Flang & ECP funds the development of the new open-source Fortran compiler front end called Flang. Flang provides Fortran language support for LLVM back ends in a way similar to how Clang provides support for C and C++.\\\hline 13 | All \tools\ work & Starting in FY20, the \tools\ efforts are organized around delivering capabilities into the LLVM ecosystem. \\\hline 14 | SWIG & The ECP ST ForTrilinos efforts contribute the capability to generate automatic Fortran bindings from C++ code.\\\hline 15 | TotalView debugger & ECP ST staff, along with RogueWave engineers, are engaged in the co-design of OMPD, the new debugging interface for OpenMP programs. 
This effort helps RogueWave improve its main debugging product, TotalView, by making it aware of and compatible with recent advances in OpenMP debugging.\\\hline 16 | LLVM & An ECP ST staff member is co-leading design discussions around the parallel intermediate representation (IR) and loop-optimization infrastructure.\\\hline 17 | SLATE & ECP ST Mathematical Library efforts inform the design, implementation, and optimization of dense numerical linear algebra routines on most vendor platforms.\\\hline 18 | Cray MPICH MPI-IO & As part of the ExaHDF5 ECP project, the ALCF worked with Cray MPI-IO developers to merge the upstream ROMIO code into the downstream proprietary Cray MPICH MPI-IO, leveraging Cray’s extensive suite of I/O performance tests and further tuning the algorithm. Cray is currently targeting its deployment in an experimental release.\\\hline 19 | OpenHPC & An ECP ST staff member serves on the OpenHPC Technical Steering Committee as a component development representative.\\\hline 20 | \end{tabularx} 21 | \centering 22 | \caption{\label{table:externalproducts} External products to which ECP ST activities contribute. 
Participation in requirements, analysis, design, and prototyping activities for third-party products is some of the most effective software work that can be done.} 23 | \end{table} 24 | -------------------------------------------------------------------------------- /E4S-AWS-public-image.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/E4S-AWS-public-image.png -------------------------------------------------------------------------------- /E4S-Build-Cache-Binaries-2020.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/E4S-Build-Cache-Binaries-2020.pdf -------------------------------------------------------------------------------- /E4S-Build-Tree.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/E4S-Build-Tree.png -------------------------------------------------------------------------------- /E4S-Community-Policies-V1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/E4S-Community-Policies-V1.png -------------------------------------------------------------------------------- /E4S-GCP.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/E4S-GCP.png -------------------------------------------------------------------------------- /E4S-Hierarchy-old.png: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/E4S-Hierarchy-old.png -------------------------------------------------------------------------------- /E4S-Hierarchy.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/E4S-Hierarchy.pdf -------------------------------------------------------------------------------- /E4S-Lifecycle-old.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/E4S-Lifecycle-old.png -------------------------------------------------------------------------------- /E4S-Lifecycle.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/E4S-Lifecycle.pdf -------------------------------------------------------------------------------- /E4S-Summary.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/E4S-Summary.png -------------------------------------------------------------------------------- /ECP-ST-CAR-V30-FINAL.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ECP-ST-CAR-V30-FINAL.pdf -------------------------------------------------------------------------------- /ECP-ST-CAR-V30-Submitted.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ECP-ST-CAR-V30-Submitted.pdf 
-------------------------------------------------------------------------------- /ECP-ST-Leads.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ECP-ST-Leads.pdf -------------------------------------------------------------------------------- /ECP-ST-Leads_orig.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ECP-ST-Leads_orig.jpeg -------------------------------------------------------------------------------- /ECP-ST-Leads_v2.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ECP-ST-Leads_v2.jpeg -------------------------------------------------------------------------------- /ECP-ST-Leads_v3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ECP-ST-Leads_v3.png -------------------------------------------------------------------------------- /ECP-ST-Leads_v4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ECP-ST-Leads_v4.png -------------------------------------------------------------------------------- /ECP20.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ECP20.png -------------------------------------------------------------------------------- /ECP21.png: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ECP21.png -------------------------------------------------------------------------------- /ECP22.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ECP22.pdf -------------------------------------------------------------------------------- /ECPSTV1.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ECPSTV1.jpeg -------------------------------------------------------------------------------- /ECPSTV2.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ECPSTV2.jpeg -------------------------------------------------------------------------------- /ECPSTV3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ECPSTV3.png -------------------------------------------------------------------------------- /ECP_ST_CAR_PUBLIC 20220818.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ECP_ST_CAR_PUBLIC 20220818.pdf -------------------------------------------------------------------------------- /IntegratedML.png: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/IntegratedML.png -------------------------------------------------------------------------------- /KPP-Definitions-old.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/KPP-Definitions-old.png -------------------------------------------------------------------------------- /KPP-Definitions.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/KPP-Definitions.pdf -------------------------------------------------------------------------------- /L3-Overview-old.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/L3-Overview-old.png -------------------------------------------------------------------------------- /L3-Overview.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/L3-Overview.pdf -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | BSD 2-Clause License 2 | 3 | Copyright (c) 2018, E4S-Project 4 | All rights reserved. 5 | 6 | Redistribution and use in source and binary forms, with or without 7 | modification, are permitted provided that the following conditions are met: 8 | 9 | * Redistributions of source code must retain the above copyright notice, this 10 | list of conditions and the following disclaimer. 
11 | 12 | * Redistributions in binary form must reproduce the above copyright notice, 13 | this list of conditions and the following disclaimer in the documentation 14 | and/or other materials provided with the distribution. 15 | 16 | THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" 17 | AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 18 | IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE 19 | DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE 20 | FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 21 | DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR 22 | SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER 23 | CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, 24 | OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 25 | OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 26 | -------------------------------------------------------------------------------- /PETSc-TAO-Dependencies.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/PETSc-TAO-Dependencies.png -------------------------------------------------------------------------------- /Planning-Process.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/Planning-Process.png -------------------------------------------------------------------------------- /ProductDictionary.tex: -------------------------------------------------------------------------------- 1 | %ECP ST Product Dictionary 2 | %Note: This page is still under construction. 
3 | % 4 | %The ECP Software Technology (ST) Product Dictionary is the official list of publicly recognized 5 | %names to which ECP ST efforts contribute. While ST teams use an expanded product 6 | %namespace, the list on this page indicates the eventual access point for ST product development 7 | %efforts. 8 | % 9 | %This table lists only those products that are typically recognizable to users. Examples: 10 | %1. MPI is commonly known by users. MPICH and Open MPI both provide implementations 11 | %of that product. 12 | %2. Fortran is a product. Flang is a particular Fortran product. LLVM is a backend for some 13 | %Fortran compilers. 14 | %3. FFT is a product. FFTX, FFT-ECP provide FFT capabilities through interchangeable 15 | %interfaces. 16 | %4. C++ is a product. Clacc provides capabilities for Clang, as does LLVM. 17 | % 18 | %Product 19 | %Dictionary 20 | %List 21 | %ST products that deliver capabilities through public products 22 | %(comma separated list) 23 | % 24 | %ADIOS 25 | % 26 | %AML 27 | % 28 | %ALPINE: Ascent, ParaView, Catalyst, VisIt, LibSim, In Situ Algorithms 29 | % 30 | %BLAS 31 | % 32 | %SLATE 33 | % 34 | %C 35 | % 36 | %LLVM 37 | % 38 | %C++ 39 | % 40 | %LLVM 41 | % 42 | %Caliper 43 | % 44 | %Catalyst 45 | % 46 | %CHAI 47 | % 48 | %Cinema 49 | % 50 | %CUDA 51 | % 52 | %Darshan 53 | % 54 | %DTK 55 | % 56 | %Dyninst 57 | % 58 | %E4S 59 | % 60 | %FFT 61 | %FFTX, FFT\_ECP 62 | %FleCSI 63 | % 64 | %Flux 65 | % 66 | %Fortran 67 | %LLVM/Flang 68 | %GASNet 69 | % 70 | %Ginkgo 71 | % 72 | %HDF5 73 | % 74 | %HPCToolkit 75 | % 76 | %hypre 77 | % 78 | %Kokkos 79 | % 80 | %KokkosKernels 81 | % 82 | %LAPACK 83 | % 84 | %Legion 85 | % 86 | %libEnsemble 87 | % 88 | %MarFS 89 | % 90 | %MFEM 91 | % 92 | %MPI 93 | %MPICH, Open MPI 94 | %OpenACC 95 | %Clacc/LLVM 96 | %OpenCL 97 | %- 98 | %OpenMP 99 | %SOLLVE/LLVM 100 | %PAPI 101 | % 102 | %Papyrus 103 | % 104 | %ParaView 105 | % 106 | %PaRSEC 107 | % 108 | %PETSc/TAO 109 | % 110 | %PnetCDF 111 | % 112 | 
%PowerStack 113 | % 114 | %RAJA 115 | % 116 | %MPI-IO 117 | %ROMIO 118 | %ScaLAPACK 119 | %SLATE 120 | %SCR 121 | % 122 | %SICM 123 | % 124 | %Spack 125 | % 126 | %SPOT 127 | % 128 | %STRUMPACK 129 | % 130 | %SUNDIALS 131 | % 132 | %SuperLU 133 | % 134 | %SYCL 135 | % 136 | %SZ 137 | % 138 | %TASMANIAN 139 | % 140 | %TAU 141 | % 142 | %Trilinos 143 | % 144 | %UMap 145 | % 146 | %Umpire 147 | % 148 | %Unify 149 | % 150 | %UPC++ 151 | % 152 | %VeloC 153 | % 154 | %VisIt 155 | % 156 | %VTK-m 157 | % 158 | %xSDK 159 | % 160 | %ZFP 161 | % 162 | % 163 | -------------------------------------------------------------------------------- /ProductDictionaryOverview.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ProductDictionaryOverview.png -------------------------------------------------------------------------------- /ProductDocumentationGitHub.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ProductDocumentationGitHub.png -------------------------------------------------------------------------------- /ProductDocumentationGoals.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ProductDocumentationGoals.png -------------------------------------------------------------------------------- /ProductsOverview.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ProductsOverview.jpeg -------------------------------------------------------------------------------- /README.md: 
-------------------------------------------------------------------------------- 1 | # ECP-ST-CAR-PUBLIC 2 | The Exascale Computing Project Software Technologies Capability Assessment Report - Public Version 3 | -------------------------------------------------------------------------------- /SDKs.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/SDKs.pptx -------------------------------------------------------------------------------- /ST-HI-Interplay.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ST-HI-Interplay.jpeg -------------------------------------------------------------------------------- /STFY20WBS.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/STFY20WBS.png -------------------------------------------------------------------------------- /STFY20WBS_v1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/STFY20WBS_v1.png -------------------------------------------------------------------------------- /STFY22WBS.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/STFY22WBS.png -------------------------------------------------------------------------------- /STFY22WBS.pptx: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/STFY22WBS.pptx -------------------------------------------------------------------------------- /SoftwareStack.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/SoftwareStack.jpeg -------------------------------------------------------------------------------- /Standards.tex: -------------------------------------------------------------------------------- 1 | %\newpage 2 | \subsection{Standards Committees} 3 | Participating in standards efforts is an important activity for ECP ST staff. In many instances, the software will not be sustainable if it is not tightly connected to a standard. Additionally, any standard must account for the emerging requirements that exascale platforms need to meet to achieve performance and portability. Table~\ref{table:standards} summarizes ECP ST staff involvement in the major standards efforts that impact the ECP. 4 | 5 | ECP ST staff are heavily involved in the MPI and OpenMP standards efforts and hold several key leadership positions within the standardizing bodies. ECP ST staff also play a critical role in C++ standards efforts. Although DOE staff have only recently engaged in C++ standards, ECP ST staff efforts are essential for ensuring that HPC requirements are considered, especially by contributing working code that demonstrates requirements and design. The ECP ST sponsors the newest open-source Fortran compiler, Flang (Section~\ref{subsubsect:flang}), as a front end for LLVM. This compiler is rapidly emerging as an essential part of the HPC ecosystem. In particular, although ARM processors are not explicitly part of the pre-exascale ecosystem, they are emerging as strong contenders for future systems. Flang is \textit{the} Fortran compiler for ARM-based systems. 
ECP ST involvement in other committees provides valuable leverage and improved uniformity for HPC software. 6 | %Lastly, the Visualization Toolkit (VTK) Architecture Review Board (ARB) [...]\todo{Please complete this sentence.}. Although this is only one instance, the team intends to explore the ARB model as part of its SDK efforts. 7 | 8 | \iffalse % Converted to editable table below. –STC 9 | \begin{figure}[htb] 10 | \begin{center} 11 | \includegraphics[width=0.5\textwidth]{StandardsInvolvement} 12 | 13 | \caption{\label{fig:standards} ECP ST staff are involved in a variety of official and de facto standards committees. Involvement in standards efforts is essential for ensuring the sustainability of ECP ST products and ensuring that emerging exascale requirements are addressed by these standards.} 14 | \end{center} 15 | \todo[inline]{Please convert this figure into a table.} 16 | \end{figure} 17 | \fi 18 | 19 | \begin{table}[h!] 20 | \centering 21 | \begin{tabular}{|l|l|} 22 | \hline 23 | \rowcolor{LightCyan} 24 | \textbf{Standards effort} & \textbf{ECP ST participants} \\ \hline 25 | MPI Forum & 15 \\ \hline 26 | OpenMP & 15 \\ \hline 27 | BLAS & 6 \\ \hline 28 | C++ & 4 \\ \hline 29 | Fortran & 4 \\ \hline 30 | OpenACC & 3 \\ \hline 31 | LLVM & 2 \\ \hline 32 | PowerAPI & 1 \\ \hline 33 | VTK ARB & 1 \\ \hline 34 | \end{tabular} 35 | \caption{\label{table:standards} ECP ST staff are involved in a variety of official and de facto standards committees. 
Involvement in standards efforts is essential for ensuring the sustainability of ECP ST products and ensuring that emerging exascale requirements are addressed by these standards.} 36 | \end{table} -------------------------------------------------------------------------------- /StandardsInvolvement.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/StandardsInvolvement.jpeg -------------------------------------------------------------------------------- /cover.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/cover.pdf -------------------------------------------------------------------------------- /ecp-small.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ecp-small.png -------------------------------------------------------------------------------- /ecp.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/ecp.png -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1-PMR.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 2 | -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.01-PMR-SDKs/2.3.1.01-PMR-SDKs.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 
2 | -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.01-PMR-SDKs/2.3.1.01-PMR-SDKs.tex: -------------------------------------------------------------------------------- 1 | 2 | \subsubsection{\stid{1.01} \pmr\ Software Development Kits} 3 | 4 | \paragraph{Overview} 5 | The \pmr\ SDK effort is focused on identifying meaningful aggregations of products in this technical area. SDK efforts are in the early stages of planning and execution. Most of the work on SDKs has been driven from the \ecosystem\ technical area. A description of the SDK effort can be found in Section~\ref{subsubsect:ecosystem-sdk}. 6 | -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.07-Exascale-MPI/MPICH-recent-milestones.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.07-Exascale-MPI/MPICH-recent-milestones.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.07-Exascale-MPI/MS-figure-raw.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.07-Exascale-MPI/MS-figure-raw.pptx -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.08-Legion/2.3.1.08-Legion.bib: -------------------------------------------------------------------------------- 1 | @incollection{2.3.1.08:Treichler:2017, 2 | booktitle={Exascale Scientific Applications: Scalability and Performance Portability}, 3 | editor={Straatsma, T.P. and Antypas, K.B. 
and Williams, T.J.}, 4 | title = "{S3D-Legion: An Exascale Software for Direct Numerical Simulation of Turbulent Combustion with Complex Multicomponent Chemistry}", 5 | author={Treichler, Sean and Bauer, Michael A. and Bhagatwala, Ankit V. and Borghesi, Giulio and Sankaran, Ramanan and Kolla, Hemanth and Larkin, Jeffrey M. and Slaughter, Elliott and Lee, Wonchan and Aiken, Alex and Chen, Jacqueline H. and McCormick, Patrick S.}, 6 | isbn={9781351999236}, 7 | series={Chapman \& Hall/CRC Computational Science}, 8 | url={https://books.google.com/books?id=rGQ-DwAAQBAJ}, 9 | month={11}, 10 | year={2017}, 11 | publisher={CRC Press} 12 | } 13 | 14 | 15 | @article{2.3.1.08:Jia:2018:1, 16 | author = {Zhihao Jia and 17 | Sina Lin and 18 | Charles R. Qi and 19 | Alex Aiken}, 20 | title = {Exploring Hidden Dimensions in Parallelizing Convolutional Neural 21 | Networks}, 22 | journal = {CoRR}, 23 | volume = {abs/1802.04924}, 24 | year = {2018}, 25 | url = {http://arxiv.org/abs/1802.04924}, 26 | archivePrefix = {arXiv}, 27 | eprint = {1802.04924}, 28 | timestamp = {Mon, 13 Aug 2018 16:48:55 +0200}, 29 | biburl = {https://dblp.org/rec/bib/journals/corr/abs-1802-04924}, 30 | bibsource = {dblp computer science bibliography, https://dblp.org} 31 | } 32 | 33 | @article{2.3.1.08:Jia:2018:2, 34 | author = {Zhihao Jia and 35 | Matei Zaharia and 36 | Alex Aiken}, 37 | title = {Beyond Data and Model Parallelism for Deep Neural Networks}, 38 | journal = {CoRR}, 39 | volume = {abs/1807.05358}, 40 | year = {2018}, 41 | url = {http://arxiv.org/abs/1807.05358}, 42 | archivePrefix = {arXiv}, 43 | eprint = {1807.05358}, 44 | timestamp = {Mon, 13 Aug 2018 16:47:43 +0200}, 45 | biburl = {https://dblp.org/rec/bib/journals/corr/abs-1807-05358}, 46 | bibsource = {dblp computer science bibliography, https://dblp.org} 47 | } 48 | 49 | 50 | @inproceedings{2.3.1.08:Lee:2018:1, 51 | author = {Lee, Wonchan and Slaughter, Elliott and Bauer, Michael and Treichler, Sean and Warszawski, Todd and Garland, 
Michael and Aiken, Alex}, 52 | title = {Dynamic Tracing: Memoization of Task Graphs for Dynamic Task-based Runtimes}, 53 | booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage, and Analysis}, 54 | series = {SC '18}, 55 | year = {2018}, 56 | location = {Dallas, Texas}, 57 | pages = {34:1--34:13}, 58 | articleno = {34}, 59 | numpages = {13}, 60 | url = {http://dl.acm.org/citation.cfm?id=3291656.3291702}, 61 | acmid = {3291702}, 62 | publisher = {IEEE Press}, 63 | address = {Piscataway, NJ, USA}, 64 | } 65 | 66 | @inproceedings{2.3.1.08:Lee:2018:2, 67 | author = {Lee, Wonchan and Stelle, George and McCormick, Patrick and Aiken, Alex}, 68 | title = {Correctness of Dynamic Dependence Analysis for Implicitly Parallel Tasking Systems}, 69 | booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage, and Analysis}, 70 | year = {2018}, 71 | location = {Dallas, Texas}, 72 | } 73 | 74 | @inproceedings{2.3.1.08:2018:2, 75 | author = {Lee, Wonchan and Slaughter, Elliott and Bauer, Michael and Treichler, Sean and Warszawski, Todd and Garland, Michael and Aiken, Alex}, 76 | title = {Dynamic Tracing: Memoization of Task Graphs for Dynamic Task-based Runtimes}, 77 | booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage, and Analysis}, 78 | series = {SC '18}, 79 | year = {2018}, 80 | location = {Dallas, Texas}, 81 | pages = {34:1--34:13}, 82 | articleno = {34}, 83 | numpages = {13}, 84 | url = {https://doi.org/10.1109/SC.2018.00037}, 85 | doi = {10.1109/SC.2018.00037}, 86 | acmid = {3291702}, 87 | publisher = {IEEE Press}, 88 | address = {Piscataway, NJ, USA}, 89 | } 90 | 91 | @inproceedings{2.3.1.08:Bauer:2019, 92 | author = {Bauer, Michael and Garland, Michael}, 93 | title = {Legate NumPy: Accelerated and Distributed Array Computing}, 94 | booktitle = {Proceedings of the International Conference for High Performance 
Computing, Networking, Storage, and Analysis}, 95 | series = {SC '19}, 96 | year = {2019}, 97 | location = {Denver, Colorado}, 98 | pages = {to appear}, 99 | } 100 | 101 | @inproceedings{2.3.1.08:Slaughter:2019, 102 | author = {Slaughter, Elliott and Aiken, Alex}, 103 | title = {Pygion: Flexible, Scalable Task-Based Parallelism with Python}, 104 | booktitle = {Proceedings of Parallel Applications Workshop, Alternatives To MPI+X, co-located with SC19}, 105 | year = {2019}, 106 | location = {Denver, Colorado}, 107 | pages = {to appear}, 108 | } 109 | -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/PaRSEC-diagram.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.09-ParSEC/PaRSEC-diagram.png -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/cc_abcd.csv: -------------------------------------------------------------------------------- 1 | TA,1,1,1233.3759999999997,1221.24,1241.47,0,0.0,0.0 2 | TA,2,1,2646.7619999999997,2593.79,2685.63,0,0.0,0.0 3 | TA,4,1,4345.42,4234.15,4411.99,0,0.0,0.0 4 | TA,8,1,7412.014,7158.11,7611.38,0,0.0,0.0 5 | TA,12,1,8429.651999999998,8175.36,8673.07,0,0.0,0.0 6 | TA,2,2,2047.36,2007.3,2100.53,0,0.0,0.0 7 | TA,4,2,2711.16,2640.64,2779.94,0,0.0,0.0 8 | TA,8,2,4719.182000000001,4541.62,4821.58,0,0.0,0.0 9 | TA,16,2,3845.952,3774.56,3917.57,0,0.0,0.0 10 | TA,24,2,5503.638,5344.23,5597.07,0,0.0,0.0 11 | TA,32,2,7099.204000000001,6862.75,7282.15,0,0.0,0.0 12 | TESSE,1,1,1120.7220000000002,1038.75,1187.79,81897,15.779276122191316,0.06196679275877985 13 | TESSE,2,1,2437.446,2235.38,2704.85,81108,14.172339376245242,0.1526869587517014 14 | TESSE,4,1,4628.136,4089.01,5290.63,80869,12.713800770130605,0.25028482961416804 15 | 
TESSE,8,1,8657.706,7898.35,9416.57,79770,11.459371596481901,0.5078254590675239 16 | TESSE,12,1,11055.526000000002,9145.43,13008.0,78390,10.529784209371506,0.7732891104568393 17 | TESSE,1,2,2312.8900000000003,2216.56,2447.97,82094,15.138034501828388,0.06184349198847178 18 | TESSE,2,2,4450.125999999999,3864.99,4997.92,81720,13.417708076358295,0.124128046989721 19 | TESSE,4,2,8812.416000000001,8307.8,9404.74,81558,12.302669681260637,0.24847055130776816 20 | TESSE,8,2,17992.84,16532.5,19960.2,81119,11.214395337255116,0.5004395485184838 21 | TESSE,12,2,22185.98,20169.0,24272.1,80552,10.152666600456847,0.7562284238752607 22 | TESSE,16,2,31307.18,25055.2,35160.6,80182,9.343300790701154,1.0147027512409268 23 | -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/cc_abcd.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.09-ParSEC/cc_abcd.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/dpotrf-ttg/dpotrf_1403612-page3.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.09-ParSEC/dpotrf-ttg/dpotrf_1403612-page3.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/dpotrf-ttg/dpotrf_1403612.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.09-ParSEC/dpotrf-ttg/dpotrf_1403612.pdf -------------------------------------------------------------------------------- 
/projects/2.3.1-PMR/2.3.1.09-ParSEC/gemm_summit_mean.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.09-ParSEC/gemm_summit_mean.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/irr-bs-gemm-combined.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.09-ParSEC/irr-bs-gemm-combined.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/irr-bs-gemm-v3-perf.dat: -------------------------------------------------------------------------------- 1 | #idx #GPU Q1 min max Q3 mean 2 | 0 3 6593.591064 6160.775014 6668.766522999999 6648.931156000001 6542.404519199999 3 | 1 6 13977.942531 13146.413468 14400.792501 14287.584641999998 13969.4503468 4 | 2 12 24015.339227 21344.207861000003 25781.74653 24362.528406 23923.2605732 5 | 3 18 31723.674946 27767.193644 35250.169176999996 34073.961368000004 32424.403011 6 | 4 36 42077.074176 38584.350905 44563.975431 44229.849956 42334.377379 7 | 5 72 62836.046211 56317.655684000005 67785.67101399999 67058.029482 63867.14778819999 8 | 6 108 80256.611765 74689.59581900001 86479.212423 85677.544574 82537.368158 9 | -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/irr-bs-gemm-v3-time.dat: -------------------------------------------------------------------------------- 1 | #idx #GPU Q1 min max Q3 mean 2 | 0 3 181.90400000000002 181.363 196.31799999999998 183.43099999999998 185.0332 3 | 1 6 84.6517 83.9862 91.9999 86.5269 86.66855999999999 4 | 2 12 49.6446 46.9118 56.6649 50.3623 50.748599999999996 5 | 3 18 35.4954 
34.311 43.5575 38.1251 37.560340000000004 6 | 4 36 27.3451 27.14 31.3461 28.7441 28.64488 7 | 5 72 18.0361 17.8425 21.4758 19.248 19.022660000000002 8 | 6 108 14.1165 13.9857 16.1933 15.07 14.6995 9 | -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/irr-bs-gemm.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.09-ParSEC/irr-bs-gemm.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/project-1e-13.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.09-ParSEC/project-1e-13.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/rwalk-10.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.09-ParSEC/rwalk-10.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/scalapack_GEMM.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.09-ParSEC/scalapack_GEMM.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/scalapack_POTRF.pdf: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.09-ParSEC/scalapack_POTRF.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/scalapack_cpu_GEMM.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.09-ParSEC/scalapack_cpu_GEMM.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/scalapack_cpu_POTRF.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.09-ParSEC/scalapack_cpu_POTRF.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/scalapack_gpu_GEMM.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.09-ParSEC/scalapack_gpu_GEMM.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/scalapack_gpu_POTRF.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.09-ParSEC/scalapack_gpu_POTRF.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/slate_updated_nacl.pdf: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.09-ParSEC/slate_updated_nacl.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/spock-gemm-pbscal1.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.09-ParSEC/spock-gemm-pbscal1.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/spock-mqpc-density1.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.09-ParSEC/spock-mqpc-density1.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/spock-po-pbscal1.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.09-ParSEC/spock-po-pbscal1.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.09-ParSEC/spock-po-pbscal4.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.09-ParSEC/spock-po-pbscal4.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.14-UPCxx-GASNet/2.3.1.14-UPCxx.bib: -------------------------------------------------------------------------------- 1 | 2 | @misc{upcxx-site, 3 | author = {{UPC++ website}}, 4 | title = 
{\url{https://upcxx.lbl.gov/}} 5 | } 6 | 7 | @TechReport{upcxx-spec, 8 | author = "Dan Bonachea and Amir Kamil", 9 | title = "{UPC++ v1.0 Specification, Revision 2021.9.0}", 10 | institution = {Lawrence Berkeley National Laboratory}, 11 | number = {LBNL-2001425}, 12 | month = "September", 13 | year = 2021, 14 | doi = {10.25344/S4XK53}, 15 | note = {\url{https://doi.org/10.25344/S4XK53}}, 16 | url = {https://escholarship.org/uc/item/9870n7th}, 17 | } 18 | 19 | @TechReport{upcxx-guide, 20 | author = "John Bachan and Scott B. Baden and Dan Bonachea and Max Grossman and Paul H. Hargrove and Steven Hofmeyr and Mathias Jacquelin and Amir Kamil and Brian van Straalen and Daniel Waters", 21 | title = "{UPC++ v1.0 Programmer's Guide, Revision 2021.9.0}", 22 | institution = {Lawrence Berkeley National Laboratory}, 23 | number = {LBNL-2001424}, 24 | month = "September", 25 | year = 2021, 26 | doi = {10.25344/S4SW2T}, 27 | note = {\url{https://doi.org/10.25344/S4SW2T}}, 28 | url = {https://escholarship.org/uc/item/52k9h79s}, 29 | } 30 | 31 | @inproceedings{pawatm21-upcxx-kokkos, 32 | author = "Daniel Waters and Colin A. MacLean and Dan Bonachea and Paul H. Hargrove", 33 | title = "Demonstrating {UPC++/Kokkos} Interoperability in a Heat Conduction Simulation (Extended Abstract)", 34 | month = "November", 35 | year = 2021, 36 | location = {St. Louis, MO, USA}, 37 | booktitle = {2021 IEEE/ACM Parallel Applications Workshop, Alternatives To MPI+X (PAW-ATM)}, 38 | numpages = {5}, 39 | doi = {10.25344/S4630V}, 40 | note = {\url{https://doi.org/10.25344/S4630V}}, 41 | } 42 | 43 | @inproceedings{pawatm21-upcxx-as_eager, 44 | author = "Amir Kamil and Dan Bonachea", 45 | title = "Optimization of Asynchronous Communication Operations through Eager Notifications", 46 | month = "November", 47 | year = 2021, 48 | location = {St. 
Louis, MO, USA}, 49 | booktitle = {2021 IEEE/ACM Parallel Applications Workshop, Alternatives To MPI+X (PAW-ATM)}, 50 | numpages = {10}, 51 | doi = {10.25344/S42C71}, 52 | note = {\url{https://doi.org/10.25344/S42C71}}, 53 | } 54 | 55 | @inproceedings{sc21-upcxx-tutorial, 56 | author = "Katherine A. Yelick and Amir Kamil and Damian Rouson and Dan Bonachea and Paul H. Hargrove", 57 | title = "{UPC++}: An Asynchronous {RMA/RPC} Library for Distributed {C++} Applications", 58 | month = "November", 59 | year = 2021, 60 | location = {St. Louis, MO, USA}, 61 | booktitle = {International Conference for High Performance Computing, Networking, Storage, and Analysis (SC21)}, 62 | note = {Half-day tutorial at SC21. \url{https://go.lbl.gov/sc21}}, 63 | } 64 | -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.14-UPCxx-GASNet/Summit-slide-BW.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.14-UPCxx-GASNet/Summit-slide-BW.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.14-UPCxx-GASNet/all-cori-haswell-out-inserts-wait.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.14-UPCxx-GASNet/all-cori-haswell-out-inserts-wait.png -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.14-UPCxx-GASNet/all-cori-knl-out-inserts-wait.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.14-UPCxx-GASNet/all-cori-knl-out-inserts-wait.png 
-------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.14-UPCxx-GASNet/latency_bars.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.14-UPCxx-GASNet/latency_bars.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.14-UPCxx-GASNet/paw21_interop_strong_scaling1.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.14-UPCxx-GASNet/paw21_interop_strong_scaling1.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.14-UPCxx-GASNet/ss_Flan_1565_complex.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.14-UPCxx-GASNet/ss_Flan_1565_complex.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.14-UPCxx-GASNet/ss_boneS10_comm.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.14-UPCxx-GASNet/ss_boneS10_comm.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.14-UPCxx-GASNet/upcxx-spock.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.14-UPCxx-GASNet/upcxx-spock.pdf 
-------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.16-SICM/2.3.1.16-SICM.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 2 | @inproceedings{Doudali:2017:CTE:3132402.3132418, 3 | author = {Doudali, Thaleia Dimitra and Gavrilovska, Ada}, 4 | title = {{CoMerge}: Toward Efficient Data Placement in Shared Heterogeneous Memory Systems}, 5 | booktitle = {Proceedings of the International Symposium on Memory Systems}, 6 | series = {MEMSYS '17}, 7 | year = {2017}, 8 | isbn = {978-1-4503-5335-9}, 9 | location = {Alexandria, Virginia}, 10 | pages = {251--261}, 11 | numpages = {11}, 12 | url = {http://doi.acm.org/10.1145/3132402.3132418}, 13 | doi = {10.1145/3132402.3132418}, 14 | acmid = {3132418}, 15 | publisher = {ACM}, 16 | address = {New York, NY, USA}, 17 | keywords = {data tiering, hybrid memory management, shared heterogeneous memory systems}, 18 | } 19 | 20 | @inproceedings{Williams:2017:NDH:3145617.3145620, 21 | author = {Williams, Sean and Ionkov, Latchesar and Lang, Michael}, 22 | title = {{NUMA} Distance for Heterogeneous Memory}, 23 | booktitle = {Proceedings of the Workshop on Memory Centric Programming for HPC}, 24 | series = {MCHPC'17}, 25 | year = {2017}, 26 | isbn = {978-1-4503-5131-7}, 27 | location = {Denver, CO, USA}, 28 | pages = {30--34}, 29 | numpages = {5}, 30 | url = {http://doi.acm.org/10.1145/3145617.3145620}, 31 | doi = {10.1145/3145617.3145620}, 32 | acmid = {3145620}, 33 | publisher = {ACM}, 34 | address = {New York, NY, USA}, 35 | } 36 | 37 | @misc{olson2021online, 38 | title={Online Application Guidance for Heterogeneous Memory Systems}, 39 | author={M. Ben Olson and Brandon Kammerdiener and Kshitij A. Doshi and Terry Jones and Michael R. 
Jantz}, 40 | year={2021}, 41 | eprint={2110.02150}, 42 | archivePrefix={arXiv}, 43 | primaryClass={cs.PF} 44 | } -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.16-SICM/mike-excelent.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.16-SICM/mike-excelent.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.16-SICM/sicm-online-diagram.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.16-SICM/sicm-online-diagram.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.17-OMPI-X/2.3.1.17-OMPI-X.bib: -------------------------------------------------------------------------------- 1 | @Article{Bernholdt:2018:SMU, 2 | author = {David E. Bernholdt and Swen Boehm and George Bosilca 3 | and Manjunath {Gorentla Venkata} and Ryan E. Grant 4 | and Thomas Naughton and Howard P. Pritchard and 5 | Martin Schulz and Geoffroy R. Vallee}, 6 | title = {A Survey of {MPI} Usage in the {U.S.} {E}xascale 7 | {C}omputing {P}rogram}, 8 | journal = {Concurrency and Computing: Practice and Experience}, 9 | year = {2018}, 10 | doi = {10.1002/cpe.4851}, 11 | ornlptsid = {112643}, 12 | ornlepm = {} 13 | } 14 | 15 | @TechReport{Bernholdt:2018:SMU-tr, 16 | author = {David E. Bernholdt and Swen Boehm and George Bosilca 17 | and Manjunath {Gorentla Venkata} and Ryan E. Grant 18 | and Thomas Naughton and Howard P. Pritchard and 19 | Martin Schulz and Geoffroy R. 
Vallee}, 20 | title = {A Survey of {MPI} Usage in the {U.S.} {E}xascale 21 | {C}omputing {P}rogram}, 22 | institution = {Oak Ridge National Laboratory}, 23 | year = 2018, 24 | number = {ORNL/SPR-2018/790}, 25 | doi = {10.2172/1462877}, 26 | note = {\url{https://doi.org/10.2172/1462877}}, 27 | ornlptsid = {108588}, 28 | ornlepm = {2018} 29 | } 30 | 31 | @Misc{Bernholdt:2017:smu-talk, 32 | author = {David E. Bernholdt and Swen Boehm and George Bosilca 33 | and Manjunath {Gorentla Venkata} and Ryan E. Grant 34 | and Thomas Naughton and Howard P. Pritchard and 35 | Martin Schulz and Geoffroy R. Vallee}, 36 | title = {A Survey of {MPI} Usage in the {U.S.} {E}xascale 37 | {C}omputing {P}rogram}, 38 | howpublished = {talk at ExaMPI 2017 workshop, Denver, CO}, 39 | month = {November}, 40 | year = 2017} 41 | 42 | @inproceedings{icl:957, 43 | author = {Eberius, D. and Patinyasakdikul, T. and Bosilca, G.}, 44 | title = {{Using Software-Based Performance Counters to Expose Low-Level Open MPI Performance Information}}, 45 | booktitle = {Proceedings of the 24th European MPI Users' Group Meeting}, 46 | institution = {Innovative Computing Laboratory, University of Tennessee}, 47 | pages = {Article No. 7}, 48 | address = {Chicago, IL}, 49 | month = {September}, 50 | year = {2017} 51 | } 52 | # Put your BibTeX entries in this file. 53 | 54 | @inproceedings{wheeler2008qthreads, 55 | title = {Qthreads: {{An API}} for Programming with Millions of Lightweight Threads}, 56 | doi = {10.1109/IPDPS.2008.4536359}, 57 | abstract = {Large scale hardware-supported multithreading, an attractive means of increasing computational power, benefits significantly from low per-thread costs. Hardware support for lightweight threads is a developing area of research. Each architecture with such support provides a unique interface, hindering development for them and comparisons between them. A portable abstraction that provides basic lightweight thread control and synchronization primitives is needed. 
Such an abstraction would assist in exploring both the architectural needs of large scale threading and the semantic power of existing languages. Managing thread resources is a problem that must be addressed if massive parallelism is to be popularized. The qthread abstraction enables development of large-scale multithreading applications on commodity architectures. This paper introduces the qthread API and its Unix implementation, discusses resource management, and presents performance results from the HPCCG benchmark.}, 58 | timestamp = {2016-02-17T21:14:11Z}, 59 | booktitle = {{{IEEE International Symposium}} on {{Parallel}} and {{Distributed Processing Workshops}}, 2008. {{IPDPSW}} 2008}, 60 | author = {Wheeler, K.B. and Murphy, R.C. and Thain, D.}, 61 | month = apr, 62 | year = {2008}, 63 | keywords = {API,application program interfaces,Computer architecture,Costs,Hardware,HPCCG benchmark,Laboratories,large scale hardware supported multithreading,Large-scale systems,lightweight threads,Multithreading,multi-threading,Parallel processing,Programming profession,qthread abstraction,qthread API,Qthreads,resource allocation,resource management,Unix,Unix implementation,Yarn}, 64 | pages = {1--8}, 65 | } 66 | 67 | @misc{qthreads-github, 68 | title = {{Qthreads lightweight locality-aware user-level threading runtime}}, 69 | author = {{Sandia National Laboratories}}, 70 | note = {\url{https://github.com/Qthreads/qthreads}} 71 | } 72 | 73 | @inproceedings{evans2018qthreads-model, 74 | title = {Verifying Qthreads: Is Model Checking Viable for User Level Tasking Runtimes?}, 75 | booktitle = {2nd International Workshop on Software Correctness for HPC Applications (Correctness 2018)}, 76 | author = {Evans, Noah}, 77 | year = {2018}, 78 | month = {November} 79 | } 80 | 81 | -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.17-OMPI-X/p2p-threading-performance.png: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.17-OMPI-X/p2p-threading-performance.png -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.17-OMPI-X/partitioned-comms-code.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.17-OMPI-X/partitioned-comms-code.jpg -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.17-OMPI-X/partitioned-communications-early-receive.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.17-OMPI-X/partitioned-communications-early-receive.png -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.17-OMPI-X/partitioned-communications-partial-sends.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.17-OMPI-X/partitioned-communications-partial-sends.png -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.17-OMPI-X/reinit-performance.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.17-OMPI-X/reinit-performance.jpg -------------------------------------------------------------------------------- 
/projects/2.3.1-PMR/2.3.1.17-OMPI-X/reinit.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.17-OMPI-X/reinit.png -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.17-OMPI-X/rma-threading-performance.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.17-OMPI-X/rma-threading-performance.png -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.17-OMPI-X/ult-performance.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.17-OMPI-X/ult-performance.png -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.18-RAJA-Kokkos/2.3.1.18-RAJA-Kokkos.bib: -------------------------------------------------------------------------------- 1 | @misc{RAJA-github, 2 | title = "{{RAJA} Performance Portability Layer}", 3 | note = {\url{https://github.com/LLNL/RAJA}} 4 | } 5 | 6 | @misc{RAJAPerf-github, 7 | title = "{{RAJA} Performance Suite}", 8 | note = {\url{https://github.com/LLNL/RAJAPerf}} 9 | } 10 | 11 | @misc{CHAI-github, 12 | title = "{{CHAI} Copy-hiding Array Abstraction}", 13 | note = {\url{https://github.com/LLNL/CHAI}} 14 | } 15 | 16 | @misc{Umpire-github, 17 | title = "{Umpire Application-focused Memory Management API}", 18 | note = {\url{https://github.com/LLNL/Umpire}} 19 | } 20 | -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.18-RAJA-Kokkos/ecp-small.png: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.18-RAJA-Kokkos/ecp-small.png -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/2.3.1.19-Argo-PowerSteering.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 2 | # Put your BibTeX entries in this file. 3 | 4 | @INPROCEEDINGS{Ellsworth:argo, 5 | author={D. Ellsworth and T. Patki and S. Perarnau and S. Seo and A. Amer and J. Zounmevo and R. Gupta and K. Yoshii and H. Hoffman and A. Malony and M. Schulz and P. Beckman}, 6 | booktitle={2016 IEEE International Parallel and Distributed Processing Symposium Workshops (IPDPSW)}, 7 | title={Systemwide Power Management with {Argo}}, 8 | year={2016}, 9 | pages={1118-1121}, 10 | doi={10.1109/IPDPSW.2016.81}, 11 | } 12 | 13 | @inproceedings{ellsworth_e2sc2016, 14 | author = {Ellsworth, Daniel and Patki, Tapasya and Schulz, Martin and Rountree, Barry and Malony, Allen}, 15 | title = {A Unified Platform for Exploring Power Management Strategies}, 16 | booktitle = {Proc. 4th International Workshop on Energy Efficient Supercomputing}, 17 | year = {2016}, 18 | location = {Salt Lake City, Utah}, 19 | } 20 | 21 | @inproceedings{sakamoto2017, 22 | author = {Sakamoto, Ryuichi and Cao, Thang and Kondo, Masaaki and Inoue, Koji and Ueda, Masatsugu and Patki, Tapasya and Ellsworth, Daniel and Rountree, Barry and Schulz, Martin}, 23 | title = {Production Hardware Overprovisioning: Real-world Performance Optimization Using an Extensible Power-aware Resource Management Framework}, 24 | booktitle = {Proc.
31st International Parallel and Distributed Processing Symposium}, 25 | year = {2017}, 26 | location = {Orlando, Florida, USA} 27 | } 28 | 29 | @InProceedings{patki2016, 30 | author="Patki, Tapasya 31 | and Bates, Natalie 32 | and Ghatikar, Girish 33 | and Clausen, Anders 34 | and Klingert, Sonja 35 | and Abdulla, Ghaleb 36 | and Sheikhalishahi, Mehdi", 37 | editor="Kunkel, Julian M. 38 | and Balaji, Pavan 39 | and Dongarra, Jack", 40 | title="Supercomputing Centers and Electricity Service Providers: A Geographically Distributed Perspective on Demand Management in {Europe} and the {United States}", 41 | booktitle=" International Supercomputing Conference (High Performance Computing), ISC-HPC", 42 | year="2016", 43 | 44 | } 45 | 46 | @misc{osti_1353371, 47 | title = {Addressing Thermal and Performance Variability Issues in Dynamic Processors}, 48 | author = {Yoshii, Kazutomo and Llopis, Pablo and Zhang, Kaicheng and Luo, Yingyi and Ogrenci-Memik, Seda and Memik, Gokhan and Sankaran, Rajesh and Beckman, Pete}, 49 | doi = {10.2172/1353371}, 50 | year = {2017}, 51 | month = {3} 52 | } 53 | 54 | @inproceedings{zhang2015minimizing, 55 | title={Minimizing Thermal Variation Across System Components}, 56 | author={Zhang, Kaicheng and Ogrenci-Memik, Seda and Memik, Gokhan and Yoshii, Kazutomo and Sankaran, Rajesh and Beckman, Pete}, 57 | booktitle={Parallel and Distributed Processing Symposium (IPDPS), 2015 IEEE International}, 58 | pages={1139--1148}, 59 | year={2015}, 60 | organization={IEEE} 61 | } 62 | 63 | @inproceedings{zounmevo2015container, 64 | title={A Container-Based Approach to {OS} Specialization for Exascale Computing}, 65 | author={Zounmevo, Judicael A and Perarnau, Swann and Iskra, Kamil and Yoshii, Kazutomo and Gioiosa, Roberto and Van Essen, Brian C and Gokhale, Maya B and Leon, Edgar A}, 66 | booktitle={Containers, 1st Workshop on (WoC)}, 67 | year={2015} 68 | } 69 | 70 | @inproceedings{perarnau2015distributed, 71 | title={Distributed Monitoring and
Management of Exascale Systems in the {Argo} Project}, 72 | author={Perarnau, Swann and Thakur, Rajeev and Iskra, Kamil and Raffenetti, Ken and Cappello, Franck and Gupta, Rinku and Beckman, Pete and Snir, Marc and Hoffmann, Henry and Schulz, Martin and others}, 73 | booktitle={Distributed Applications and Interoperable Systems}, 74 | pages={173--178}, 75 | year={2015}, 76 | organization={Springer International Publishing} 77 | } 78 | 79 | @inproceedings{perarnau2016exploring, 80 | title={Exploring Data Migration for Future Deep-Memory Many-Core Systems}, 81 | author={Perarnau, Swann and Zounmevo, Judicael A and Gerofi, Balazs and Iskra, Kamil and Beckman, Pete}, 82 | booktitle={IEEE Cluster}, 83 | year={2016} 84 | } 85 | 86 | @inproceedings{perarnau2017argo, 87 | title={{Argo NodeOS}: Toward Unified Resource Management for Exascale}, 88 | author={Perarnau, Swann and Zounmevo, Judicael A and Dreher, Matthieu and Van Essen, Brian C and Gioiosa, Roberto and Iskra, Kamil and Gokhale, Maya B and Yoshii, Kazutomo and Beckman, Pete}, 89 | booktitle={Parallel and Distributed Processing Symposium (IPDPS), 2017 IEEE International}, 90 | pages={153--162}, 91 | year={2017}, 92 | organization={IEEE} 93 | } 94 | 95 | @inproceedings{dreher2017situ, 96 | title={In Situ Workflows at Exascale: System Software to the Rescue}, 97 | author={Dreher, Matthieu and Perarnau, Swann and Peterka, Tom and Iskra, Kamil and Beckman, Pete}, 98 | booktitle={Proceedings of the In Situ Infrastructures on Enabling Extreme-Scale Analysis and Visualization}, 99 | pages={22--26}, 100 | year={2017}, 101 | organization={ACM} 102 | } 103 | -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/2.3.1.19-Argo-PowerSteering.tex: -------------------------------------------------------------------------------- 1 | \subsubsection{\stid{1.19} Argo: Low-Level Resource Management for the OS and Runtime} 2 | 3 | The goal of the Argo 
project~\cite{perarnau2017argo} is to augment and 4 | optimize existing OS/R components for use in production HPC systems, 5 | providing portable, open source, integrated software that improves the 6 | performance and scalability of, and offers increased functionality to, 7 | exascale applications and runtime systems. 8 | 9 | System resources should be managed in cooperation with applications and 10 | runtime systems to provide improved performance and resilience. This is 11 | motivated by the increasing complexity of HPC hardware and application 12 | software, which needs to be matched by corresponding increases in the 13 | capabilities of system management solutions. 14 | 15 | The Argo software is developed as a toolbox---a collection of autonomous 16 | components that can be freely mixed and matched to best meet the user's 17 | needs. 18 | 19 | Project activities focus on four products: 20 | \begin{enumerate} 21 | \item AML: a library providing explicit, application-aware memory 22 | management for deep memory systems 23 | 24 | \item UMap: a user-level library incorporating NVRAM into complex memory 25 | hierarchies using a high-performance \texttt{mmap}-like interface 26 | 27 | \item PowerStack: power management infrastructure for optimizing performance 28 | of exascale applications under power or energy constraints 29 | 30 | \item NRM: a daemon to centralize node management activities such as 31 | job management, resource management, and power management 32 | \end{enumerate} 33 | 34 | \input projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/aml 35 | \input projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/umap 36 | \input projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/powerstack 37 | \input projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/nrm 38 | -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/PowerStack_v2.png:
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/PowerStack_v2.png -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/aml-components.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/aml-components.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/aml-xsbench.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/aml-xsbench.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/argo-global.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/argo-global.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/argo-node.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/argo-node.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/cpd.png: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/cpd.png -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/nrm-energy.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/nrm-energy.png -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/nrm-loop.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/nrm-loop.pdf -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/nrm-runtime.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/nrm-runtime.png -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/power_model.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/power_model.png -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/sensors.jpg: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/sensors.jpg -------------------------------------------------------------------------------- /projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/umap-arch.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.1-PMR/2.3.1.19-Argo-PowerSteering/umap-arch.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2-Tools.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 2 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.01-Tools-SDKs/2.3.2.01-Tools-SDKs.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 2 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.06-EXA-PAPI/2.3.2.06-EXA-PAPI.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 
2 | 3 | @techreport{PWN-2020-01, 4 | title = {Formulation of Requirements for new PAPI++ Software Package: Part I: Survey Results}, 5 | journal = {PAPI++ Working Notes}, 6 | number = {1, ICL-UT-20-02}, 7 | year = {2020}, 8 | month = {2020-01}, 9 | publisher = {Innovative Computing Laboratory, University of Tennessee Knoxville}, 10 | author = {Heike Jagode and Anthony Danalis and Jack Dongarra} 11 | } 12 | 13 | 14 | @techreport{PWN-2020-07, 15 | title = {Roadmap for Refactoring classic PAPI to PAPI++: Part II: Formulation of Roadmap based on Survey Results}, 16 | journal = {PAPI++ Working Notes}, 17 | number = {2, ICL-UT-20-09}, 18 | year = {2020}, 19 | month = {2020-07}, 20 | publisher = {Innovative Computing Laboratory, University of Tennessee}, 21 | author = {Heike Jagode and Anthony Danalis and Damien Genet} 22 | } 23 | 24 | 25 | @conference{toolsWS-2020-09, 26 | title = {Effortless Monitoring of Arithmetic Intensity with PAPI{\textquoteright}s Counter Analysis Toolkit}, 27 | booktitle = {13th International Workshop on Parallel Tools for High Performance Computing}, 28 | year = {2020}, 29 | month = {2020-09}, 30 | publisher = {Springer International Publishing}, 31 | organization = {Springer International Publishing}, 32 | address = {Dresden, Germany}, 33 | author = {Daniel Barry and Anthony Danalis and Heike Jagode} 34 | } 35 | 36 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.06-EXA-PAPI/2.3.2.06-EXA-PAPI_old.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.06-EXA-PAPI/2.3.2.06-EXA-PAPI_old.tex -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.06-EXA-PAPI/Exa-PAPI_sde_magma.pdf: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.06-EXA-PAPI/Exa-PAPI_sde_magma.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.06-EXA-PAPI/Exa-PAPI_sde_parsec.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.06-EXA-PAPI/Exa-PAPI_sde_parsec.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.06-EXA-PAPI/cat-DP-flops-arch-comparison-1.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.06-EXA-PAPI/cat-DP-flops-arch-comparison-1.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.06-EXA-PAPI/papi_sde.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.06-EXA-PAPI/papi_sde.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.08-HPCToolkit/2.3.2.08-HPCToolkit.bib: -------------------------------------------------------------------------------- 1 | 2 | 3 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.08-HPCToolkit/hpctoolkit-lammps-traces.pdf: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.08-HPCToolkit/hpctoolkit-lammps-traces.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.08-HPCToolkit/hpctoolkit-many-threads.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.08-HPCToolkit/hpctoolkit-many-threads.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.08-HPCToolkit/hpctoolkit-nyx-trace.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.08-HPCToolkit/hpctoolkit-nyx-trace.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.08-HPCToolkit/hpctoolkit-pelec-profiles.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.08-HPCToolkit/hpctoolkit-pelec-profiles.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.08-HPCToolkit/hpctoolkit-qs.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.08-HPCToolkit/hpctoolkit-qs.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.08-HPCToolkit/hpctoolkit-raja-perf.pdf: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.08-HPCToolkit/hpctoolkit-raja-perf.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.08-HPCToolkit/hpctoolkit-vec-add-ompt.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.08-HPCToolkit/hpctoolkit-vec-add-ompt.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/2.3.2.10-Autotuning.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 2 | 3 | @inproceedings{P3HPC_Bricks, 4 | author = {Zhao,Tuowen and Williams, Samuel and Hall, Mary and Johansen, Hans}, 5 | title = {Delivering Performance Portable Stencil Computations on CPUs and GPUs 6 | Using Bricks}, 7 | booktitle = {Proceedings of the International Workshop on Performance, 8 | Portability and Productivity in HPC (P3HPC), SC'18}, 9 | month = {Nov}, 10 | year = {2018}, 11 | location = {Dallas, TX, USA}, 12 | } 13 | 14 | @inproceedings{nelson2015surf, 15 | author = {T. Nelson and A. Rivera and P. Balaprakash and M. Hall and P. D. Hovland and E. Jessup and B. Norris}, 16 | booktitle = {Proceedings of the 44th International Conference on Parallel Processing (ICPP)}, 17 | title = {Generating efficient tensor contractions for {GPU}s}, 18 | year = {2015} 19 | } 20 | 21 | @inproceedings{kruse2018pragmas, 22 | author = {Kruse, Michael and Finkel, Hal}, 23 | title = {{User-Directed Loop-Transformations in Clang}}, 24 | booktitle = {Proceedings of the 5th Workshop on the LLVM Compiler Infrastructure in HPC (LLVM-HPC 2018. November 12. 
Dallas, USA)}, 25 | year = 2018, 26 | publisher = {IEEE}, 27 | } 28 | 29 | @InProceedings{sreenivasan2019openmp, 30 | author={Sreenivasan, Vinu and Javali, Rajath and Hall, Mary and Balaprakash, Prasanna and Scogland, Thomas R. W. and de Supinski, Bronis R.}, 31 | title={{A Framework for Enabling OpenMP Autotuning}}, 32 | booktitle={OpenMP: Conquering the Full Hardware Spectrum}, 33 | year={2019}, 34 | publisher={Springer International Publishing}, 35 | pages={50--60}, 36 | } 37 | 38 | 39 | @article{wu2020autotuning, 40 | title={{Autotuning PolyBench Benchmarks with LLVM Clang/Polly Loop Optimization Pragmas Using Bayesian Optimization}}, 41 | author={Wu, Xingfu and Kruse, Michael and Balaprakash, Prasanna and Finkel, Hal and Hovland, Paul and Taylor, Valerie}, 42 | journal={PMBS Workshop @SC}, 43 | year={2020} 44 | } 45 | 46 | @article{wu2021autotuning, 47 | title={{Customized Monte Carlo Tree Search for LLVM/Polly's Composable Loop Optimization Transformations}}, 48 | author={Wu, Xingfu and Kruse, Michael and Balaprakash, Prasanna and Finkel, Hal and Hovland, Paul and Taylor, Valerie}, 49 | journal={PMBS Workshop @SC21}, 50 | year={2021} 51 | } 52 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/2.3.2.10-Bricks.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 2 | 3 | @INPROCEEDINGS{zhao2018, 4 | author={T. {Zhao} and S. {Williams} and M. {Hall} and H. {Johansen}}, 5 | booktitle={2018 IEEE/ACM International Workshop, P3HPC}, 6 | title={Delivering Performance-Portable Stencil Computations on {CPU}s and {GPU}s Using Bricks}, 7 | year={2018}, 8 | volume={}, 9 | number={}, 10 | pages={59-70}, 11 | doi={10.1109/P3HPC.2018.00009}, 12 | ISSN={}, 13 | month={Nov},} 14 | 15 | @INPROCEEDINGS{zhao2019, 16 | author={T. {Zhao} and P. {Basu} and S. {Williams} and M. {Hall} and H. 
{Johansen}}, 17 | booktitle={accepted and to appear, SC 2019}, 18 | title={Exploiting Reuse and Vectorization in Blocked Stencil Computations on 19 | {CPU}s and {GPU}s}, 20 | year={2019}, 21 | volume={}, 22 | number={}, 23 | ISSN={}, 24 | month={Nov},} 25 | 26 | @INPROCEEDINGS{zhaoMPI2019, 27 | author={T. {Zhao} and S. {Williams} and M. {Hall} and H. {Johansen}}, 28 | booktitle={submitted to IPDPS '20}, 29 | title={Pack-Free Stencil Ghost Zone Exchange}, 30 | year={2019}, 31 | volume={}, 32 | number={}, 33 | ISSN={}, 34 | month={},} 35 | 36 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/2.3.2.10-CLACC.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 2 | 3 | @Misc{openaccOrgTools, 4 | title = {{OpenACC: Commercial Compilers}}, 5 | howpublished = "{[Online]. Available:} 6 | \url{http://openacc.org/tools}" 7 | } 8 | 9 | @Misc{specAccel, 10 | title= {{SPEC ACCEL}}, 11 | howpublished = "{[Online]. Available:} 12 | \url{https://www.spec.org/accel/}" 13 | } 14 | 15 | @InProceedings{openACCValidationSuite, 16 | author="Friedline, Kyle 17 | and Chandrasekaran, Sunita 18 | and Lopez, M. Graham 19 | and Hernandez, Oscar", 20 | title={{OpenACC 2.5 Validation Testsuite Targeting Multiple Architectures}}, 21 | booktitle="High Performance Computing", 22 | year="2017", 23 | publisher="Springer International Publishing", 24 | address="Cham", 25 | pages="557--575", 26 | abstract="Heterogeneous computing has emerged as a promising fit for scientific domains such as molecular dynamics simulations, bioinformatics, weather prediction. Such a computing paradigm includes x86 processors coupled with GPUs, FPGAs, DSPs or a coprocessor paradigm that takes advantage of all the cores and caches on a single die such as the Knights Landing. 
OpenACC, a high-level directive-based parallel programming model has emerged as a programming paradigm that can tackle the intensity of heterogeneity in architectures. Data-driven large scientific codes are increasingly using OpenACC, which makes it essential to analyze the accuracy of OpenACC compilers while they port code to various types of platforms. In response, we have been creating a validation suite to validate and verify the implementations of OpenACC features in conformance with the specification. The validation suite also provides a tool to compiler developers as a standard for the compiler to be tested against and to users and compiler developers alike in clarifying the OpenACC specification. This testsuite has been integrated into the harness infrastructure of the TITAN and Summitdev systems at Oak Ridge National Lab and is being used for production.", 27 | isbn="978-3-319-67630-2" 28 | } 29 | 30 | @inproceedings{clacc:2018:denny, 31 | author = {J.E. Denny and S. Lee and J.S. Vetter}, 32 | title = {{Clacc: Translating OpenACC to OpenMP in Clang}}, 33 | booktitle = {2018 IEEE/ACM 5th Workshop on the LLVM Compiler Infrastructure in HPC (LLVM-HPC)}, 34 | address = {Dallas, TX, USA}, 35 | publisher = {IEEE}, 36 | year = {2018}, 37 | } 38 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/2.3.2.10-LLVM-DOE.tex: -------------------------------------------------------------------------------- 1 | \subsubsection{\stid{2.10} PROTEAS-TUNE - LLVM-DOE: Creating and Maintaining a DOE Fork of LLVM}\label{s:llvm-doe} 2 | 3 | \paragraph{Overview} 4 | 5 | The ECP funds multiple projects that develop compiler technologies, based on the 6 | popular, open-source LLVM compiler infrastructure project. This ecosystem allows 7 | customization to meet the unique needs of ECP, and a level of well-established 8 | mechanisms to deploy technologies through vendors and at DOE’s leadership 9 | facilities. 
Importantly, this provides an alternative open-source compiler 10 | ecosystem to those provided by the vendor, thus reducing the dependence on the 11 | vendor’s compilers, timelines, and staff (Risk 10032 that ST product will not 12 | function or meet performance targets). 13 | 14 | In addition, most of today’s vendors already rely on LLVM as the foundation for 15 | their compiler ecosystems. This means ECP technology has a path back to vendors 16 | via LLVM itself or through a DOE-/ECP-focused fork of LLVM’s open source 17 | repository. This work will focus on deployment to reduce Risk 10020. 18 | 19 | More broadly, there are eight LLVM-related projects supported by ECP that have 20 | a risk of not being used if developers cannot easily access their contributions. 21 | This fork of LLVM will provide an opportunity for these projects to work 22 | collectively on establishing synergies and interoperability, addressing the unique 23 | needs of ECP, and developing mechanisms for making contributions back into the mainstream 24 | LLVM code base. The tasks to set up the DOE Fork of LLVM are as follows: 25 | 26 | \begin{enumerate} 27 | 28 | \item Set up a fork of the llvm-project upstream repository (see \url{https://github.com/llvm-doe-org}). 29 | 30 | \item Enable continuous integration for the fork on various hardware of interest. 31 | 32 | \item Enable LLVM-related ECP projects to push and test branches. 33 | 34 | \item Set up status information for the continuous integration results. 35 | 36 | \end{enumerate} 37 | 38 | 39 | \paragraph{Solution Strategy} 40 | 41 | %\begin{enumerate} 42 | 43 | The DOE LLVM repository is set up on GitHub as a fork of the llvm-project 44 | main repository also hosted on GitHub. This makes it easier to have a 45 | seamless synchronization with the main repository and keep all the 46 | GitHub main-fork integrated features. 47 | % 48 | The GitHub repository is automatically mirrored in the GitLab premium 49 | instance hosted at ORNL. 
50 | % 51 | Furthermore, the continuous integration takes advantage of the GitLab CI infrastructure. 52 | This infrastructure is available on several machines from the ExCL lab as 53 | well as on Summit and Theta. 54 | 55 | %\end{enumerate} 56 | 57 | 58 | \paragraph{Recent Progress} 59 | 60 | %\begin{enumerate} 61 | The fork has been set up with an automatic mirroring with the upstream repository. 62 | The mirroring is using GitHub Actions, and the fork is integrated with E4S releases. 63 | %\end{enumerate} 64 | 65 | 66 | \paragraph{Next Steps} 67 | 68 | %\begin{enumerate} 69 | The team will add continuous integration on more hardware (i.e., most recent versions of Frontier and Aurora test nodes) and 70 | improve the test suite for the CI (e.g., OpenACC tests). 71 | %\end{enumerate} 72 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/2.3.2.10-LLVM.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 
2 | 3 | @article{kruse2018loop, 4 | title={Loop Optimization Framework}, 5 | author={Kruse, Michael and Finkel, Hal}, 6 | journal={LCPC 2018; arXiv:1811.00632}, 7 | year={2018} 8 | } 9 | 10 | @inproceedings{kruse2018user, 11 | title={User-Directed Loop-Transformations in Clang}, 12 | author={Kruse, Michael and Finkel, Hal}, 13 | booktitle={2018 IEEE/ACM 5th Workshop on the LLVM Compiler Infrastructure in HPC (LLVM-HPC)}, 14 | pages={49--58}, 15 | year={2018}, 16 | organization={IEEE} 17 | } 18 | 19 | @inproceedings{doerfert2018compiler, 20 | title={Compiler optimizations for OpenMP}, 21 | author={Doerfert, Johannes and Finkel, Hal}, 22 | booktitle={International Workshop on OpenMP}, 23 | pages={113--127}, 24 | year={2018}, 25 | organization={Springer} 26 | } 27 | 28 | @inproceedings{doerfert2019tregion, 29 | title={The TRegion Interface and Compiler Optimizations for OpenMP Target Regions}, 30 | author={Doerfert, Johannes and Diaz, Jose Manuel Monsalve and Finkel, Hal}, 31 | booktitle={International Workshop on OpenMP}, 32 | pages={153--167}, 33 | year={2019}, 34 | organization={Springer} 35 | } 36 | 37 | @misc{P1609R0, 38 | title={P1609R0: C++ Should Support Just-in-Time Compilation}, 39 | author={Finkel, Hal}, 40 | howpublished={\url{http://wg21.link/p1609r0}}, 41 | year={2019} 42 | } 43 | 44 | @article{finkel2019clangjit, 45 | title={ClangJIT: Enhancing C++ with Just-in-Time Compilation}, 46 | author={Finkel, Hal and Poliakoff, David and Richards, David F}, 47 | journal={arXiv preprint arXiv:1904.08555}, 48 | year={2019} 49 | } 50 | 51 | 52 | @InProceedings{giorgis2020, 53 | author="Georgakoudis, Giorgis 54 | and Doerfert, Johannes 55 | and Laguna, Ignacio 56 | and Scogland, Thomas R. W.", 57 | editor="Milfeld, Kent 58 | and de Supinski, Bronis R. 
59 | and Koesterke, Lars 60 | and Klinkenberg, Jannis", 61 | title={{FAROS: A Framework to Analyze OpenMP Compilation Through Benchmarking and Compiler Optimization Analysis}}, 62 | booktitle="OpenMP: Portable Multi-Level Parallelism on Modern Systems", 63 | year="2020", 64 | publisher="Springer International Publishing", 65 | address="Cham", 66 | pages="3--17", 67 | abstract="Compilers optimize OpenMP programs differently than their serial elision. Early outlining of parallel regions and invocation of parallel code via OpenMP runtime functions are two of the most profound differences. Understanding the interplay between compiler optimizations, OpenMP compilation, and application performance is hard and usually requires specialized benchmarks and compilation analysis tools.", 68 | isbn="978-3-030-58144-2" 69 | } 70 | 71 | 72 | @misc{OpenMPOpt2020, 73 | title={{(OpenMP) Parallelism Aware Optimizations}}, 74 | author={Doerfert, Johannes and Huber, Joseph and Stipanovic, Stefan and Georgakoudis, Giorgis and Tobon Mosquera, Hamilton and Tian, Shilei}, 75 | howpublished={\url{https://whova.com/embedded/session/llvm_202010/1162344/}}, 76 | year={2020} 77 | } 78 | 79 | @article{kruse2020search, 80 | title={{Autotuning Search Space for Loop Transformations}}, 81 | author={Kruse, Michael and Finkel, Hal and Wu, Xingfu}, 82 | journal={LLVM-HPC Workshop @SC}, 83 | year={2020} 84 | } 85 | 86 | @article{finkel2020dsl, 87 | title={{\emph{Really} Embedding Domain-Specific Languages into C++}}, 88 | author={Finkel, Hal and McCaskey, Alex and Popoola, Tobi and Lyakh, Dmitry and Doerfert, Johannes}, 89 | journal={LLVM-HPC Workshop @SC}, 90 | year={2020} 91 | } 92 | 93 | @misc{kruse2020openmpbooth, 94 | author = {Kruse, Michael}, 95 | title = {{OpenMP 5.1 Features: Loop Transformation Constructs}}, 96 | howpublished = {OpenMP Booth Talk at SC20}, 97 | year = {2020}, 98 | url = {https://www.openmp.org/events/openmp-sc20/}, 99 | } 100 | 101 | 102 | @misc{kruse2021openmpbooth, 103 | 
author = {Kruse, Michael}, 104 | title = {{Using OpenMP loop transformations with Clang}}, 105 | howpublished = {OpenMP Booth Talk at SC21}, 106 | year = {2021}, 107 | url = {https://www.openmp.org/events/sc21/#booth-talks}, 108 | } 109 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/2.3.2.10-PAPYRUS.bib: -------------------------------------------------------------------------------- 1 | @inproceedings{Kim:2017:PHP, 2 | author = {Kim, Jungwon and Lee, Seyong and Vetter, Jeffrey S.}, 3 | title = {{PapyrusKV}: A High-performance Parallel Key-value Store for Distributed {NVM} Architectures}, 4 | booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis}, 5 | series = {SC '17}, 6 | year = {2017}, 7 | location = {Denver, Colorado}, 8 | pages = {57:1--57:14}, 9 | articleno = {57}, 10 | numpages = {14}, 11 | } 12 | 13 | @inproceedings{Kim:2017:DIP, 14 | author = {Kim, Jungwon and Sajjapongse, Kittisak and Lee, Seyong and Vetter, Jeffrey S.}, 15 | title = "{Design and Implementation of Papyrus: Parallel Aggregate Persistent Storage}", 16 | booktitle = "{Proceedings of the 31st IEEE International Parallel and Distributed Processing Symposium}", 17 | series = {IPDPS '17}, 18 | year = {2017}, 19 | pages = {1151--1162}, 20 | } 21 | 22 | @inproceedings{Georganas:2014:PDB, 23 | author = {Georganas, Evangelos and Bulu\c{c}, Aydin and Chapman, Jarrod and Oliker, Leonid and Rokhsar, Daniel and Yelick, Katherine}, 24 | title = "{Parallel De Bruijn Graph Construction and Traversal for De Novo Genome Assembly}", 25 | booktitle = "{Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis}", 26 | series = {SC '14}, 27 | year = {2014}, 28 | pages = {437--448}, 29 | } 30 | 31 | @article{Kim:2019:IED, 32 | author = {Kim, Jungwon and Vetter, Jeffrey S.}, 33 | title = "{Implementing Efficient 
Data Compression and Encryption in a Persistent Key-value Store for HPC}", 34 | journal = "{The International Journal of High Performance Computing Applications}", 35 | volume = {33}, 36 | number = {6}, 37 | pages = {1098-1112}, 38 | year = {2019}, 39 | }, 40 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/2.3.2.10-PROTEAS.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 2 | 3 | @TechReport{vetter:2018:extreme, 4 | author = "J. S. Vetter and R. Brightwell and M. Gokhale and P. 5 | McCormick and R. Ross and J. Shalf and K. Antypas and 6 | D. Donofrio and T. Humble and C. Schuman and B. Van 7 | Essen and S. Yoo and A. Aiken and D. Bernholdt and S. 8 | Byna and K. Cameron and F. Cappello and B. Chapman and 9 | A. Chien and M. Hall and R. Hartman-Baker and Z. Lan 10 | and M. Lang and J. Leidel and S. Li and R. Lucas and J. 11 | Mellor-Crummey and P. Peltz Jr. and T. Peterka and M. 12 | Strout and J. 
Wilke", 13 | title = "Extreme Heterogeneity 2018 - Productive Computational 14 | Science in the Era of Extreme Heterogeneity: Report for 15 | {DOE} {ASCR} Workshop on Extreme Heterogeneity", 16 | institution = "USDOE Office of Science (SC) (United States)", 17 | year = "2018", 18 | doi = "10.2172/1473756", 19 | } 20 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/2.3.2.10-SYCL.bib: -------------------------------------------------------------------------------- 1 | @inproceedings{dpct, 2 | author={Jin, Zheming and Vetter, Jeffrey}, 3 | booktitle={2021 IEEE International Parallel and Distributed Processing Symposium Workshops (IPDPSW)}, 4 | title={Evaluating CUDA Portability with HIPCL and DPCT}, 5 | year={2021}, 6 | pages={371-376}, 7 | doi={10.1109/IPDPSW52791.2021.00065} 8 | } 9 | 10 | @inproceedings{reduction, 11 | author = {Jin, Zheming and Vetter, Jeffrey}, 12 | title = {Evaluating the Performance of Integer Sum Reduction in SYCL on GPUs}, 13 | year = {2021}, 14 | isbn = {9781450384414}, 15 | publisher = {Association for Computing Machinery}, 16 | address = {New York, NY, USA}, 17 | url = {https://doi.org/10.1145/3458744.3473360}, 18 | doi = {10.1145/3458744.3473360}, 19 | booktitle = {50th International Conference on Parallel Processing Workshop}, 20 | articleno = {34}, 21 | numpages = {8}, 22 | keywords = {SYCL, OpenCL, Reduction, GPGPU, CUDA}, 23 | location = {Lemont, IL, USA}, 24 | series = {ICPP Workshops '21} 25 | } 26 | 27 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/2.3.2.10-SYCL.tex: -------------------------------------------------------------------------------- 1 | \subsubsection{\stid{2.10} PROTEAS-TUNE - SYCL}\label{s:sycl} 2 | 3 | \paragraph{Overview} 4 | OpenCL is an open standard maintained by the Khronos group. 
It offers programming portability across a wide range of software and hardware for graphics processing units (GPUs), multi-core processors (CPUs), and other accelerators. As opposed to the OpenCL programming model in which host and device codes are written in two languages, the SYCL standard specifies a cross-platform abstraction layer that enables programming of heterogeneous computing systems using standard C++. It can combine host and device codes for an application in a type-safe way to improve development productivity. SYCL is a promising programming model for exascale computing. The relevant topics are migration from CUDA only to SYCL, performance and expressiveness of SYCL programs, maturity of SYCL compilers, and access to SYCL programs. 5 | 6 | 7 | The PROTEAS-TUNE objectives for SYCL are as follows: 8 | \begin{enumerate} 9 | \item Develop a SYCL suite comprised of kernels from open-source benchmarks and from scientific and machine learning applications 10 | \item Evaluate the performance of these kernels with contemporary SYCL implementations on heterogeneous computing platforms 11 | \item Understand the impacts of SYCL compilers and computing platforms upon the performance gaps of these kernels 12 | \item Propose SYCL features that can improve functional and performance portability 13 | \item Engage with vendors, facilities, universities, and communities for the development of SYCL applications and compilers 14 | \end{enumerate} 15 | 16 | 17 | 18 | \paragraph{Key Challenges} 19 | Acknowledging CUDA's established presence in high-performance computing, SYCL has been striving for a portability-enhancing path for a wider set of platforms. While SYCL can achieve functional portability, it does not solve performance portability. To address the challenge, understanding the applications, programming models, SYCL features, SYCL compilers, and the architectures of heterogeneous computing platforms is critical. There are many scientific and AI applications. 
Major programming models for the target platforms are CUDA, HIP, OpenMP, and SYCL. Major SYCL features are extension to OpenCL C, single source, USM and buffer styles, and asynchronous programming. Major SYCL compilers are DPC++ with OpenCL and Level Zero backends, DPC++ with CUDA and HIP support, hipSYCL, and ComputeCpp. AMD, Intel, and Nvidia GPUs are different in their computing architectures. CPUs, GPUs, and FPGAs have fundamentally different architectures. The combination of applications, languages, features, toolchains, and architectures will characterize the performance of a SYCL program. 20 | 21 | 22 | \paragraph{Solution Strategy} 23 | To mitigate these challenges, the team proposes the following actions for each effort. 24 | \begin{itemize} 25 | \item Develop a diverse set of SYCL programs with compute- and memory-bound kernels for performance analysis 26 | \item Have a good understanding of the characteristics of these programs 27 | \item Evaluate the performance of SYCL programs with the latest SYCL compilers on computing platforms 28 | \item Analyze the performance of SYCL kernels through performance profilers 29 | \item Identify and summarize these performance differences 30 | \item Engage with SYCL compiler developers to fix bugs and improve kernel performance 31 | \item Collaborate with PROTEAS teams and SYCL developers on performance optimization and tuning 32 | \end{itemize} 33 | 34 | 35 | \paragraph{Recent Progress} 36 | Recent progress in this area includes several key developments listed below. 
37 | \begin{itemize} 38 | \item Investigated the use of vendor and academic conversion tools by evaluating CUDA portability with HIPCL and DPCT \cite{dpct} 39 | \item Investigated the performance of integer sum reduction in SYCL and CUDA on GPUs \cite{reduction} 40 | \item Developing 200+ SYCL programs in the open-source GitHub repository (\url{https://github.com/zjin-lcf/HeCBench.git}) 41 | \end{itemize} 42 | 43 | 44 | \paragraph{Next Steps} 45 | The following efforts have been identified for the next phase of the project. 46 | \begin{itemize} 47 | \item Continue developing SYCL programs with codes of interest to ECP 48 | \item Evaluate kernel performance with SYCL compilers on target platforms 49 | \item Analyze the performance of SYCL kernels through performance profilers 50 | \item Sum up the optimization techniques for SYCL kernels on target platforms 51 | \item Engage with SYCL developers to fix bugs and improve performance and portability 52 | \item Support compiler installation, feature requests, and bug reporting for ECP users 53 | \end{itemize} 54 | 55 | %eof 56 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/2.3.2.10-TAU.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 
2 | 3 | @misc{vampir.eu, 4 | title = "Vampir", 5 | author = "GWT-TUD GmbH", 6 | howpublished = "\url{https://vampir.eu}", 7 | year = 2020, 8 | note = "Accessed: 2020-10-15" 9 | } 10 | 11 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/Bricks-mpi-parts.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/Bricks-mpi-parts.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/YTune-searchtree.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/YTune-searchtree.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/YTune-solution.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/YTune-solution.jpg -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/YTune-solution.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/YTune-solution.png -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/clacc.png: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/clacc.png -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/clacc_tau.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/clacc_tau.png -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/miniFE_openmp_tau.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/miniFE_openmp_tau.png -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/papyrus-fig.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/papyrus-fig.jpg -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/papyrus-fig_orig.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/papyrus-fig_orig.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/papyrus-meraculous-eval.pdf: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/papyrus-meraculous-eval.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/papyrus-meraculous.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/papyrus-meraculous.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/tau-3d-candle.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/tau-3d-candle.png -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/tau-3d.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/tau-3d.jpg -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/tau-3d_orig.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/tau-3d_orig.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/tau-papyruskv.png: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.10-PROTEAS-YTUNE/tau-papyruskv.png -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/2.3.2.11-SOLLVE-BOLT.bib: -------------------------------------------------------------------------------- 1 | @INPROCEEDINGS{ccgrid, 2 | author={H. V. Dang and S. Seo and A. Amer and P. Balaji}, 3 | booktitle={2017 17th {IEEE/ACM} International Symposium on Cluster, Cloud and Grid Computing ({CCGRID})}, 4 | title={Advanced Thread Synchronization for Multithreaded MPI Implementations}, 5 | year={2017}, 6 | volume={}, 7 | number={}, 8 | pages={314-324}, 9 | keywords={concurrency control;message passing;multi-threading;open systems;resource allocation;synchronisation;MPI resource;active threads;communication progress;concurrent multithreaded;cooperative progress model;data locality;first-in-first-out arbitration;hybrid MPI applications;interoperability;locality-preserving lock;message passing interface;multithreaded MPI;ownership passing;residual wasted resource acquisitions;thread synchronization;waiting threads;Benchmark testing;Context;Message systems;Production;Safety;Synchronization;Yarn;MPI;OpenMP;lock;mutex;synchronization;thread safety;threads}, 10 | doi={10.1109/CCGRID.2017.65}, 11 | ISSN={}, 12 | month={May},} 13 | 14 | 15 | 16 | 17 | @article{ppopp, 18 | author = {Amer, Abdelhalim and Lu, Huiwei and Wei, Yanjie and Balaji, Pavan and Matsuoka, Satoshi}, 19 | title = {MPI+Threads: Runtime Contention and Remedies}, 20 | journal = {SIGPLAN Not.}, 21 | issue_date = {August 2015}, 22 | volume = {50}, 23 | number = {8}, 24 | month = jan, 25 | year = {2015}, 26 | issn = {0362-1340}, 27 | pages = {239--248}, 28 | numpages = {10}, 29 | url = {http://doi.acm.org/10.1145/2858788.2688522}, 30 | doi = {10.1145/2858788.2688522}, 31 | acmid = {2688522}, 32 | publisher = {ACM}, 33 | address = 
{New York, NY, USA}, 34 | keywords = {MPI, critical section, runtime contention, threads}, 35 | } 36 | 37 | @article{amer2018, 38 | title={Lock Contention Management in Multithreaded MPI}, 39 | author={Amer, Abdelhalim and Chabbi, Milind and Lu, Huiwei and 40 | Wei, Yanjie and Hammond, Jeff and Matsuoka, Satoshi and Balaji, Pavan}, 41 | journal={ACM Transactions on Parallel Computing}, 42 | year={2018}, 43 | publisher={ACM} 44 | } 45 | 46 | @inproceedings{ExaMPI20MCAThreads, 47 | author = {N. Evans and J. Ciesko and S. Olivier and H. Pritchard and S. Iwasaki and K. Raffenetti and P. Balaji}, 48 | title = {Implementing Flexible Threading Support in {Open MPI}}, 49 | booktitle={Proceedings of the Workshop on Exascale MPI in conjunction with International Conference for High Performance Computing, Networking, Storage, and Analysis (ExaMPI '20)}, 50 | year = {2020}, 51 | month = {Nov.}, 52 | } 53 | 54 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/2.3.2.11-SOLLVE-HeteroLoopSchedRTS.tex: -------------------------------------------------------------------------------- 1 | \subsubsection{\stid{2.11} OpenMP Heterogeneous Loop Scheduling Runtime Library} 2 | 3 | \paragraph{Overview} 4 | 5 | 6 | Applications running on ECP systems, DoE's exascale supercomputers, suffer from load imbalance, either due to irregularities in the applications or due to performance perturbations of the platform. To handle this load imbalance across the heterogeneous processors of a node, reactive load balancing in the form of loop scheduling is needed. 7 | SOLLVE's OpenMP loop scheduling runtime (\url{https://github.com/sollve/openmprts}) facilitates scheduling of an application's computation onto the heterogeneous processing elements of a node. These processing elements can be cores of a multi-core processor, a GPU (accelerator) of a multi-GPU (multi-accelerator) node, or a partition of a GPU (accelerator). 
Note that the xPU could also be a partition of a GPU, i.e., a sub-device. 8 | 9 | \paragraph{Key Challenges} 10 | 11 | Scheduling overheads due to queueing and data locality need to be handled when scheduling across accelerators of a node. Also, conventionally, MPI parallelizes applications across accelerators of a node. OpenMP can be used to parallelize the work across accelerators with a small but non-negligible ($\sim$8\%) overhead for a stencil computation on Summit. Using OpenMP across the entire node is advantageous because it reduces programming complexity and avoids having to think about multiple programming models to program the node. Additionally, the cost of load balancing is lower when using OpenMP instead of MPI. 12 | 13 | \paragraph{Solution Strategy} 14 | 15 | We develop a prototype runtime library, to be part of the LLVM OpenMP runtime system, that provides several multi-xPU scheduling strategies. The core strategies that we expect to provide are static, dynamic, and guided scheduling. We also allow for user-defined scheduling strategies in our library. 16 | 17 | \paragraph{Recent Progress} 18 | 19 | We have experimented with our strategy in an OpenMP offload version of AutoDock-GPU, a molecular biology code which is being used for simulations for COVID-19 therapeutics and for other molecular biology and AI/ML applications, using LLVM 12 and LLVM 13 on one node of the Spock system. Results obtained on one GPU of a node of Spock (Figure~\ref{fig:llvmadspck}) show that LLVM 13’s (rocm4.5) OpenMP improves the performance of AutoDock-GPU over LLVM 12’s (rocm4.2) OpenMP by 14.28\% for the largest problem size, the 3er5 ligand. The LLVM OpenMP implementation has a significant impact for large problem sizes. 
Figure~\ref{fig:mgpuSpock} shows results for strategies for an OpenMP parallelization of AutoDock-GPU (using a collection containing the three ligands in Figure~\ref{fig:llvmadspck}) across the 4 GPUs of Spock, specifically showing the impact of a dynamic load balancing strategy across multiple GPUs of the node. The round-robin scheduler under LLVM 13’s OpenMP (rocm4.5) improves performance over the round-robin scheduler in LLVM 12’s OpenMP (rocm4.2) by 39\%. This is much more significant than the performance gain of 14.28\% seen in Figure~\ref{fig:llvmadspck}. Under LLVM 13’s OpenMP (rocm4.5), using a random schedule (OpenMP chunks of a loop are assigned to a randomly chosen GPU) as opposed to a round-robin scheduler (OpenMP chunks are assigned to a GPU based on chunk number) improves performance by 30\%. By using the newer LLVM 13 over LLVM 12 and using appropriate load balancing across GPUs, the performance of the AutoDock-GPU code improves by a total of 57.24\%. 20 | 21 | 22 | \begin{figure}[h!] 23 | \centering 24 | \includegraphics[scale=0.2]{projects/2.3.2-Tools/2.3.2.11-SOLLVE/AutoDockGPU-problemszLLVMOMP.pdf} 25 | \caption{Running AutoDock-GPU on Spock with LLVM's OpenMP.} 26 | \label{fig:llvmadspck} 27 | \end{figure}\begin{figure}[h!] 
28 | \centering 29 | \includegraphics[scale=0.2]{projects/2.3.2-Tools/2.3.2.11-SOLLVE/Impact-lb-LLVMOpenMP-Spock.pdf} 30 | \caption{Impact of OpenMP multi-xPU scheduling strategies on Spock with LLVM's OpenMP.} 31 | \label{fig:mgpuSpock} 32 | \end{figure} 33 | 34 | \paragraph{Next Steps} 35 | 36 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/2.3.2.11-SOLLVE-LLVM_enhancement.bib: -------------------------------------------------------------------------------- 1 | @inproceedings{barua2019ompsan, 2 | title={OMPSan: static verification of OpenMP’s data mapping constructs}, 3 | author={Barua, Prithayan and Shirako, Jun and Tsang, Whitney and Paudel, Jeeva and Chen, Wang and Sarkar, Vivek}, 4 | booktitle={International Workshop on OpenMP}, 5 | pages={3--18}, 6 | year={2019}, 7 | organization={Springer} 8 | } 9 | 10 | @inproceedings{barua2020ompmemopt, 11 | title={OmpMemOpt: Optimized Memory Movement for Heterogeneous Computing}, 12 | author={Barua, Prithayan and Zhao, Jisheng and Sarkar, Vivek}, 13 | booktitle={European Conference on Parallel Processing}, 14 | pages={200--216}, 15 | year={2020}, 16 | organization={Springer} 17 | } 18 | 19 | @inproceedings{yu2021arbalest, 20 | title={ARBALEST: Dynamic Detection of Data Mapping Issues in Heterogeneous OpenMP Applications}, 21 | author={Yu, Lechen and Protze, Joachim and Hernandez, Oscar and Sarkar, Vivek}, 22 | booktitle={2021 IEEE International Parallel and Distributed Processing Symposium (IPDPS)}, 23 | pages={464--474}, 24 | year={2021}, 25 | organization={IEEE} 26 | } 27 | 28 | @inproceedings{yu2020study, 29 | title={A Study of Memory Anomalies in OpenMP Applications}, 30 | author={Yu, Lechen and Protze, Joachim and Hernandez, Oscar and Sarkar, Vivek}, 31 | booktitle={International Workshop on OpenMP}, 32 | pages={328--342}, 33 | year={2020}, 34 | organization={Springer} 35 | } 36 | 37 | @inproceedings{atzeni2016archer, 38 | title={ARCHER: 
effectively spotting data races in large OpenMP applications}, 39 | author={Atzeni, Simone and Gopalakrishnan, Ganesh and Rakamaric, Zvonimir and Ahn, Dong H and Laguna, Ignacio and Schulz, Martin and Lee, Gregory L and Protze, Joachim and M{\"u}ller, Matthias S}, 40 | booktitle={2016 IEEE international parallel and distributed processing symposium (IPDPS)}, 41 | pages={53--62}, 42 | year={2016}, 43 | organization={IEEE} 44 | } 45 | 46 | @INPROCEEDINGS{OpenMPEncoding, 47 | title={{Efficient Execution of OpenMP on GPUs}}, 48 | booktitle={{Code Generation and Optimizations (CGO)}}, 49 | author={{J. Huber, M. Cornelius, G. Georgakoudis, S. Tian, J. Diaz, K. Dinel, B. Chapman, \underline{J. Doerfert}}}, 50 | year=2022, 51 | pubstate={toappear}, 52 | } 53 | @INPROCEEDINGS{NewOpenMPRT, 54 | title={{Co-Designing an OpenMP GPU Runtime and Optimizations for Near-Zero Overhead Execution}}, 55 | booktitle={{International Parallel Distributed Processing Symposium (IPDPS)}}, 56 | year=2022, 57 | author={{\underline{J. Doerfert}, A. Patel, S. Tian, J. Huber, J. Diaz, B. Chapman, G. Georgakoudis}}, 58 | pubstate={toappear}, 59 | } 60 | 61 | @inproceedings{RS_Tramm_2014, 62 | author="Tramm, John R. and Siegel, Andrew R. 
and Forget, Benoit and Josey, Colin", 63 | title="Performance Analysis of a Reduced Data Movement Algorithm for Neutron Cross Section Data in Monte Carlo Simulations", 64 | booktitle = {{EASC} 2014 - Solving Software Challenges for Exascale}, 65 | address = {Stockholm}, 66 | year = "2014", 67 | url = "https://doi.org/10.1007/978-3-319-15976-8_3" 68 | } 69 | 70 | @inproceedings{XS_Tramm_2014, 71 | author = {Tramm, John R and Siegel, Andrew R and Islam, Tanzima and Schulz, Martin}, 72 | title = {{XSBench} - The Development and Verification of a Performance Abstraction for {M}onte {C}arlo Reactor Analysis}, 73 | booktitle = {{PHYSOR} 2014 - The Role of Reactor Physics toward a Sustainable Future}, 74 | address = {Kyoto}, 75 | year = 2014, 76 | url = "https://www.mcs.anl.gov/papers/P5064-0114.pdf" 77 | } 78 | 79 | @article{romano2013openmc, 80 | title={The OpenMC monte carlo particle transport code}, 81 | author={Romano, Paul K and Forget, Benoit}, 82 | journal={Annals of Nuclear Energy}, 83 | volume={51}, 84 | pages={274--281}, 85 | year={2013}, 86 | publisher={Elsevier} 87 | } 88 | 89 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/2.3.2.11-SOLLVE-LLVM_enhancement.tex: -------------------------------------------------------------------------------- 1 | \subsubsection{\stid{2.11} Building tools to detect and debug bugs and performance issues with OMP offloading} 2 | 3 | \paragraph{Overview} 4 | Starting from the 4.0 version, OpenMP has introduced a new feature, target offloading, which enables programmers to leverage additional computing devices connected to the host (e.g., GPU, application-specific accelerator). 5 | With a group of hardware-agnostic constructs (device directives), target offloading makes it possible to write accelerated OpenMP applications in a performance-portable manner. 
However, concurrency bugs and performance issues may still arise due to incorrect usage of device directives. 6 | Our group at Georgia Tech has conducted a comprehensive study of such issues~\cite{yu2020study}. We found that most of these issues are related to the data mappings between the host and target device. 7 | For example, incorrect data mappings can lead to uninitialized memory accesses or even buffer overflow on the target device. In addition, programmers may also declare data mappings that incur unnecessary time and memory overhead due to redundant copies. 8 | 9 | To help programmers detect and debug these concurrency bugs and performance issues, we have developed a toolset for OpenMP applications: 10 | \begin{itemize} 11 | \item OMPSan~\cite{barua2019ompsan} is a static analyzer that can report all suspicious data mappings that may lead to concurrency bugs and memory issues; 12 | \item ARBALEST~\cite{yu2021arbalest} is a dynamic analyzer that can pinpoint incorrect data mappings that result in concurrency bugs or memory issues at runtime; 13 | \item OmpMemOpt~\cite{barua2020ompmemopt} is a static optimizer that identifies redundant data mappings and replaces them with more efficient data mappings. 14 | \end{itemize} 15 | 16 | \paragraph{Key Challenges} 17 | With respect to incorrect data mappings, multiple kinds of bugs may arise at runtime, such as use of uninitialized memory, use of stale data, buffer overflow, and data races. Currently, there exists no single tool that can recognize all of these kinds of bugs. 18 | Even if programmers apply multiple analysis tools when testing a single OpenMP application, some incorrect data mappings may still be missed since they may only trigger bugs in a specific thread interleaving. 19 | On the other hand, detecting redundant data mappings may also be challenging. OpenMP utilizes a reference-count algorithm to manage the lifecycle of each data mapping. Memory transfer is only carried out when a data mapping is first encountered. 
20 | The analysis tool needs to correctly model this reference-count-based mechanism and all memory accesses related to data mappings to determine whether a data mapping is redundant. 21 | 22 | \paragraph{Solution Strategy} 23 | As a static analysis tool, OMPSan~\cite{barua2019ompsan} compares the def-use information in an OpenMP application with the application's serial-elision version. OMPSan assumes that the serial-elision version contains the correct def-use information. Any inconsistent def-use chain incurred by data mappings can be statically reported as a potential bug. 24 | 25 | ARBALEST is a dynamic analysis tool designed for detecting incorrect data mappings. It is an extension to the Archer data race detector~\cite{atzeni2016archer}. ARBALEST leverages a state-transition diagram to record the state of each data mapping, i.e., whether the memory section on the host/target device has a valid value. ARBALEST also utilizes the happens-before relations maintained by Archer to detect conflicting memory accesses when the runtime conducts memory transfer for a data mapping. 26 | According to the evaluation in~\cite{yu2021arbalest}, ARBALEST can accurately identify all incorrect data mappings with acceptable time and memory overhead. 27 | 28 | OmpMemOpt~\cite{barua2020ompmemopt} is a static optimizer that can generate optimal data mappings for an OpenMP application. 29 | The optimization framework in OmpMemOpt casts the problem of detection and removal of redundant data movements into a partial redundancy elimination (PRE) problem and applies 30 | the lazy code motion technique to optimize these data movements. 31 | The evaluation on ten benchmarks shows that OmpMemOpt achieved a geometric-mean speedup of 2.3x and reduced the total bytes transferred between the host and GPU by 50\% on average. 32 | 33 | \paragraph{Recent Progress} 34 | We have published a number of papers on the toolset. 
OMPSan was presented at IWOMP 2019 and received the best paper award at that workshop. The other two papers on ARBALEST and OmpMemOpt were presented at IPDPS 2021 and Euro-Par 2020 respectively. 35 | 36 | \paragraph{Next Steps} 37 | We are working with the LLVM OpenMP subcommunity to develop a new version of ARBALEST. The new implementation will be built on the latest LLVM and apply a number of optimization techniques to reduce the time overhead. In addition, we are helping improve the OpenMP Tool Interface design based on our experience of developing analysis tools. 38 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/2.3.2.11-SOLLVE-VV.bib: -------------------------------------------------------------------------------- 1 | @Misc{sollvevvgithub, 2 | howpublished = "\url{https://github.com/SOLLVE/sollve_vv/}", 3 | title = "SOLLVE OpenMP Validation and Verification Testsuite.", 4 | year = "2019", 5 | } 6 | 7 | @Misc{sollvevvwebsite, 8 | howpublished = "\url{https://crpl.cis.udel.edu/ompvvsollve/}", 9 | title = "SOLLVE OpenMP Validation and Verification Website.", 10 | year = "2019", 11 | } 12 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/2.3.2.11-SOLLVE-VV.tex: -------------------------------------------------------------------------------- 1 | \subsubsection{\stid{2.11} Validation and Verification Testsuite} 2 | 3 | \paragraph{Overview} 4 | The OpenMP Validation and Verification Testsuite (OMPVV) presents the community with a test suite comprised of functional tests and application kernels that are written with the intention of verifying usability of OpenMP features. The test suite aims to accomplish several goals of equal importance. The first goal is to provide vendors with a straightforward way to examine the status of their implementations. 
The next goal is to support application developers in identifying whether their system can support the specific OpenMP features they wish to utilize. Both of these are accomplished by running the full test suite and generating a report summary, which provides the user with a simple pass-fail report for OpenMP features. These insights also include where the tests are failing (compile time or runtime) and what error was encountered. Our full suite of OpenMP tests is made publicly available on GitHub \cite{sollvevvgithub} and full documentation is available on the corresponding website \cite{sollvevvwebsite}. 5 | 6 | \paragraph{Key Challenges} 7 | Every few years, the OpenMP Architecture Review Board releases new versions of their specification. These new releases of the specification, 5.0 in November of 2018, 5.1 in November of 2020, and 5.2 in November of 2021, introduce new clauses and directives that many application developers and general users are keen on utilizing. Thus, when the updates are published, we set out to create tests for each new feature or new directive. It takes time for the compiler developers to develop implementations for several of the new features; as a result, there is a gap between the release of a specification version, the development of implementations, and the availability of those implementations to application developers. Due to this fact, we are oftentimes writing test cases for new clauses and directives even before the implementations begin to exist. This can be quite a challenge since we cannot even compile or execute them right away, so we need to revisit the test cases as soon as the implementations are made available. 8 | 9 | \paragraph{Solution Strategy} 10 | For every new specification version we begin by classifying the priority of each new feature based on input from ECP and (sometimes) CAAR application teams. We also track LLVM's OpenMP implementation status and formulate a priority list for test implementation. 
As more features are implemented by LLVM, we continue to create functional test cases and verify our own work by running the tests on several heterogeneous systems that represent multiple vendors and OpenMP compiler implementations. In previous years, we followed the same strategy for providing OpenMP 4.5 test coverage \cite{vandv2019}. 11 | 12 | \paragraph{Recent Progress} 13 | Over the past year, we have been able to provide tests (C, C++) that cover almost all of the new features introduced in OpenMP 5.0. We continue to improve our Fortran test coverage for 5.0 features as well. We periodically report the pass-fail status and individual test results on state-of-the-art systems such as Oak Ridge National Lab's Summit and Spock computing systems as well as NERSC's Cori system \cite{sollvevvwebsite}. This provides a useful tracking system for vendors and application developers alike. Also, we have created functional tests for several of the latest OpenMP 5.1 features, namely: atomic compare, C++ attribute specifier, declare variant, default first private, tiling, etc. These have been implemented by LLVM and are deemed of high importance to AD teams. 14 | 15 | \paragraph{Next Steps} 16 | We will continue C/C++ test development for the OpenMP 5.1 specification while we maintain and improve our previously developed tests and fix any issues discovered in them. We continue to follow the same strategy as we did for providing test coverage of 5.0 features. We periodically run our tests on the newest available compiler implementations that support OpenMP and maintain the results \cite{sollvevvwebsite}. Additionally, we are tracking AD teams' use of OpenMP features and incorporating application kernels in our tests that are outside the scope of individual feature tests but test a legal combination of OpenMP features that is critical for the application. 
-------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/2.3.2.11-SOLLVE-training.tex: -------------------------------------------------------------------------------- 1 | \subsubsection{\stid{2.11} Training \& Outreach in 2021}\label{subsubsect:train_outreach} 2 | 3 | \begin{enumerate} 4 | \item Annual ECP Meeting 2021 related 5 | \begin{itemize} 6 | \item \enquote{OpenMP Tutorial} by O. Hernandez, D. Oryspayev, T. Scogland, C. Bertoni, J. Doerfert, and V. Kale 7 | \item \enquote{ECP + SOLLVE COVID} 8 | \item \enquote{OpenMP Application Experiences BoF} 9 | \item \enquote{LLVM in ECP Short Stories About a Compiler Framework in HPC} 10 | \item \enquote{OpenMP Vendor BoF} 11 | \item \enquote{Session on Testing in ECP including OpenMP V\&V Suite} 12 | \item \enquote{Tutorial: Autotuning PolyBench Benchmarks with LLVM Clang/Polly Loop Optimization Pragmas Using Bayesian Optimization} 13 | \end{itemize} 14 | 15 | \item \enquote{OpenMP Users Monthly Telecons\footnote{\url{https://www.openmp.org/events/ecp-sollve-openmp-monthly-teleconference/}}} led by D. Oryspayev 16 | 17 | \item Weekly \enquote{OpenMP-in-LLVM} teleconference with DOE labs and vendors (AMD, Intel, Cray etc.) 18 | 19 | \item Biweekly \enquote{OpenMP work in Flang} teleconference with DOE labs and vendors (AMD, ARM, NVIDIA etc.) 20 | 21 | \item Hackathons 22 | 23 | \begin{itemize} 24 | \item \enquote{ECP SOLLVE + NERSC OpenMP Hackathon\footnote{\url{https://sites.google.com/view/ecpomphackjan2021/home}}}, January 22, and 27 – 29, 2021 25 | \begin{itemize} 26 | \item Organizers: C. Daley, D. Oryspayev, K. Gott, H. He, O. Hernandez, and V. Kale 27 | \end{itemize} 28 | \item \enquote{ECP OpenMP Virtual Hackathon\footnote{\url{https://www.bnl.gov/ompbrookathon2021/}}}, October 1, and 6 -8, 2021 29 | \begin{itemize} 30 | \item Organizers: D. Oryspayev, J. Doerfert, S. Chandrasekaran, S. Pophale, T. Scogland, and V. 
Kale 31 | \end{itemize} 32 | \end{itemize} 33 | 34 | \item ISC HPC'21\footnote{\url{https://www.isc-hpc.com/schedule.html}} related tutorials \& presentations 35 | \begin{itemize} 36 | \item Tutorial: \enquote{OpenMP Common Core: Learning Parallelization of Real Applications from the Ground-Up} by M. Arenaz, B. Chapman, R. Budiardja, O. Hernandez, and D. Oryspayev. 37 | \end{itemize} 38 | 39 | \item OpenMP.org Webinars 40 | \begin{itemize} 41 | \item \enquote{A Compiler's View of the OpenMP API\footnote{\url{https://www.openmp.org/events/webinar-a-compilers-view-of-the-openmp-api/}}} by J. Doerfert. 42 | \item \enquote{The Leaders of OpenMP Discuss the Future of the OpenMP API\footnote{\url{https://www.openmp.org/events/webinar-the-leaders-of-openmp-discuss-the-future-of-the-openmp-api/}}} by M. Klemm and B. de Supinski. 43 | \end{itemize} 44 | 45 | \item \enquote{Introduction to OpenMP GPU Offloading\footnote{\url{https://www.olcf.ornl.gov/calendar/introduction-to-openmp-gpu-offloading/}}} by S. Pophale, R. Budiardja, and W. Elwasif September 22 - 23, 2021 46 | 47 | \item ICPP'21 presentations: 48 | \begin{itemize} 49 | \item \enquote{Loop Transformations Using Clang’s Abstract Syntax Tree}, LLVM in Parallel Processing Workshop, by M. Kruse 50 | \end{itemize} 51 | 52 | \item SC'21\footnote{\url{https://sc21.supercomputing.org/program/}} 53 | \begin{itemize} 54 | \item OpenMP Tutorials 55 | \begin{itemize} 56 | \item \enquote{Advanced OpenMP: Host Performance and 5.1 Features} by C. Terboven, M. Klemm, R. van der Pas, B. R. de Supinski 57 | \end{itemize} 58 | \item OpenMP BoF 59 | \begin{itemize} 60 | \item \enquote{OpenMP Offloading and the 5.2 API} session led by J. Doerfert and M. Klemm 61 | \end{itemize} 62 | \item OpenMP Booth Talks 63 | \begin{itemize} 64 | \item \enquote{Behind the Pragmas} by J. Doerfert 65 | \item \enquote{Low-overhead Loop Scheduling in OpenMP} by V. Kale 66 | \item \enquote{Using OpenMP Loop Transformations with Clang} by M. 
Kruse 67 | \item \enquote{SOLLVE Validation and Verification Suite} by S. Pophale 68 | \end{itemize} 69 | \item Workshops 70 | \begin{itemize} 71 | \item \enquote{Loop Transformations Using Clang’s Abstract Syntax Tree}, LLVM-in-HPC Workshop, by M. Kruse 72 | \end{itemize} 73 | \end{itemize} 74 | 75 | 76 | \end{enumerate} 77 | 78 | 79 | 80 | 81 | 82 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/LLVM-Implementation-Figures/LLVM-opt-kernel-times.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.11-SOLLVE/LLVM-Implementation-Figures/LLVM-opt-kernel-times.jpg -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/LLVM-Implementation-Figures/t_1024.tex: -------------------------------------------------------------------------------- 1 | % This file was created by tikzplotlib v0.9.2. 
2 | \begin{tikzpicture} 3 | 4 | \begin{axis}[ 5 | axis line style={black}, 6 | xlabel={$N$}, 7 | xmin=-0.6, xmax=12.6, 8 | xlabel near ticks, 9 | xtick style={color=white!33.3333333333333!black}, 10 | xtick={0,1,2,3,4,5,6,7,8,9,10,11,12}, 11 | xticklabels={\(\displaystyle 2^4\),\(\),\(\displaystyle 2^6\),\(\),\(\displaystyle 2^8\),\(\),\(\displaystyle 2^{10}\),\(\),\(\displaystyle 2^{12}\),\(\),\(\displaystyle 2^{14}\),\(\),\(\displaystyle 2^{16}\)}, 12 | ylabel={Speedup}, 13 | ylabel near ticks, 14 | %ymin=0.202966825333382, ymax=7.6, 15 | ytick style={color=white!33.3333333333333!black}, 16 | %yticklabels={,\(\displaystyle {1.0}\),,\(\displaystyle {3.0}\),,\(\displaystyle {5.0}\),,\(\displaystyle {7.0}\),\(\displaystyle {8.0}\)}, 17 | ymode=log, 18 | log basis y={2}, 19 | ymin=0.3, ymax=8.5, 20 | ytick={0.5,1,2,4,8}, 21 | log ticks with fixed point, 22 | yticklabel pos=right, 23 | width=\textwidth, 24 | height=0.6\textwidth, 25 | title={$T=1024$}, 26 | title style={below right,at={(0.05,0.9)}} 27 | ] 28 | \addplot [semithick, mark=otimes] 29 | table {% 30 | 0 1.54172560113154 31 | 1 1.65860215053763 32 | 2 1.59782608695652 33 | 3 2.03624161073826 34 | 4 3.17523056653491 35 | 5 3.96593673965937 36 | 6 5.32525951557093 37 | 7 6.72148541114058 38 | 8 6.2743450321305 39 | 9 3.42638125542378 40 | 10 2.32380177063193 41 | 11 1.40163487155345 42 | 12 1.29789579295094 43 | }; 44 | % \addlegendentry{B1} 45 | \addplot [semithick, mark=square] 46 | table {% 47 | 0 0.513372472276582 48 | 1 0.547333333333333 49 | 2 0.599075297225892 50 | 3 0.550828729281768 51 | 4 0.57201646090535 52 | 5 0.835728952772074 53 | 6 1.43811764705882 54 | 7 2.48555411815438 55 | 8 3.56691152986266 56 | 9 2.76931747025673 57 | 10 2.24389385867926 58 | 11 1.37479676536026 59 | 12 1.28436651244046 60 | }; 61 | % \addlegendentry{B2} 62 | \addplot [semithick, mark=x] 63 | table {% 64 | 0 3.30685203574975 65 | 1 2.79770114942529 66 | 2 3.30263157894737 67 | 3 2.75550891920252 68 | 4 2.48282630029441 69 
| 5 3.44634377967711 70 | 6 3.23179190751445 71 | 7 2.64840182648402 72 | 8 2.59288461538462 73 | 9 1.89490421158768 74 | 10 1.7509535977484 75 | 11 1.34198274819622 76 | 12 1.29377530790229 77 | }; 78 | % \addlegendentry{B3} 79 | \addplot [semithick, mark=*] 80 | table {% 81 | 0 0.833864844343204 82 | 1 1.06823060410917 83 | 2 1.30601343101343 84 | 3 1.40609367894497 85 | 4 1.4334323922734 86 | 5 1.77639399943391 87 | 6 2.22291134622401 88 | 7 1.9573504027618 89 | 8 1.64384220061375 90 | 9 1.46215812497777 91 | 10 1.27950960037583 92 | 11 1.14186188461619 93 | 12 1.07420840134936 94 | }; 95 | % \addlegendentry{B4} 96 | \addplot[gray, dashed] coordinates {(-1,1) (13,1)}; 97 | \end{axis} 98 | 99 | \end{tikzpicture} 100 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/LLVM-Implementation-Figures/t_256.tex: -------------------------------------------------------------------------------- 1 | % This file was created by tikzplotlib v0.9.2. 
2 | \begin{tikzpicture} 3 | 4 | \begin{axis}[ 5 | axis line style={black}, 6 | xlabel={$N$}, 7 | xlabel near ticks, 8 | xmin=-0.6, xmax=12.6, 9 | xtick style={color=white!33.3333333333333!black}, 10 | xtick={0,1,2,3,4,5,6,7,8,9,10,11,12}, 11 | xticklabels={\(\displaystyle 2^4\),\(\),\(\displaystyle 2^6\),\(\),\(\displaystyle 2^8\),\(\),\(\displaystyle 2^{10}\),\(\),\(\displaystyle 2^{12}\),\(\),\(\displaystyle 2^{14}\),\(\),\(\displaystyle 2^{16}\)}, 12 | ylabel={Speedup}, 13 | ylabel near ticks, 14 | ytick style={color=white!33.3333333333333!black}, 15 | %ytick={0,1,2,3,4,5,6}, 16 | %yticklabels={,\(\displaystyle {1.0}\),,\(\displaystyle {3.0}\),,\(\displaystyle {5.0}\),}, 17 | %ymin=0.361127455148372, ymax=5.51707532158344, 18 | ymin=0.3, ymax=8.5, 19 | ymode=log, 20 | log basis y={2}, 21 | ytick={0.5,2,4,8}, 22 | log ticks with fixed point, 23 | width=\textwidth, 24 | height=0.6\textwidth, 25 | title={$T=256$}, 26 | title style={below right,at={(0.05,0.9)}} 27 | ] 28 | \addplot [semithick, mark=otimes] 29 | table {% 30 | 0 1.11147540983607 31 | 1 1.16501650165017 32 | 2 1.37581699346405 33 | 3 2.05629139072848 34 | 4 2.21710526315789 35 | 5 2.60615384615385 36 | 6 3.12078651685393 37 | 7 4.57857142857143 38 | 8 5.2827140549273 39 | 9 3.32571109871723 40 | 10 2.28499799438428 41 | 11 1.40641665600068 42 | 12 1.29619187709406 43 | }; 44 | % \addlegendentry{B1} 45 | \addplot [semithick, mark=square] 46 | table {% 47 | 0 0.610244988864143 48 | 1 0.620842572062084 49 | 2 0.686666666666667 50 | 3 0.611408199643494 51 | 4 0.595488721804511 52 | 5 0.698653198653199 53 | 6 0.995929443690638 54 | 7 2.06111111111111 55 | 8 3.21023359288098 56 | 9 2.18633540372671 57 | 10 1.99912018300194 58 | 11 1.38082448735985 59 | 12 1.28262231666122 60 | }; 61 | % \addlegendentry{B2} 62 | \addplot [semithick, mark=x] 63 | table {% 64 | 0 2.04658385093168 65 | 1 2.55905511811024 66 | 2 2.58680555555556 67 | 3 2.4 68 | 4 2.74642857142857 69 | 5 2.88562091503268 70 | 6 3.40054495912806 71 
| 7 2.83580080753701 72 | 8 2.70911949685535 73 | 9 1.74132043255549 74 | 10 1.58726097495287 75 | 11 1.32766260484254 76 | 12 1.2893861343636 77 | }; 78 | % \addlegendentry{B3} 79 | \addplot [semithick, mark=*] 80 | table {% 81 | 0 0.714707329070339 82 | 1 0.899248120300752 83 | 2 1.03947368421053 84 | 3 1.18948412698413 85 | 4 1.09095002251238 86 | 5 1.46853146853147 87 | 6 2.03842794759825 88 | 7 1.84909727836163 89 | 8 1.61319515399212 90 | 9 1.45761636107193 91 | 10 1.29182463005992 92 | 11 1.13366620453858 93 | 12 1.06254475718846 94 | }; 95 | % \addlegendentry{B4} 96 | \addplot[gray, dashed] coordinates {(-1,1) (13,1)}; 97 | \end{axis} 98 | 99 | \end{tikzpicture} 100 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/LLVM-opt-kernel-times.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.11-SOLLVE/LLVM-opt-kernel-times.jpg -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/SOLLVE-ARGOBOTS.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.11-SOLLVE/SOLLVE-ARGOBOTS.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/SOLLVE-BOLT.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.11-SOLLVE/SOLLVE-BOLT.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/SOLLVE-progress.pdf: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.11-SOLLVE/SOLLVE-progress.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/mgpu-Spock.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.11-SOLLVE/mgpu-Spock.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/multi_gpu_spock.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.11-SOLLVE/multi_gpu_spock.png -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/multi_gpu_spock2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.11-SOLLVE/multi_gpu_spock2.png -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/one_gpu_spock.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.11-SOLLVE/one_gpu_spock.png -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/onegpu-Spock.pdf: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.11-SOLLVE/onegpu-Spock.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/sollve-figure-ecp-car-source-empty.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.11-SOLLVE/sollve-figure-ecp-car-source-empty.pptx -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/text-for-sollve-progress-diagram.txt: -------------------------------------------------------------------------------- 1 | # Application Requirements 2 | - OpenMP Hackathons: application teams include QMCPACK, GridQCD, GAMESS, Kokkos, Force-of-nature 3 | - In-depth engagement with application teams using OpenMP, particularly those using LLVM's OpenMP 4 | - OpenMP Performance benchmarks for assessing feature performance in OpenMP implementations 5 | - Contributions to DoE LLVM Spack package 6 | 7 | # Specification Evolution 8 | - Fall 2021 OpenMP virtual Face-to-Face Meeting 9 | - Release of OpenMP 5.2 Specification (Nov. 2021) with new OpenMP 5.0 Examples and clarifications in the Specification to improve implementation of the OpenMP Spec, particularly for OpenMP offload features 10 | 11 | # Compiler 12 | 13 | # Runtime Systems 14 | - Improved BOLT 1.0 runtime with features for nested parallelism and MPI+OpenMP interoperability, integrated into the LLVM OpenMP implementation. 15 | - Prototype runtime library for OpenMP task and loop scheduling strategies on multicore processors of ECP Systems 16 | - Prototype runtime library for OpenMP task-to-device scheduling on heterogeneous processors that provides adaptivity based on state, e.g., occupancies, load, of GPUs. 
17 | 18 | # Verification and Validation -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/tiling.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.11-SOLLVE/tiling.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.11-SOLLVE/unroll.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.11-SOLLVE/unroll.pdf -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.12-Flang/2.3.2.12-Flang.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 2 | @book{adams-fortran-95-handbook, 3 | title={{Fortran 95 Handbook Complete ISO/ANSI Reference}}, 4 | author={Adams, Jeanne C. and Brainerd, Walter S. and Martin, Jeanne T and Smith, Brian T. and Wagener, Jerrold L.}, 5 | year={1997}, 6 | publisher={The MIT Press} 7 | } 8 | 9 | @book{adams-fortran-2003-handbook, 10 | title={{Fortran 2003 Handbook: The Complete Syntax, Features and Procedures}}, 11 | author={Adams, Jeanne C. and Brainerd, Walter S. and Hendrickson, Richard A. and Maine, Richard E. 
and Martin, Jeanne T and Smith, Brian T.}, 12 | year={2009}, 13 | publisher={Springer} 14 | } 15 | 16 | @techreport{ansi-fortran-1977, 17 | title= {{American National Standard Programming Language FORTRAN}}, 18 | year = 1978, 19 | author = {ANSI X3} 20 | } 21 | 22 | @techreport{iso-fortran-1991, 23 | type = {Standard}, 24 | key = {ISO/IEC 1539-1:1991}, 25 | month = oct, 26 | year = {1991}, 27 | title = {Information technology -- {P}rogramming languages -- {F}ortran}, 28 | volume = {1991}, 29 | address = {Geneva, CH}, 30 | institution = {International Organization for Standardization}, 31 | author = {Fortran Standards Committee} 32 | } 33 | 34 | @techreport{iso-fortran-1997, 35 | type = {Standard}, 36 | key = {ISO/IEC 1539-1:1997}, 37 | month = oct, 38 | year = {1997}, 39 | title = {Information technology -- {P}rogramming languages -- {F}ortran -- {P}art 1: {B}ase language}, 40 | volume = {1997}, 41 | address = {Geneva, CH}, 42 | institution = {International Organization for Standardization}, 43 | author = {Fortran Standards Committee} 44 | } 45 | 46 | @techreport{iso-fortran-2004, 47 | type = {Standard}, 48 | key = {ISO/IEC 1539-1:2004}, 49 | month = oct, 50 | year = {2004}, 51 | title = {Information technology -- {P}rogramming languages -- {F}ortran -- {P}art 1: {B}ase language}, 52 | volume = {2004}, 53 | address = {Geneva, CH}, 54 | institution = {International Organization for Standardization}, 55 | author = {Fortran Standards Committee} 56 | } 57 | 58 | 59 | @techreport{iso-fortran-2010, 60 | type = {Standard}, 61 | key = {ISO/IEC 1539-1:2010}, 62 | month = oct, 63 | year = {2010}, 64 | title = {Information technology -- {P}rogramming languages -- {F}ortran -- {P}art 1: {B}ase language}, 65 | volume = {2010}, 66 | address = {Geneva, CH}, 67 | institution = {International Organization for Standardization}, 68 | author = {Fortran Standards Committee} 69 | } 70 | 71 | @techreport{iso-fortran-2018, 72 | type = {Standard}, 73 | key = {ISO/IEC DIS 1539-1:2018}, 74 | 
month = dec, 75 | year = {2017}, 76 | title = {{Draft International Standard -- Information technology -- Programming languages -- Fortran -- Part 1: Base language}}, 77 | volume = {{DIS} 2017}, 78 | address = {Geneva, CH}, 79 | institution = {International Organization for Standardization}, 80 | author = {Fortran Standards Committee} 81 | } 82 | 83 | @misc{llvm:homepage, 84 | title = {{LLVM} {W}eb page}, 85 | author = {{LLVM} {P}roject {T}eam}, 86 | howpublished = {\url{https://llvm.org}}, 87 | } 88 | 89 | @techreport{openmp-spec-31, 90 | author = {{OpenMP Architecture Review Board}}, 91 | keywords = {OpenMP Specification}, 92 | title = {{O}pen{MP} {A}pplication {P}rogram {I}nterface {V}ersion 3.1}, 93 | type = {Specification}, 94 | url = {http://www.openmp.org/mp-documents/OpenMP3.1.pdf}, 95 | institution = {OpenMP.org}, 96 | volume = {Version 3.1}, 97 | year = 2011 98 | } 99 | 100 | @techreport{openmp-spec-45, 101 | author = {{OpenMP Architecture Review Board}}, 102 | keywords = {OpenMP Specification}, 103 | title = {{O}pen{MP} {A}pplication {P}rogram {I}nterface {V}ersion 4.5}, 104 | type = {Specification}, 105 | url = {https://www.openmp.org/wp-content/uploads/openmp-4.5.pdf}, 106 | institution = {OpenMP.org}, 107 | volume = {Version 4.5}, 108 | year = 2015 109 | } 110 | 111 | @book{vax-fortran-4, 112 | title={Programming in VAX Fortran, Version 4.0}, 113 | author={Digital Equipment Corporation}, 114 | year={1984}, 115 | publisher={Digital Equipment Corporation} 116 | } 117 | -------------------------------------------------------------------------------- /projects/2.3.2-Tools/2.3.2.12-Flang/flang-performance.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.2-Tools/2.3.2.12-Flang/flang-performance.png -------------------------------------------------------------------------------- 
/projects/2.3.3-MathLibs/2.3.3-MathLibs.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 2 | -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.01-xSDK/xsdk-0.6.0.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.01-xSDK/xsdk-0.6.0.png -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.01-xSDK/xsdk-examples-diagram.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.01-xSDK/xsdk-examples-diagram.png -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.01-xSDK/xsdk-machinebalance.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.01-xSDK/xsdk-machinebalance.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.06-PETSc-TAO/2.3.3.06-PETSc-TAO.bib: -------------------------------------------------------------------------------- 1 | 2 | @techreport{petsc-man, 3 | title={{PETSc Users Manual Revision 3.14}}, 4 | author={S. Balay and S. Abhyankar and M. Adams and J. Brown and P. Brune and K. Buschelman and L. Dalcin and A. Dener and V. Eijkhout and W. Gropp and D. Karpeyev and D. Kaushik and M. Knepley and D. May and L. Curfman McInnes and R. Mills and T. Munson and K. Rupp and P. Sanan and B. Smith and S. Zampini and H. Zhang and H. 
Zhang}, 5 | type={Technical Memorandum}, 6 | number={ANL-95/11 Rev. 3.14}, 7 | institution={Argonne National Laboratory}, 8 | year={2020}, 9 | } 10 | 11 | @techreport{tao-man, 12 | title={{TAO 3.14 Users Manual}}, 13 | author={A. Dener and A. Denchfield and T. Munson and J. Sarich and S. Wild and S. Benson and L. Curfman McInnes}, 14 | type={Technical Memorandum}, 15 | number={ANL/MCS-TM-322 Rev. 3.14}, 16 | institution={Argonne National Laboratory}, 17 | year={2020}, 18 | } 19 | 20 | @misc{petsc:homepage, 21 | author = "{PETSc/TAO} Team", 22 | title = "{PETSc/TAO} Website", 23 | howpublished = {\url{https://www.mcs.anl.gov/petsc}} 24 | } 25 | 26 | @article{mills2021toward, 27 | title={Toward performance-portable {PETSc} for {GPU}-based exascale systems}, 28 | author={Mills, Richard Tran and Adams, Mark F and Balay, Satish and Brown, Jed and Dener, Alp and Knepley, Matthew and Kruger, Scott E and Morgan, Hannah and Munson, Todd and Rupp, Karl and others}, 29 | journal={Parallel Computing}, 30 | pages={102831}, 31 | year={2021}, 32 | publisher={Elsevier} 33 | } 34 | 35 | @article{zhang2021petscsf, 36 | title={The {PetscSF} Scalable Communication Layer}, 37 | author={Zhang, Junchao and Brown, Jed and Balay, Satish and Faibussowitsch, Jacob and Knepley, Matthew and Marin, Oana and Mills, Richard Tran and Munson, Todd and Smith, Barry F and Zampini, Stefano}, 38 | journal={IEEE Transactions on Parallel and Distributed Systems}, 39 | year={2021}, 40 | publisher={IEEE} 41 | } 42 | 43 | @article{hudson2021libensemble, 44 | title={{libEnsemble}: {A} Library to Coordinate the Concurrent Evaluation of Dynamic Ensembles of Calculations}, 45 | author={Hudson, Stephen and Larson, Jeffrey and Navarro, John-Luke and Wild, Stefan}, 46 | journal={IEEE Transactions on Parallel and Distributed Systems}, 47 | year={2021}, 48 | publisher={IEEE} 49 | } 50 | 51 | -------------------------------------------------------------------------------- 
/projects/2.3.3-MathLibs/2.3.3.06-PETSc-TAO/petsc_arch.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.06-PETSc-TAO/petsc_arch.png -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.06-PETSc-TAO/petsc_perf.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.06-PETSc-TAO/petsc_perf.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.07-STRUMPACK-SuperLU/2.3.3.07-STRUMPACK-SuperLU.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 2 | @misc{AWPM2018, 3 | author = {A. Azad and A. Buluc and X.S. Li and X. Wang and J. Langguth}, 4 | title = {A distributed-memory approximation algorithm for maximum weight 5 | perfect bipartite matching}, 6 | note = {available via \url{https://arxiv.org/abs/1801.09809}}, 7 | month = {January}, 8 | year = {2018}, 9 | } 10 | 11 | @inproceedings{LiuTriSolve2018, 12 | author = {Y. Liu and M. Jacquelin and P. Ghysels and X.S. Li}, 13 | title = {Highly scalable distributed-memory sparse triangular 14 | solution algorithms}, 15 | booktitle = {Proceedings of the SIAM Workshop on Combinatorial 16 | Scientific Computing}, 17 | address = {Bergen, Norway}, 18 | year = {2018}, 19 | month = {June 6--8} 20 | } 21 | 22 | @inproceedings{ghysels2017-ipdps, 23 | author = {P. Ghysels and C. Gorman and X.S. Li and F.-H. 
Rouet}, 24 | title = {A robust and scalable preconditioner for indefinite systems using 25 | hierarchical matrices and randomized sampling}, 26 | booktitle = {{Proceedings of IEEE International Parallel \& Distributed 27 | Processing Symposium (IPDPS)}}, 28 | month = {May 29 - June 2}, 29 | year = {2017}, 30 | address = {Orlando, USA} 31 | } 32 | 33 | @inproceedings{sao2018, 34 | author = {P. Sao and R. Vuduc and X.S. Li}, 35 | title = {A Communication-Avoiding 3D Factorization for Sparse Matrices}, 36 | booktitle = {32nd IEEE International Parallel \& Distributed Processing 37 | Symposium (IPDPS)}, 38 | address = {Vancouver, Canada}, 39 | year = {2018}, 40 | month = {May 21-25} 41 | } 42 | 43 | @inbook{Sptrsv-nvshmem, 44 | author = { Nan Ding and Yang Liu and Samuel Williams and Xiaoye S. Li }, 45 | title = {A Message-Driven, Multi-GPU Parallel Sparse Triangular Solver}, 46 | booktitle = {Proceedings of the 2021 SIAM Conference on Applied and Computational 47 | Discrete Algorithms (ACDA21)}, 48 | chapter = {}, 49 | pages = {147-159}, 50 | doi = {10.1137/1.9781611976830.14}, 51 | URL = {https://epubs.siam.org/doi/abs/10.1137/1.9781611976830.14}, 52 | eprint = {https://epubs.siam.org/doi/pdf/10.1137/1.9781611976830.14} 53 | } 54 | 55 | @article{ghyselsSTRUMPACKGPU, 56 | author={Ghysels, Pieter and Synk, Ryan}, 57 | title={{High performance sparse multifrontal solvers on modern GPUs}}, 58 | journal={Submitted to the Special Issue A: Transitioning Libraries and Applications 59 | in Parallel Computing}, 60 | year={2021} 61 | } 62 | 63 | -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.07-STRUMPACK-SuperLU/P3_V100.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.07-STRUMPACK-SuperLU/P3_V100.pdf 
-------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.07-STRUMPACK-SuperLU/periodic-cube-scaling-strumpack.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.07-STRUMPACK-SuperLU/periodic-cube-scaling-strumpack.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.07-STRUMPACK-SuperLU/periodic-cube-scaling-strumpack_metis.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.07-STRUMPACK-SuperLU/periodic-cube-scaling-strumpack_metis.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.07-STRUMPACK-SuperLU/speedup_SOA.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.07-STRUMPACK-SuperLU/speedup_SOA.jpg -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.07-STRUMPACK-SuperLU/strumpack-Summit.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.07-STRUMPACK-SuperLU/strumpack-Summit.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.07-STRUMPACK-SuperLU/strumpack-scaling.jpg: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.07-STRUMPACK-SuperLU/strumpack-scaling.jpg -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.07-STRUMPACK-SuperLU/strumpack-scaling.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.07-STRUMPACK-SuperLU/strumpack-scaling.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.07-STRUMPACK-SuperLU/superlu-solve-Summit.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.07-STRUMPACK-SuperLU/superlu-solve-Summit.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.07-STRUMPACK-SuperLU/superlu-trisolve-scaling.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.07-STRUMPACK-SuperLU/superlu-trisolve-scaling.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/2.3.3.12-SUNDIALS.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 
2 | @misc{SUNDIALSweb, 3 | author = {{SUNDIALS} {P}roject {T}eam}, 4 | title = {{SUNDIALS} {W}eb Page}, 5 | howpublished = {\url{http://computation.llnl.gov/projects/sundials}} 6 | } 7 | 8 | @article{balosEnablingGPUAccelerated2021, 9 | title = {Enabling {{GPU}} Accelerated Computing in the {{SUNDIALS}} Time Integration Library}, 10 | author = {Balos, Cody J. and Gardner, David J. and Woodward, Carol S. and Reynolds, Daniel R.}, 11 | year = {2021}, 12 | month = dec, 13 | volume = {108}, 14 | pages = {102836}, 15 | issn = {01678191}, 16 | doi = {10.1016/j.parco.2021.102836}, 17 | journal = {Parallel Computing}, 18 | language = {en} 19 | } 20 | -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/2.3.3.12-hypre.bib: -------------------------------------------------------------------------------- 1 | 2 | @article{HeYa2002, 3 | author = {V.~Henson and U.~Yang}, 4 | title = {{BoomerAMG}: a Parallel Algebraic Multigrid Solver and Preconditioner}, 5 | journal = {Applied Numerical Mathematics}, 6 | volume = {41}, 7 | pages = {155--177}, 8 | year = {2002} 9 | } 10 | 11 | @article{AsFa1996, 12 | author = "S.~F.~Ashby and R.~D.~Falgout", 13 | title = "A Parallel Multigrid Preconditioned Conjugate Gradient Algorithm for Groundwater Flow Simulations", 14 | journal = "Nuclear Science and Engineering", 15 | month = "September", 16 | volume = "124", 17 | number = "1", 18 | pages = "145--159", 19 | note = "UCRL-JC-122359", 20 | year = "1996" 21 | } 22 | 23 | @incollection{hypre_design_impl_2006, 24 | author = "R.~D.~Falgout and J.~E.~Jones and U.~M.~Yang", 25 | title = "The Design and Implementation of {\sl hypre}, a Library 26 | of Parallel High Performance Preconditioners", 27 | booktitle = "Numerical Solution of Partial Differential Equations 28 | on Parallel Computers", 29 | series = "Lecture Notes in Computational Science and Engineering", 30 | publisher = "Springer-Verlag", 31 | editor = 
"A.~M.~Bruaset and A.~Tveito", 32 | volume = "51", 33 | note = "UCRL-JRNL-205459", 34 | chapter = "8", 35 | pages = "267--294", 36 | year = "2006" 37 | } 38 | 39 | @article{LiSY2020, 40 | author = "R.~Li and B.~Sjogreen and U.~M.~Yang", 41 | title = "A New Class of AMG Interpolation Operators Based on Matrix-Matrix Operations", 42 | note = "Submitted to SIAM Journal on Scientific Computing", 43 | year = "2020" 44 | } 45 | -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/AMReX_CVODE_OpenMP_GPU-Streams-2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/AMReX_CVODE_OpenMP_GPU-Streams-2.png -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/AMS-PCG.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/AMS-PCG.png -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/PeleC_fig.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/PeleC_fig.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/Spock-AMG-PCG.png: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/Spock-AMG-PCG.png -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/SpockResults-Dec2021.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/SpockResults-Dec2021.png -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/crusher-AMG-PCG.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/crusher-AMG-PCG.png -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/crusher-spock-1e7-Feb2022.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/crusher-spock-1e7-Feb2022.png -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/hypre-mixed-int.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/hypre-mixed-int.png -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/hypre-rap-1gpu.png: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/hypre-rap-1gpu.png -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/manyvector_v2.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/manyvector_v2.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/sunorg1.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.12-SUNDIALS-hypre/sunorg1.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.13-CLOVER/2.3.3.13-CLOVER.tex: -------------------------------------------------------------------------------- 1 | \subsubsection{\stid{3.13} CLOVER} \label{subsubsect:clover} 2 | Mathematical libraries are powerful tools to make better use of Exascale 3 | architectural features and are central for application projects to efficiently 4 | exploit the available computing power. The high-level objective of CLOVER is to 5 | provide scalable, portable numerical algorithms that facilitate efficient 6 | application simulations on Exascale computers. 
With the intention of generating synergies 7 | by facilitating vivid cooperation among the distinct project focus efforts 8 | and expert knowledge transfer, CLOVER was designed as a merger of the heFFTe, SLATE, 9 | and Ginkgo projects, each being complementary 10 | in focus but similar in the need for hardware-specific algorithm design 11 | expertise: SLATE focuses on Exascale-capable dense linear algebra 12 | functionality; heFFTe’s scope is providing robust and fast calculation for 2D 13 | and 3D FFT routines; Ginkgo delivers production-ready, preconditioned iterative solvers for 14 | GPU-accelerated systems. Together, these projects form a robust ecosystem of numerical 15 | base functionality for Exascale computers. 16 | \newpage 17 | -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.13-CLOVER/2.3.3.13-FFT.bib: -------------------------------------------------------------------------------- 1 | @techreport {heffte0.2, 2 | title = {FFT-ECP API and High-Performance Library Prototype for 2-D and 3-D FFTs on Large-Scale Heterogeneous Systems with GPUs}, 3 | number = {FFT-ECP STML13-27}, 4 | year = {2020}, 5 | note = {revision 01-2020}, 6 | month = {2020-01}, 7 | publisher = {Innovative Computing Laboratory, University of Tennessee}, 8 | type = {ECP WBS 2.3.3.13 Milestone Report}, 9 | author = {Stanimire Tomov and Alan Ayala and Azzam Haidar and Jack Dongarra} 10 | } 11 | 12 | @conference{heffte-iccs20, 13 | title = {{heFFTe: Highly Efficient FFT for Exascale}}, 14 | booktitle = {International Conference on Computational Science (ICCS 2020)}, 15 | year = {2020}, 16 | month = {2020-06}, 17 | address = {Amsterdam, Netherlands}, 18 | keywords = {exascale, FFT, gpu, scalable algorithm}, 19 | doi = {https://doi.org/10.1007/978-3-030-50371-0_19}, 20 | author = {Alan Ayala and Stanimire Tomov and Azzam Haidar and Jack Dongarra} 21 | } 22 | 23 | 24 | @conference{heffte-pact21, 25 | title = {{Scalability Issues in 
FFT Computation}}, 26 | booktitle = {International Conference on Parallel Computing Technologies (PaCT 2021)}, 27 | year = {2021}, 28 | month = {2021-09}, 29 | publisher = {Springer, Cham}, 30 | doi = {https://doi.org/10.1007/978-3-030-86359-3_21}, 31 | author = {Alan Ayala and Stanimire Tomov and Miroslav Stoyanov and Jack Dongarra} 32 | } 33 | 34 | @techreport {fftbenchmark, 35 | title = {Interim Report on Benchmarking FFT Libraries on High Performance Systems}, 36 | journal = {Innovative Computing Laboratory Technical Report}, 37 | number = {ICL-UT-21-03}, 38 | year = {2021}, 39 | month = {2021-07}, 40 | publisher = {University of Tennessee}, 41 | type = {ICL Tech Report}, 42 | author = {Ayala, Alan and Tomov, Stanimire and Luszczek, Piotr and Cayrols, Sebastien and Ragghianti, Gerald and Dongarra, Jack} 43 | } 44 | 45 | @techreport{hpec21, 46 | title = {A More Portable HeFFTe: Implementing a Fallback Algorithm for Scalable Fourier Transforms}, 47 | journal = {ICL Technical Report}, 48 | number = {ICL-UT-21-04}, 49 | year = {2021}, 50 | note = {HPEC{\textquoteright}21}, 51 | month = {2021-08}, 52 | publisher = {University of Tennessee}, 53 | type = {ICL Tech Report}, 54 | author = {Daniel Sharp and Miroslav Stoyanov and Stanimire Tomov and Jack Dongarra} 55 | } 56 | -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.13-CLOVER/SLATE-architecture.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.13-CLOVER/SLATE-architecture.jpg -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.13-CLOVER/batchedFFT-Spock.pdf: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.13-CLOVER/batchedFFT-Spock.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.13-CLOVER/ffttransormations.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.13-CLOVER/ffttransormations.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.13-CLOVER/ginkgo_eas/bw_cg_solver.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.13-CLOVER/ginkgo_eas/bw_cg_solver.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.13-CLOVER/ginkgo_eas/bw_csr_spmv.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.13-CLOVER/ginkgo_eas/bw_csr_spmv.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.13-CLOVER/ginkgo_eas/bw_ell_spmv.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.13-CLOVER/ginkgo_eas/bw_ell_spmv.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.13-CLOVER/ginkgo_eas/bw_gmres_solver.pdf: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.13-CLOVER/ginkgo_eas/bw_gmres_solver.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.13-CLOVER/ginkgo_portability_crop.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.13-CLOVER/ginkgo_portability_crop.png -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.13-CLOVER/heFFTeAcceleration.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.13-CLOVER/heFFTeAcceleration.png -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.13-CLOVER/heFFTeScalability.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.13-CLOVER/heFFTeScalability.png -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.13-CLOVER/heFFTeStrongScalability.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.13-CLOVER/heFFTeStrongScalability.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.13-CLOVER/heffte.png: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.13-CLOVER/heffte.png -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.13-CLOVER/heffte_conv_dst.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.13-CLOVER/heffte_conv_dst.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.13-CLOVER/runtime2.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.13-CLOVER/runtime2.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.13-CLOVER/slate-he2hb-1node.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.13-CLOVER/slate-he2hb-1node.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.13-CLOVER/slate-he2hb-4node.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.13-CLOVER/slate-he2hb-4node.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.13-CLOVER/slate-spock-gemm.pdf: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.13-CLOVER/slate-spock-gemm.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.13-CLOVER/slate-spock-trf.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.13-CLOVER/slate-spock-trf.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.14-ALExa-ForTrilinos/2.3.3.14-ALExa.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 2 | @inproceedings{beazley1996swig, 3 | title={{SWIG}: An Easy to Use Tool for Integrating Scripting Languages with {C} and {C++}.}, 4 | author={Beazley, David M and others}, 5 | booktitle={4th Conference on USENIX Tcl/Tk Workshop}, 6 | year={1996} 7 | } 8 | -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.14-ALExa-ForTrilinos/2.3.3.14-ForTrilinos.bib: -------------------------------------------------------------------------------- 1 | % Empty bib file -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.14-ALExa-ForTrilinos/ForTrilinos_ioc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.14-ALExa-ForTrilinos/ForTrilinos_ioc.pdf -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.14-ALExa-ForTrilinos/arborx_summit.png: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.14-ALExa-ForTrilinos/arborx_summit.png -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.14-ALExa-ForTrilinos/dtk-gpu.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.14-ALExa-ForTrilinos/dtk-gpu.png -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.14-ALExa-ForTrilinos/dtk_exaam_pit.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.14-ALExa-ForTrilinos/dtk_exaam_pit.png -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.14-ALExa-ForTrilinos/tasmanian-gpu.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.14-ALExa-ForTrilinos/tasmanian-gpu.png -------------------------------------------------------------------------------- /projects/2.3.3-MathLibs/2.3.3.14-ALExa-ForTrilinos/tasmanian_exastar.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.3-MathLibs/2.3.3.14-ALExa-ForTrilinos/tasmanian_exastar.png -------------------------------------------------------------------------------- 
/projects/2.3.3-MathLibs/2.3.3.15-Sake/2.3.3.15-Sake.tex: -------------------------------------------------------------------------------- 1 | \subsubsection{\stid{3.15} Sake} \label{subsubsect:sake} 2 | 3 | \paragraph{Overview} 4 | 5 | Modern simulation codes running on high-performance computing (HPC) machines often rely heavily on multiple libraries to provide core capabilities such as 6 | meshing, mathematical algorithms, I/O services, and more. This approach is highly productive as it allows domain experts to focus on their core technical 7 | contributions. The Sake project focuses on the design and development of performance-portable mathematical libraries within the Trilinos project and the 8 | Kokkos ecosystem. Specifically, the team provides new implementations of linear algebra methods optimized for the architectures planned for the upcoming exascale 9 | systems while using interfaces already defined in Trilinos, allowing applications a smooth transition toward exascale readiness. 10 | 11 | Sake has two software products: Trilinos and KokkosKernels. It is organized into three subprojects: Trilinos, KokkosKernels, and PEEKS. 12 | PEEKS and KokkosKernels were formerly part of CLOVER, whereas the Trilinos subproject is new in ECP. 13 | -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4-DataViz.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 2 | -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.01-DataViz-SDK/2.3.4.01-DataViz-SDK.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 
2 | -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.01-DataViz-SDK/HDF5-Arch-small.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.01-DataViz-SDK/HDF5-Arch-small.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.01-DataViz-SDK/HDF5-Arch.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.01-DataViz-SDK/HDF5-Arch.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.01-DataViz-SDK/VOL-improvements.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.01-DataViz-SDK/VOL-improvements.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.09-ADIOS/2.3.4.09-ADIOS.bib: -------------------------------------------------------------------------------- 1 | @article{liu2014hello, 2 | title={{Hello ADIOS}: the challenges and lessons of developing leadership class I/O frameworks}, 3 | author={Liu, Qing and Logan, Jeremy and Tian, Yuan and Abbasi, Hasan and Podhorszki, Norbert and Choi, Jong Youl and Klasky, Scott and Tchoua, Roselyne and Lofstead, Jay and Oldfield, Ron and others}, 4 | journal={Concurrency and Computation: Practice and Experience}, 5 | volume={26}, 6 | number={7}, 7 | pages={1453--1473}, 8 | year={2014} 9 | } 10 | 11 | @article{adios2-softwarex-2020, 12 | title = "ADIOS 2: The Adaptable Input Output System. 
A framework for high-performance data management", 13 | journal = "SoftwareX", 14 | volume = "12", 15 | pages = "100561", 16 | year = "2020", 17 | issn = "2352-7110", 18 | doi = "https://doi.org/10.1016/j.softx.2020.100561", 19 | url = "http://www.sciencedirect.com/science/article/pii/S2352711019302560", 20 | author = "William F. Godoy and Norbert Podhorszki and Ruonan Wang and Chuck Atkins and Greg Eisenhauer and Junmin Gu and Philip Davis and Jong Choi and Kai Germaschewski and Kevin Huck and Axel Huebl and Mark Kim and James Kress and Tahsin Kurc and Qing Liu and Jeremy Logan and Kshitij Mehta and George Ostrouchov and Manish Parashar and Franz Poeschel and David Pugmire and Eric Suchyta and Keichi Takahashi and Nick Thompson and Seiji Tsutsumi and Lipeng Wan and Matthew Wolf and Kesheng Wu and Scott Klasky", 21 | keywords = "High-performance computing (HPC), Scalable I/O, Luster GPFS file systems, Staging, RDMA, Data science, In-situ, Exascale computing", 22 | abstract = "We present ADIOS 2, the latest version of the Adaptable Input Output (I/O) System. ADIOS 2 addresses scientific data management needs ranging from scalable I/O in supercomputers, to data analysis in personal computer and cloud systems. Version 2 introduces a unified application programming interface (API) that enables seamless data movement through files, wide-area-networks, and direct memory access, as well as high-level APIs for data analysis. The internal architecture provides a set of reusable and extendable components for managing data presentation and transport mechanisms for new applications. ADIOS 2 bindings are available in C++11, C, Fortran, Python, and Matlab and are currently used across different scientific communities. ADIOS 2 provides a communal framework to tackle data management challenges as we approach the exascale era of supercomputing." 
23 | } 24 | @MISC{ADIOS2-git, 25 | key ="{ADIOS2Git}", 26 | title ="{The {ADIOS2} framework}", 27 | URL = {https://github.com/ornladios/ADIOS2}, 28 | howpublished = "\url{https://github.com/ornladios/ADIOS2}" 29 | } 30 | 31 | 32 | @MISC{ADIOS2-docs, 33 | key ="{ADIOS2Docs}", 34 | title ="{{ADIOS2} documentation}", 35 | URL = {https://adios2.readthedocs.io}, 36 | howpublished = "\url{https://adios2.readthedocs.io}" 37 | } 38 | 39 | 40 | @misc{ecp:homepage, 41 | author = "{ECP} Team", 42 | title = "{The {E}xascale {C}omputing {P}roject}", 43 | howpublished = {\url{https://exascaleproject.org}} 44 | } 45 | 46 | -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.09-ADIOS/ADIOS_in_ECP.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.09-ADIOS/ADIOS_in_ECP.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.10-DataLib/pnetcdf-figure.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.10-DataLib/pnetcdf-figure.pdf -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-Bubbles-Components.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-Bubbles-Components.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-Bubbles-Density.png: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-Bubbles-Density.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-Clip.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-Clip.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-FTLE.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-FTLE.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-Streamlines.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-Streamlines.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-contour-cell-types.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-contour-cell-types.jpg -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-extruded-cell-set.png: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-extruded-cell-set.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-flying-edges.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-flying-edges.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-particle-density.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-particle-density.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-particle-spheres.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-particle-spheres.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-spock-timing.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-spock-timing.png -------------------------------------------------------------------------------- 
/projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-warpx-flow.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-warpx-flow.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-warpx-in-situ.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-warpx-in-situ.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-wdm-in-situ.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/VTKm-wdm-in-situ.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/snl-logos.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.13-ECP-VTK-m/snl-logos.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.14-VeloC-SZ/2.3.4.14-EZ.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 
2 | -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.14-VeloC-SZ/2.3.4.14-VeloC.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 2 | 3 | @inproceedings{PortResEuroPar21, 4 | title = {Towards High Performance Resilience using Performance Portable Abstractions}, 5 | year = {2021}, 6 | author = {Morales, Nicolas and Teranishi, Keita and Nicolae, Bogdan and Trott, Christian and Cappello, Franck}, 7 | booktitle = {EuroPar{\textquoteright}21: 27th International European Conference on Parallel and Distributed Systems}, 8 | address = {Lisbon, Portugal}, 9 | url = {https://hal.inria.fr/hal-03260432}, 10 | doi = {10.1007/978-3-030-29400-7_4}, 11 | keywords = {Performance Portability, Resilience, Fault Tolerance, Checkpointing, Programming Models} 12 | } 13 | -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.14-VeloC-SZ/200718_workflow.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.14-VeloC-SZ/200718_workflow.pdf -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.14-VeloC-SZ/Visual-quality-NYX-SZ.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.14-VeloC-SZ/Visual-quality-NYX-SZ.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.14-VeloC-SZ/qmcpackbig-a.eps: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.14-VeloC-SZ/qmcpackbig-a.eps -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.14-VeloC-SZ/sz-illu.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.14-VeloC-SZ/sz-illu.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.14-VeloC-SZ/time-based-comp-and-random.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.14-VeloC-SZ/time-based-comp-and-random.jpg -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.14-VeloC-SZ/veloc-arch.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.14-VeloC-SZ/veloc-arch.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.14-VeloC-SZ/xSDK-diagram.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.14-VeloC-SZ/xSDK-diagram.jpeg -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.15-HDF5-UnifyCR/2.3.4.15-UNIFYCR.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 
2 | -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.15-HDF5-UnifyCR/UnifyCR-overview.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.15-HDF5-UnifyCR/UnifyCR-overview.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.15-HDF5-UnifyCR/UnifyFS-overview.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.15-HDF5-UnifyCR/UnifyFS-overview.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.15-HDF5-UnifyCR/VOL-Overview.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.15-HDF5-UnifyCR/VOL-Overview.pdf -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.15-HDF5-UnifyCR/async_io_overview.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.15-HDF5-UnifyCR/async_io_overview.pdf -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.15-HDF5-UnifyCR/milestone2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.15-HDF5-UnifyCR/milestone2.png 
-------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.15-HDF5-UnifyCR/usingUnifyFS.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.15-HDF5-UnifyCR/usingUnifyFS.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.16-ALPINE-ZFP/ZFP.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.16-ALPINE-ZFP/ZFP.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.16-ALPINE-ZFP/alpine-cinema-mfixexa-workflow.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.16-ALPINE-ZFP/alpine-cinema-mfixexa-workflow.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.16-ALPINE-ZFP/alpine_infrastructure.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.16-ALPINE-ZFP/alpine_infrastructure.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.16-ALPINE-ZFP/alpine_nyxSamplingExample.png: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.16-ALPINE-ZFP/alpine_nyxSamplingExample.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.16-ALPINE-ZFP/alpine_topology.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.16-ALPINE-ZFP/alpine_topology.jpg -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.16-ALPINE-ZFP/alpine_topology_orig.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.16-ALPINE-ZFP/alpine_topology_orig.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.16-ALPINE-ZFP/zfp-performance.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.16-ALPINE-ZFP/zfp-performance.pdf -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.16-ALPINE-ZFP/zfp-sw4-hdf5.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.16-ALPINE-ZFP/zfp-sw4-hdf5.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/2.3.4.16-ALPINE-ZFP/zfp-sw4.png: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/2.3.4.16-ALPINE-ZFP/zfp-sw4.png -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/DataViz-storage-notional-diagram.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/DataViz-storage-notional-diagram.pdf -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/DataViz-storage-specs-current.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/DataViz-storage-specs-current.pdf -------------------------------------------------------------------------------- /projects/2.3.4-DataViz/DataViz-storage-specs-next.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.4-DataViz/DataViz-storage-specs-next.pdf -------------------------------------------------------------------------------- /projects/2.3.5-Ecosystem/2.3.5-Ecosystem.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. -------------------------------------------------------------------------------- /projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/2.3.5.01-Ecosystem-SDK.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 2 | 3 | @misc{xSDK-community-package-policies2016, 4 | title = {{xSDK} Community Package Policies}, 5 | author = {B. Smith and R. 
Bartlett and {xSDK developers}}, 6 | note = {version 0.3, December 2, 2016, 7 | \url{https://dx.doi.org/10.6084/m9.figshare.4495136}}, 8 | year = 2016 9 | } 10 | 11 | @misc{e4s:policies, 12 | key = "{E4S} {P}roject {T}eam", 13 | title = "{{E4S} {C}ommunity {P}olicies}", 14 | howpublished = {\url{https://e4s-project.github.io/policies.html}} 15 | } 16 | 17 | 18 | techreport{Klinvex-xSDKTrilinos, 19 | title = {{xSDKTrilinos} User Manual}, 20 | author = {Alicia Marie Klinvex}, 21 | year = 2016, 22 | number = {SAND2016-3396 O}, 23 | institution = {Sandia} 24 | } 25 | 26 | misc{xSDK-community-installation-policies2016, 27 | title = {{xSDK} Community Installation Policies: {GNU Autoconf} and {CMake} Options}, 28 | author = {R. Bartlett and J. Sarich and B. Smith and T. Gamblin and {xSDK developers}}, 29 | note = {version 0.1, December 19, 2016, \url{https://dx.doi.org/10.6084/m9.figshare.4495133}}, 30 | year = 2016 31 | } 32 | 33 | inproceedings{gamblin+:sc15, 34 | Acceptancerate = {22\%}, 35 | Address = {Austin, Texas}, 36 | Author = {Todd Gamblin and Matthew P. LeGendre and Michael R. Collette and Gregory L. Lee and Adam Moody and Bronis R. de Supinski and W. 
Scott Futral}, 37 | Booktitle = {Supercomputing 2015 (SC'15)}, 38 | Date-Added = {2015-06-28 22:46:34 +0000}, 39 | Date-Modified = {2015-10-12 16:12:11 +0000}, 40 | Month = {November 15-20}, 41 | Note = {LLNL-CONF-669890}, 42 | Title = {{The Spack Package Manager: Bringing order to HPC software chaos}}, 43 | Url = {http://tgamblin.github.io/pubs/spack-sc15.pdf}, 44 | Year = {2015}} 45 | 46 | @misc{e4s:homepage, 47 | key = "{E4S} {P}roject {T}eam", 48 | title = "{{E4S} {W}eb page}", 49 | howpublished = {\url{http://e4s.io}} 50 | } 51 | 52 | @misc{e4s:validation, 53 | key = "{E4S} {P}roject {T}eam", 54 | title = "{{E4S} {V}alidation {T}est {S}uite}", 55 | howpublished = {\url{https://github.com/E4S-Project/testsuite}} 56 | } 57 | 58 | -------------------------------------------------------------------------------- /projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/E4S-policy-comment.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/E4S-policy-comment.png -------------------------------------------------------------------------------- /projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/E4S_Nalu_AWS.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/E4S_Nalu_AWS.png -------------------------------------------------------------------------------- /projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/E4S_Pantheon.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/E4S_Pantheon.png 
-------------------------------------------------------------------------------- /projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/E4S_Pantheon_small.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/E4S_Pantheon_small.png -------------------------------------------------------------------------------- /projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/E4S_WDMApp.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/E4S_WDMApp.png -------------------------------------------------------------------------------- /projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/E4S_buildcache_Feb22.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/E4S_buildcache_Feb22.png -------------------------------------------------------------------------------- /projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/E4S_buildcache_Jun22.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/E4S_buildcache_Jun22.png -------------------------------------------------------------------------------- /projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/E4S_buildcache_Oct21.png: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/E4S_buildcache_Oct21.png -------------------------------------------------------------------------------- /projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/SDKdefinition1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/SDKdefinition1.png -------------------------------------------------------------------------------- /projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/SDKdefinition2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/SDKdefinition2.png -------------------------------------------------------------------------------- /projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/SDKdefinition3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/SDKdefinition3.png -------------------------------------------------------------------------------- /projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/SDKdefinitionV2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/SDKdefinitionV2.png -------------------------------------------------------------------------------- /projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/SDKfig.png: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/SDKfig.png -------------------------------------------------------------------------------- /projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/SpackBuildCacheWDMapp.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.5-Ecosystem/2.3.5.01-Ecosystem-SDK/SpackBuildCacheWDMapp.png -------------------------------------------------------------------------------- /projects/2.3.5-Ecosystem/2.3.5.09-SW-Packaging/2.3.5.09-SW-Packaging.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 2 | @misc{supercontainers, 3 | key = "{S}upercontainers {P}roject {T}eam", 4 | title = "{Supercontainers Presentation}", 5 | howpublished = {\url{https://oaciss.uoregon.edu/E4S-Forum19/talks/Younge-E4S.pdf}} 6 | } -------------------------------------------------------------------------------- /projects/2.3.5-Ecosystem/2.3.5.10-ExaWorks/exaworks-circle.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.5-Ecosystem/2.3.5.10-ExaWorks/exaworks-circle.png -------------------------------------------------------------------------------- /projects/2.3.5-Ecosystem/2.3.5.10-ExaWorks/exaworks.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.5-Ecosystem/2.3.5.10-ExaWorks/exaworks.png 
-------------------------------------------------------------------------------- /projects/2.3.6-NNSA/2.3.6-NNSA.bib: -------------------------------------------------------------------------------- 1 | # Put your BibTeX entries in this file. 2 | -------------------------------------------------------------------------------- /projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/ECPReviewScreenshot.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/ECPReviewScreenshot.png -------------------------------------------------------------------------------- /projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/cinema-cis-stone-coolwarm.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/cinema-cis-stone-coolwarm.png -------------------------------------------------------------------------------- /projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/cinema-cis-stone-grayscale.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/cinema-cis-stone-grayscale.png -------------------------------------------------------------------------------- /projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/cinema-cis-stone-water.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/cinema-cis-stone-water.png -------------------------------------------------------------------------------- 
/projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/cinema-cis-streamlines.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/cinema-cis-streamlines.png -------------------------------------------------------------------------------- /projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/cinema-jnc-nyx-volume.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/cinema-jnc-nyx-volume.png -------------------------------------------------------------------------------- /projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/control-replication-performance.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/control-replication-performance.png -------------------------------------------------------------------------------- /projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/hxhim-main.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/hxhim-main.png -------------------------------------------------------------------------------- /projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/mesh.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/mesh.pdf -------------------------------------------------------------------------------- 
/projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/pantheon-workflow.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/pantheon-workflow.png -------------------------------------------------------------------------------- /projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/tracing-performance.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.01-LANL-ATDM/tracing-performance.png -------------------------------------------------------------------------------- /projects/2.3.6-NNSA/2.3.6.02-LLNL-ATDM/HO-LO.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.02-LLNL-ATDM/HO-LO.pdf -------------------------------------------------------------------------------- /projects/2.3.6-NNSA/2.3.6.02-LLNL-ATDM/New.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.02-LLNL-ATDM/New.pdf -------------------------------------------------------------------------------- /projects/2.3.6-NNSA/2.3.6.02-LLNL-ATDM/Old.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.02-LLNL-ATDM/Old.pdf -------------------------------------------------------------------------------- /projects/2.3.6-NNSA/2.3.6.02-LLNL-ATDM/ROSE-raja.png: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.02-LLNL-ATDM/ROSE-raja.png -------------------------------------------------------------------------------- /projects/2.3.6-NNSA/2.3.6.02-LLNL-ATDM/mfem-amr.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.02-LLNL-ATDM/mfem-amr.jpg -------------------------------------------------------------------------------- /projects/2.3.6-NNSA/2.3.6.02-LLNL-ATDM/mfem-gpu.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.02-LLNL-ATDM/mfem-gpu.pdf -------------------------------------------------------------------------------- /projects/2.3.6-NNSA/2.3.6.02-LLNL-ATDM/mfem-hp-refinement.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.02-LLNL-ATDM/mfem-hp-refinement.png -------------------------------------------------------------------------------- /projects/2.3.6-NNSA/2.3.6.02-LLNL-ATDM/raja-umpire-chai-support.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.02-LLNL-ATDM/raja-umpire-chai-support.pdf -------------------------------------------------------------------------------- /projects/2.3.6-NNSA/2.3.6.02-LLNL-ATDM/spack-pipelines.pdf: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.02-LLNL-ATDM/spack-pipelines.pdf -------------------------------------------------------------------------------- /projects/2.3.6-NNSA/2.3.6.02-LLNL-ATDM/xSDK-diagram.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.02-LLNL-ATDM/xSDK-diagram.jpeg -------------------------------------------------------------------------------- /projects/2.3.6-NNSA/2.3.6.03-SNL-ATDM/kokkos-abstractions.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/projects/2.3.6-NNSA/2.3.6.03-SNL-ATDM/kokkos-abstractions.jpg -------------------------------------------------------------------------------- /references.bib: -------------------------------------------------------------------------------- 1 | @misc{Heroux-SDK-Podcast, 2 | author = {Michael A.~Heroux}, 3 | title = {Episode 17: Making the Development of Scientific Applications Effective and Efficient}, 4 | date = {May 10, 2018}, 5 | note = {\url{https://soundcloud.com/exascale-computing-project/episode-17-making-the-development-of-scientific-applications-effective-and-efficient}}, 6 | organization = {The Exascale Computing Project}, 7 | } 8 | @unpublished{Thakur2017GapAnalysis, 9 | author = {Rajeev Thakur and Pat McCormick and Jim Ahrens and Al Geist and Michael A.~Heroux and Rob Neely and Rob Ross and Martin Schulz and Jeff Vetter}, 10 | title = {ECP Software Technology Gap Analysis}, 11 | date = {September 30, 2017}, 12 | note = {This is an internal report for the Exascale Computing Project, Software Technology Focus 
Area}, 13 | } 14 | @misc{TOSS, 15 | author = {Livermore Computing}, 16 | title = {TOSS: Speeding Up Commodity Cluster Computing}, 17 | date = {May 25, 2018}, 18 | url = {https://computation.llnl.gov/projects/toss-speeding-commodity-cluster-computing}, 19 | note = {\url{https://computation.llnl.gov/projects/toss-speeding-commodity-cluster-computing}}, 20 | } 21 | @misc{OpenHPC, 22 | author = {OpenHPC}, 23 | title = {Community building blocks for HPC systems}, 24 | date = {May 25, 2018}, 25 | url = {http://openhpc.community}, 26 | note = {\url{http://openhpc.community}}, 27 | } 28 | @Article{FFTW05, 29 | author = {Frigo, Matteo and Johnson, Steven~G.}, 30 | title = {The Design and Implementation of {FFTW3}}, 31 | journal = {Proceedings of the IEEE}, 32 | year = 2005, 33 | volume = 93, 34 | number = 2, 35 | pages = {216--231}, 36 | note = {Special issue on ``Program Generation, Optimization, and Platform Adaptation''} 37 | } 38 | @misc{413.3B, 39 | author = "Paul Bosco", 40 | title = {{DOE Order 413.3B: Program and Project Management (PM) for the Acquisition of Capital Assets, Significant Changes to the Order}}, 41 | url = {https://www.energy.gov/sites/prod/files/maprod/documents/15-1025_Bosco.pdf}, 42 | note = {\url{https://www.energy.gov/sites/prod/files/maprod/documents/15-1025_Bosco.pdf}} 43 | } -------------------------------------------------------------------------------- /xSDK-Diagram.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/xSDK-Diagram.jpeg -------------------------------------------------------------------------------- /xSDK-Policies.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/E4S-Project/ECP-ST-CAR-PUBLIC/adda6659ca54db6a4140e3480fb74bf9269311bc/xSDK-Policies.jpeg 
--------------------------------------------------------------------------------