├── .gitattributes ├── .github └── ISSUE_TEMPLATE │ ├── ISSUE.yaml │ ├── QUESTION.yaml │ ├── RFE.yaml │ └── config.yml ├── .gitignore ├── .pre-commit-config.yaml ├── CMakeLists.txt ├── Compatibility.md ├── License.txt ├── README.md ├── changelog ├── cmake_config ├── NVSHMEMConfig.cmake.in └── NVSHMEMEnv.cmake ├── examples ├── CMakeLists.txt ├── bootstrap_helper.h ├── collective-launch.cu ├── dev-guide-ring-mpi.cu ├── dev-guide-ring.cu ├── gemm_allreduce │ ├── allreduce_nvls_warpspecialized.hpp │ ├── gemmAR_fusion_blackwell_fp16.cu │ ├── nvshmemAlloc.hpp │ └── sm100_gemm_tma_warpspecialized_allreduce.hpp ├── hello.cpp ├── moe_shuffle.cu ├── mpi-based-init.cu ├── on-stream.cu ├── put-block.cu ├── ring-bcast.cu ├── ring-reduce.cu ├── shmem-based-init.cu ├── thread-group.cu ├── uid-based-init.cu └── user-buffer.cu ├── nvshmem4py ├── CMakeLists.txt ├── License.txt ├── MANIFEST.in ├── README.md ├── build_assets │ └── numbast │ │ ├── config_nvshmem.py │ │ ├── generate_mem.py │ │ ├── numbast_entry_point.h │ │ └── templates │ │ ├── config_nvshmem.yml.j2 │ │ └── core │ │ └── device │ │ └── numba │ │ └── mem.py.j2 ├── cmake │ ├── addNumbast.cmake │ └── buildWheel.cmake ├── examples │ ├── device │ │ └── numba │ │ │ └── moe_dataflow.py │ ├── device_custom_kernel.py │ ├── device_ring_all_reduce.py │ ├── init_fini.py │ ├── on-stream.py │ ├── simple_p2p_kernel.py │ ├── torch_mempool.py │ ├── torch_triton_interop.py │ └── triton_comm_kernels.py ├── nvshmem │ ├── __init__.py │ ├── bindings │ │ ├── __init__.py │ │ ├── _internal │ │ │ ├── __init__.py │ │ │ ├── nvshmem.pxd │ │ │ ├── nvshmem.pyx │ │ │ └── nvshmem_linux.pyx │ │ ├── cynvshmem.pxd │ │ ├── cynvshmem.pyx │ │ ├── device │ │ │ ├── __init__.py │ │ │ └── numba │ │ │ │ ├── __init__.py │ │ │ │ ├── _numbast.py │ │ │ │ └── entry_point.h │ │ ├── nvshmem.pxd │ │ └── nvshmem.pyx │ ├── core │ │ ├── __init__.py │ │ ├── _internal_tracking.py │ │ ├── collective.py │ │ ├── device │ │ │ ├── __init__.py │ │ │ └── numba │ │ │ │ ├── __init__.py │ │ │ │ ├── amo.py │ │ │ │ ├── collective.py │ │ │ │ ├── direct.py │ │ │ │ └── rma.py │ │ ├── direct.py │ │ ├── init_fini.py │ │ ├── interop │ │ │ ├── cupy.py │ │ │ └── torch.py │ │ ├── memory.py │ │ ├── nvshmem_types.py │ │ ├── rma.py │ │ ├── teams.py │ │ └── utils.py │ └── version.py ├── perftest │ ├── alltoall_on_stream.py │ ├── broadcast_on_stream.py │ ├── fcollect_on_stream.py │ ├── reducescatter_on_stream.py │ ├── reduction_on_stream.py │ └── utils.py ├── requirements_build.txt ├── requirements_cuda11.txt ├── requirements_cuda12.txt ├── requirements_cuda13.txt ├── requirements_optional_cuda11.txt ├── requirements_optional_cuda12.txt ├── requirements_optional_cuda13.txt ├── scripts │ ├── find_python_versions.sh │ └── generate_pyproject_toml.py └── setup.py ├── nvshmem_bootstrap.sym ├── nvshmem_host.sym ├── nvshmem_transport.sym ├── perftest ├── CMakeLists.txt ├── README.md ├── common │ ├── CMakeLists.txt │ ├── atomic_bw_common.h │ ├── atomic_one_sided_common.h │ ├── atomic_ping_pong_common.h │ ├── utils.cu │ └── utils.h ├── device │ ├── CMakeLists.txt │ ├── coll │ │ ├── CMakeLists.txt │ │ ├── alltoall_latency.args │ │ ├── alltoall_latency.cu │ │ ├── barrier_latency.args │ │ ├── barrier_latency.cu │ │ ├── bcast_latency.args │ │ ├── bcast_latency.cu │ │ ├── coll_test.h │ │ ├── fcollect_latency.args │ │ ├── fcollect_latency.cu │ │ ├── redmaxloc_latency.cu │ │ ├── reducescatter_latency.args │ │ ├── reducescatter_latency.cu │ │ ├── reduction_latency.args │ │ ├── reduction_latency.cu │ │ ├── sync_latency.args │ │ └── sync_latency.cu │ ├── pt-to-pt │ │ ├── CMakeLists.txt │ │ ├── shmem_atomic_bw.args │ │ ├── shmem_atomic_bw.cu │ │ ├── shmem_atomic_latency.args │ │ ├── shmem_atomic_latency.cu │ │ ├── shmem_atomic_ping_pong_latency.args │ │ ├── shmem_atomic_ping_pong_latency.cu │ │ ├── shmem_g_bw.args │ │ ├── shmem_g_bw.cu │ │ ├── shmem_g_latency.args │ │ ├── shmem_g_latency.cu │ │ ├── shmem_get_bw.args │ │ ├── shmem_get_bw.cu │ │ ├── shmem_get_latency.args │ │ ├── shmem_get_latency.cu │ │ ├── shmem_p_bw.args │ │ ├── shmem_p_bw.cu │ │ ├── shmem_p_latency.args │ │ ├── shmem_p_latency.cu │ │ ├── shmem_p_ping_pong_latency.args │ │ ├── shmem_p_ping_pong_latency.cu │ │ ├── shmem_put_atomic_ping_pong_latency.cu │ │ ├── shmem_put_bw.args │ │ ├── shmem_put_bw.cu │ │ ├── shmem_put_latency.args │ │ ├── shmem_put_latency.cu │ │ ├── shmem_put_ping_pong_latency.args │ │ ├── shmem_put_ping_pong_latency.cu │ │ ├── shmem_put_signal_ping_pong_latency.args │ │ ├── shmem_put_signal_ping_pong_latency.cu │ │ ├── shmem_signal_ping_pong_latency.args │ │ ├── shmem_signal_ping_pong_latency.cu │ │ ├── shmem_st_bw.args │ │ └── shmem_st_bw.cu │ └── tile │ │ ├── CMakeLists.txt │ │ ├── tile_allgather_latency.cu │ │ ├── tile_allreduce_latency.cu │ │ └── tile_coll_test.h ├── host │ ├── CMakeLists.txt │ ├── coll │ │ ├── CMakeLists.txt │ │ ├── alltoall_on_stream.args │ │ ├── alltoall_on_stream.cpp │ │ ├── barrier_all_on_stream.cpp │ │ ├── barrier_on_stream.args │ │ ├── barrier_on_stream.cpp │ │ ├── broadcast_on_stream.args │ │ ├── broadcast_on_stream.cpp │ │ ├── coll_test.h │ │ ├── fcollect_on_stream.args │ │ ├── fcollect_on_stream.cpp │ │ ├── reducescatter_on_stream.args │ │ ├── reducescatter_on_stream.cpp │ │ ├── reduction_on_stream.args │ │ ├── reduction_on_stream.cpp │ │ ├── sync_all_on_stream.cpp │ │ ├── sync_on_stream.args │ │ └── sync_on_stream.cpp │ ├── init │ │ ├── CMakeLists.txt │ │ └── malloc.cpp │ └── pt-to-pt │ │ ├── CMakeLists.txt │ │ ├── bw.args │ │ ├── bw.cpp │ │ ├── latency.args │ │ ├── latency.cpp │ │ ├── stream_latency.args │ │ └── stream_latency.cu ├── perfTestRunnerSlurm.py ├── perftest-ib.list ├── perftest-mmap-full.list ├── perftest-mmap-sanity.list ├── perftest-p2p-cudagraph.list ├── perftest-p2p-nvlink.list ├── perftest-p2p-pcie.list ├── perftestCommon.py └── perftestRunner.py ├── pkg └── nvshmem_package_description.txt ├── scripts ├── bitcode_lib_cleanup.sh └── install_hydra.sh └── src ├── CMakeLists.txt ├── bin └── nvshmem-info.cpp ├── device ├── CMakeLists.txt ├── init │ └── init_device.cu └── launch │ └── collective_launch.cpp ├── host ├── bootstrap │ ├── bootstrap.cpp │ └── bootstrap_loader.cpp ├── coll │ ├── alltoall │ │ ├── alltoall.cpp │ │ ├── alltoall.h │ │ └── alltoall_on_stream.cpp │ ├── barrier │ │ ├── barrier.cpp │ │ ├── barrier.h │ │ └── barrier_on_stream.cpp │ ├── broadcast │ │ ├── broadcast.cpp │ │ ├── broadcast.h │ │ └── broadcast_on_stream.cpp │ ├── cpu_coll.cpp │ ├── cpu_coll.h │ ├── fcollect │ │ ├── fcollect.cpp │ │ ├── fcollect.h │ │ ├── fcollect_on_stream.cpp │ │ └── fcollect_on_stream.h │ ├── rdxn │ │ ├── rdxn.cpp │ │ ├── rdxn.h │ │ └── rdxn_on_stream.cpp │ └── reducescatter │ │ ├── reducescatter.cpp │ │ ├── reducescatter.h │ │ └── reducescatter_on_stream.cpp ├── comm │ ├── amo.cpp │ ├── fence.cpp │ ├── putget.cpp │ ├── quiet.cpp │ ├── rma.cu │ └── sync.cpp ├── init │ ├── cudawrap.cpp │ ├── init.cu │ ├── init_nvtx.cpp │ ├── nvmlwrap.cpp │ └── query_host.cpp ├── mem │ ├── custom_malloc.cpp │ ├── dlmalloc.cpp │ ├── dlmalloc.h │ ├── mem.cpp │ ├── mem_heap.cpp │ └── mem_transport.cpp ├── proxy │ ├── proxy.cpp │ └── proxy_host.h ├── stream │ ├── coll │ │ ├── alltoall │ │ │ └── alltoall.cu │ │ ├── barrier │ │ │ └── barrier.cu │ │ ├── broadcast │ │ │ └── broadcast.cu │ │ ├── fcollect │ │ │ └── fcollect.cu │ │ ├── rdxn │ │ │ ├── reduce_and.cu │ │ │ ├── reduce_common.cuh │ │ │ ├── reduce_max.cu │ │ │ ├── reduce_min.cu │ │ │ ├── reduce_or.cu │ │ │ ├── reduce_prod.cu │ │ │ ├── reduce_sum.cu │ │ │ ├── reduce_team.cu │ │ │ └── reduce_xor.cu │ │ └── reducescatter │ │ │ ├── reducescatter_and.cu │ │ │ ├── reducescatter_common.cuh │ │ │ ├── reducescatter_max.cu │ │ │ ├── reducescatter_min.cu │ │ │ ├── reducescatter_or.cu │ │ │ ├── reducescatter_prod.cu │ │ │ ├── reducescatter_sum.cu │ │ │ └── reducescatter_xor.cu │ └── comm │ │ ├── cuda_interface_sync.cu │ │ └── quiet_on_stream.cu ├── team │ ├── team.cu │ ├── team_internal.cpp │ ├── team_internal.h │ ├── team_internal_cuda.cu │ └── team_internal_nvls.cpp ├── topo │ ├── topo.cpp │ └── topo.h ├── transport │ ├── p2p │ │ ├── p2p.cpp │ │ └── p2p.h │ └── transport.cpp └── util │ ├── cs.cpp │ ├── debug.cpp │ ├── env_vars.cpp │ ├── shared_memory.cpp │ ├── sockets.cpp │ └── util.cpp ├── include ├── bootstrap_device_host │ └── nvshmem_uniqueid.h ├── bootstrap_host_transport │ └── env_defs_internal.h ├── device │ ├── nvshmem_coll_defines.cuh │ ├── nvshmem_defines.h │ ├── nvshmem_device_macros.h │ ├── nvshmemx_coll_defines.cuh │ ├── nvshmemx_collective_launch_apis.h │ ├── nvshmemx_defines.h │ └── tile │ │ ├── nvshmemx_tile_api.hpp │ │ └── nvshmemx_tile_api_defines.cuh ├── device_host │ ├── nvshmem_common.cuh │ ├── nvshmem_proxy_channel.h │ ├── nvshmem_tensor.h │ └── nvshmem_types.h ├── device_host_transport │ ├── nvshmem_common_ibgda.h │ ├── nvshmem_common_transport.h │ └── nvshmem_constants.h ├── host │ ├── env │ │ └── env_defs.h │ ├── nvshmem_api.h │ ├── nvshmem_coll_api.h │ ├── nvshmem_macros.h │ ├── nvshmemx_api.h │ └── nvshmemx_coll_api.h ├── internal │ ├── bootstrap_host │ │ └── nvshmemi_bootstrap.h │ ├── bootstrap_host_transport │ │ └── nvshmemi_bootstrap_defines.h │ ├── common │ │ └── error_codes_internal.h │ ├── device │ │ └── nvshmemi_device.h │ ├── host │ │ ├── cuda_interface_sync.h │ │ ├── custom_malloc.h │ │ ├── debug.h │ │ ├── error_codes_internal.h │ │ ├── nvmlwrap.h │ │ ├── nvshmem_internal.h │ │ ├── nvshmem_nvtx.hpp │ │ ├── nvshmemi_bootstrap_library.h │ │ ├── nvshmemi_coll.h │ │ ├── nvshmemi_mem_transport.hpp │ │ ├── nvshmemi_nvls_rsc.hpp │ │ ├── nvshmemi_symmetric_heap.hpp │ │ ├── nvshmemi_team.h │ │ ├── nvshmemi_types.h │ │ ├── nvtx3.hpp │ │ ├── shared_memory.h │ │ ├── sockets.h │ │ └── util.h │ ├── host_transport │ │ ├── cudawrap.h │ │ ├── nvshmemi_transport_defines.h │ │ └── transport.h │ └── non_abi │ │ ├── nvshmemi_h_to_d_coll_defs.cuh │ │ ├── nvshmemi_h_to_d_rma_defs.cuh │ │ └── nvshmemi_h_to_d_sync_defs.cuh ├── non_abi │ ├── device │ │ ├── coll │ │ │ ├── alltoall.cuh │ │ │ ├── barrier.cuh │ │ │ ├── broadcast.cuh │ │ │ ├── defines.cuh │ │ │ ├── fcollect.cuh │ │ │ ├── reduce.cuh │ │ │ ├── reducescatter.cuh │ │ │ └── utils.cuh │ │ ├── common │ │ │ ├── nvshmemi_common_device.cuh │ │ │ └── nvshmemi_tile_utils.cuh │ │ ├── pt-to-pt │ │ │ ├── ibgda_device.cuh │ │ │ ├── nvshmemi_transfer_api.cuh │ │ │ ├── proxy_device.cuh │ │ │ ├── tile.cuh │ │ │ ├── transfer_device.cuh.in │ │ │ └── utils_device.h │ │ ├── team │ │ │ └── nvshmemi_team_defines.cuh │ │ ├── threadgroup │ │ │ └── nvshmemi_common_device_defines.cuh │ │ └── wait │ │ │ └── nvshmemi_wait_until_apis.cuh │ ├── nvshmem_build_options.h.in │ ├── nvshmem_version.h.in │ └── nvshmemx_error.h ├── nvshmem.h ├── nvshmem_host.h └── nvshmemx.h └── modules ├── bootstrap ├── CMakeLists.txt.in ├── common │ ├── CMakeLists.txt.in │ ├── bootstrap_util.cpp │ ├── bootstrap_util.h │ └── env_defs.h ├── mpi │ ├── CMakeLists.txt.in │ └── bootstrap_mpi.c ├── pmi │ ├── CMakeLists.txt.in │ ├── bootstrap_pmi.cpp │ ├── pmi-2 │ │ ├── COPYRIGHT │ │ ├── pmi2.h │ │ ├── pmi2_api.c │ │ ├── pmi2_util.c │ │ └── pmi2_util.h │ └── simple-pmi │ │ ├── pmi_internal.h │ │ ├── simple_pmi.cpp │ │ ├── simple_pmiutil.cpp │ │ └── simple_pmiutil.h ├── pmix │ ├── CMakeLists.txt.in │ └── bootstrap_pmix.c ├── shmem │ ├── CMakeLists.txt.in │ └── bootstrap_shmem.c └── uid │ ├── CMakeLists.txt.in │ ├── bootstrap_uid.cpp │ ├── bootstrap_uid_remap.h │ ├── bootstrap_uid_types.hpp │ └── ncclSocket │ ├── commit_info.txt │ ├── ncclsocket_checks.h │ ├── ncclsocket_debug.h │ ├── ncclsocket_nccl.h │ ├── ncclsocket_param.h │ ├── ncclsocket_socket.cpp │ ├── ncclsocket_socket.hpp │ └── ncclsocket_utils.h └── transport ├── CMakeLists.txt.in ├── common ├── CMakeLists.txt.in ├── env_defs.h ├── mlx5_ifc.h ├── mlx5_prm.h ├── transport_common.cpp ├── transport_common.h ├── transport_gdr_common.cpp ├── transport_gdr_common.h ├── transport_ib_common.cpp ├── transport_ib_common.h ├── transport_mlx5_common.cpp └── transport_mlx5_common.h ├── ibdevx ├── CMakeLists.txt.in ├── ibdevx.cpp └── ibdevx.h ├── ibgda ├── CMakeLists.txt.in └── ibgda.cpp ├── ibrc ├── CMakeLists.txt.in └── ibrc.cpp ├── libfabric ├── CMakeLists.txt.in ├── libfabric.cpp └── libfabric.h └── ucx ├── CMakeLists.txt.in ├── ucx.cpp └── ucx.h /.gitattributes: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/.gitattributes -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/ISSUE.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/.github/ISSUE_TEMPLATE/ISSUE.yaml -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/QUESTION.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/.github/ISSUE_TEMPLATE/QUESTION.yaml -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/RFE.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/.github/ISSUE_TEMPLATE/RFE.yaml -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/config.yml: -------------------------------------------------------------------------------- 1 | blank_issues_enabled: false -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/.gitignore -------------------------------------------------------------------------------- /.pre-commit-config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/.pre-commit-config.yaml -------------------------------------------------------------------------------- /CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/CMakeLists.txt -------------------------------------------------------------------------------- /Compatibility.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/Compatibility.md -------------------------------------------------------------------------------- /License.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/License.txt -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/README.md -------------------------------------------------------------------------------- /changelog: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/changelog -------------------------------------------------------------------------------- /cmake_config/NVSHMEMConfig.cmake.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/cmake_config/NVSHMEMConfig.cmake.in -------------------------------------------------------------------------------- /cmake_config/NVSHMEMEnv.cmake: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/cmake_config/NVSHMEMEnv.cmake -------------------------------------------------------------------------------- /examples/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/examples/CMakeLists.txt -------------------------------------------------------------------------------- /examples/bootstrap_helper.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/examples/bootstrap_helper.h -------------------------------------------------------------------------------- /examples/collective-launch.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/examples/collective-launch.cu -------------------------------------------------------------------------------- /examples/dev-guide-ring-mpi.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/examples/dev-guide-ring-mpi.cu -------------------------------------------------------------------------------- /examples/dev-guide-ring.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/examples/dev-guide-ring.cu -------------------------------------------------------------------------------- /examples/gemm_allreduce/allreduce_nvls_warpspecialized.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/examples/gemm_allreduce/allreduce_nvls_warpspecialized.hpp -------------------------------------------------------------------------------- /examples/gemm_allreduce/gemmAR_fusion_blackwell_fp16.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/examples/gemm_allreduce/gemmAR_fusion_blackwell_fp16.cu -------------------------------------------------------------------------------- /examples/gemm_allreduce/nvshmemAlloc.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/examples/gemm_allreduce/nvshmemAlloc.hpp -------------------------------------------------------------------------------- /examples/gemm_allreduce/sm100_gemm_tma_warpspecialized_allreduce.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/examples/gemm_allreduce/sm100_gemm_tma_warpspecialized_allreduce.hpp -------------------------------------------------------------------------------- /examples/hello.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/examples/hello.cpp -------------------------------------------------------------------------------- /examples/moe_shuffle.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/examples/moe_shuffle.cu -------------------------------------------------------------------------------- /examples/mpi-based-init.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/examples/mpi-based-init.cu -------------------------------------------------------------------------------- /examples/on-stream.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/examples/on-stream.cu -------------------------------------------------------------------------------- /examples/put-block.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/examples/put-block.cu -------------------------------------------------------------------------------- /examples/ring-bcast.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/examples/ring-bcast.cu -------------------------------------------------------------------------------- /examples/ring-reduce.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/examples/ring-reduce.cu -------------------------------------------------------------------------------- /examples/shmem-based-init.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/examples/shmem-based-init.cu -------------------------------------------------------------------------------- /examples/thread-group.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/examples/thread-group.cu -------------------------------------------------------------------------------- /examples/uid-based-init.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/examples/uid-based-init.cu -------------------------------------------------------------------------------- /examples/user-buffer.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/examples/user-buffer.cu -------------------------------------------------------------------------------- /nvshmem4py/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/CMakeLists.txt -------------------------------------------------------------------------------- /nvshmem4py/License.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/License.txt -------------------------------------------------------------------------------- /nvshmem4py/MANIFEST.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/MANIFEST.in -------------------------------------------------------------------------------- /nvshmem4py/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/README.md -------------------------------------------------------------------------------- /nvshmem4py/build_assets/numbast/config_nvshmem.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/build_assets/numbast/config_nvshmem.py -------------------------------------------------------------------------------- /nvshmem4py/build_assets/numbast/generate_mem.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/build_assets/numbast/generate_mem.py -------------------------------------------------------------------------------- /nvshmem4py/build_assets/numbast/numbast_entry_point.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/build_assets/numbast/numbast_entry_point.h -------------------------------------------------------------------------------- /nvshmem4py/build_assets/numbast/templates/config_nvshmem.yml.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/build_assets/numbast/templates/config_nvshmem.yml.j2 -------------------------------------------------------------------------------- /nvshmem4py/build_assets/numbast/templates/core/device/numba/mem.py.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/build_assets/numbast/templates/core/device/numba/mem.py.j2 -------------------------------------------------------------------------------- /nvshmem4py/cmake/addNumbast.cmake: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/cmake/addNumbast.cmake -------------------------------------------------------------------------------- /nvshmem4py/cmake/buildWheel.cmake: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/cmake/buildWheel.cmake -------------------------------------------------------------------------------- /nvshmem4py/examples/device/numba/moe_dataflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/examples/device/numba/moe_dataflow.py -------------------------------------------------------------------------------- /nvshmem4py/examples/device_custom_kernel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/examples/device_custom_kernel.py -------------------------------------------------------------------------------- /nvshmem4py/examples/device_ring_all_reduce.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/examples/device_ring_all_reduce.py -------------------------------------------------------------------------------- /nvshmem4py/examples/init_fini.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/examples/init_fini.py -------------------------------------------------------------------------------- /nvshmem4py/examples/on-stream.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/examples/on-stream.py -------------------------------------------------------------------------------- /nvshmem4py/examples/simple_p2p_kernel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/examples/simple_p2p_kernel.py -------------------------------------------------------------------------------- /nvshmem4py/examples/torch_mempool.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/examples/torch_mempool.py -------------------------------------------------------------------------------- /nvshmem4py/examples/torch_triton_interop.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/examples/torch_triton_interop.py -------------------------------------------------------------------------------- /nvshmem4py/examples/triton_comm_kernels.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/examples/triton_comm_kernels.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/__init__.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/bindings/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/bindings/__init__.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/bindings/_internal/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/bindings/_internal/nvshmem.pxd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/bindings/_internal/nvshmem.pxd -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/bindings/_internal/nvshmem.pyx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/bindings/_internal/nvshmem.pyx -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/bindings/_internal/nvshmem_linux.pyx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/bindings/_internal/nvshmem_linux.pyx -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/bindings/cynvshmem.pxd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/bindings/cynvshmem.pxd -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/bindings/cynvshmem.pyx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/bindings/cynvshmem.pyx -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/bindings/device/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/bindings/device/__init__.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/bindings/device/numba/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/bindings/device/numba/__init__.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/bindings/device/numba/_numbast.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/bindings/device/numba/_numbast.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/bindings/device/numba/entry_point.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/bindings/device/numba/entry_point.h -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/bindings/nvshmem.pxd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/bindings/nvshmem.pxd -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/bindings/nvshmem.pyx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/bindings/nvshmem.pyx -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/core/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/core/__init__.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/core/_internal_tracking.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/core/_internal_tracking.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/core/collective.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/core/collective.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/core/device/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/core/device/__init__.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/core/device/numba/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/core/device/numba/__init__.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/core/device/numba/amo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/core/device/numba/amo.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/core/device/numba/collective.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/core/device/numba/collective.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/core/device/numba/direct.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/core/device/numba/direct.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/core/device/numba/rma.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/core/device/numba/rma.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/core/direct.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/core/direct.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/core/init_fini.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/core/init_fini.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/core/interop/cupy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/core/interop/cupy.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/core/interop/torch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/core/interop/torch.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/core/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/core/memory.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/core/nvshmem_types.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/core/nvshmem_types.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/core/rma.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/core/rma.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/core/teams.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/core/teams.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/core/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/core/utils.py -------------------------------------------------------------------------------- /nvshmem4py/nvshmem/version.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/nvshmem/version.py -------------------------------------------------------------------------------- /nvshmem4py/perftest/alltoall_on_stream.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/perftest/alltoall_on_stream.py -------------------------------------------------------------------------------- /nvshmem4py/perftest/broadcast_on_stream.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/perftest/broadcast_on_stream.py -------------------------------------------------------------------------------- /nvshmem4py/perftest/fcollect_on_stream.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/perftest/fcollect_on_stream.py -------------------------------------------------------------------------------- /nvshmem4py/perftest/reducescatter_on_stream.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/perftest/reducescatter_on_stream.py -------------------------------------------------------------------------------- /nvshmem4py/perftest/reduction_on_stream.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/perftest/reduction_on_stream.py -------------------------------------------------------------------------------- /nvshmem4py/perftest/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/perftest/utils.py -------------------------------------------------------------------------------- /nvshmem4py/requirements_build.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/requirements_build.txt -------------------------------------------------------------------------------- /nvshmem4py/requirements_cuda11.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/requirements_cuda11.txt -------------------------------------------------------------------------------- /nvshmem4py/requirements_cuda12.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/requirements_cuda12.txt -------------------------------------------------------------------------------- /nvshmem4py/requirements_cuda13.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/requirements_cuda13.txt -------------------------------------------------------------------------------- /nvshmem4py/requirements_optional_cuda11.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/requirements_optional_cuda11.txt -------------------------------------------------------------------------------- /nvshmem4py/requirements_optional_cuda12.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/requirements_optional_cuda12.txt -------------------------------------------------------------------------------- /nvshmem4py/requirements_optional_cuda13.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/requirements_optional_cuda13.txt -------------------------------------------------------------------------------- /nvshmem4py/scripts/find_python_versions.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/scripts/find_python_versions.sh -------------------------------------------------------------------------------- /nvshmem4py/scripts/generate_pyproject_toml.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/scripts/generate_pyproject_toml.py -------------------------------------------------------------------------------- /nvshmem4py/setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem4py/setup.py -------------------------------------------------------------------------------- /nvshmem_bootstrap.sym: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem_bootstrap.sym -------------------------------------------------------------------------------- /nvshmem_host.sym: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem_host.sym -------------------------------------------------------------------------------- /nvshmem_transport.sym: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/nvshmem_transport.sym -------------------------------------------------------------------------------- /perftest/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/CMakeLists.txt -------------------------------------------------------------------------------- /perftest/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/README.md -------------------------------------------------------------------------------- /perftest/common/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/common/CMakeLists.txt -------------------------------------------------------------------------------- /perftest/common/atomic_bw_common.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/common/atomic_bw_common.h -------------------------------------------------------------------------------- /perftest/common/atomic_one_sided_common.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/common/atomic_one_sided_common.h -------------------------------------------------------------------------------- /perftest/common/atomic_ping_pong_common.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/common/atomic_ping_pong_common.h -------------------------------------------------------------------------------- /perftest/common/utils.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/common/utils.cu -------------------------------------------------------------------------------- /perftest/common/utils.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/common/utils.h -------------------------------------------------------------------------------- /perftest/device/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/CMakeLists.txt -------------------------------------------------------------------------------- /perftest/device/coll/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/coll/CMakeLists.txt -------------------------------------------------------------------------------- /perftest/device/coll/alltoall_latency.args: -------------------------------------------------------------------------------- 1 | -n 100 -w 10 -b 1 -e 4M -------------------------------------------------------------------------------- /perftest/device/coll/alltoall_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/coll/alltoall_latency.cu -------------------------------------------------------------------------------- /perftest/device/coll/barrier_latency.args: -------------------------------------------------------------------------------- 1 | -n 1000 -w 10 -------------------------------------------------------------------------------- /perftest/device/coll/barrier_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/coll/barrier_latency.cu -------------------------------------------------------------------------------- /perftest/device/coll/bcast_latency.args: -------------------------------------------------------------------------------- 1 | -n 100 -w 10 -b 1 -e 4M -------------------------------------------------------------------------------- /perftest/device/coll/bcast_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/coll/bcast_latency.cu -------------------------------------------------------------------------------- /perftest/device/coll/coll_test.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/coll/coll_test.h -------------------------------------------------------------------------------- /perftest/device/coll/fcollect_latency.args: -------------------------------------------------------------------------------- 1 | -n 100 -w 10 -b 1 -e 4M -------------------------------------------------------------------------------- /perftest/device/coll/fcollect_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/coll/fcollect_latency.cu -------------------------------------------------------------------------------- /perftest/device/coll/redmaxloc_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/coll/redmaxloc_latency.cu -------------------------------------------------------------------------------- /perftest/device/coll/reducescatter_latency.args: -------------------------------------------------------------------------------- 1 | -n 50 -w 10 -b 1 -e 4k -------------------------------------------------------------------------------- /perftest/device/coll/reducescatter_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/coll/reducescatter_latency.cu -------------------------------------------------------------------------------- /perftest/device/coll/reduction_latency.args: -------------------------------------------------------------------------------- 1 | -n 50 -w 10 -b 1 -e 4M -------------------------------------------------------------------------------- /perftest/device/coll/reduction_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/coll/reduction_latency.cu -------------------------------------------------------------------------------- /perftest/device/coll/sync_latency.args: -------------------------------------------------------------------------------- 1 | -n 1000 -w 10 -------------------------------------------------------------------------------- /perftest/device/coll/sync_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/coll/sync_latency.cu -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/CMakeLists.txt -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_atomic_bw.args: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_atomic_bw.args -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_atomic_bw.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_atomic_bw.cu -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_atomic_latency.args: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_atomic_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_atomic_latency.cu -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_atomic_ping_pong_latency.args: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_atomic_ping_pong_latency.args -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_atomic_ping_pong_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_atomic_ping_pong_latency.cu -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_g_bw.args: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_g_bw.args -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_g_bw.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_g_bw.cu -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_g_latency.args: -------------------------------------------------------------------------------- 1 | -n 200 -w 20 -t 512 -e 64K -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_g_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_g_latency.cu -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_get_bw.args: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_get_bw.args -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_get_bw.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_get_bw.cu -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_get_latency.args: -------------------------------------------------------------------------------- 1 | -n 200 -w 20 -t 1024 -e 64K -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_get_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_get_latency.cu -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_p_bw.args: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_p_bw.args -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_p_bw.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_p_bw.cu -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_p_latency.args: -------------------------------------------------------------------------------- 1 | -t 512 -e 64K -n 50 -w 5 -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_p_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_p_latency.cu -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_p_ping_pong_latency.args: -------------------------------------------------------------------------------- 1 | -t 512 -e 16K -n 500 -w 50 -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_p_ping_pong_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_p_ping_pong_latency.cu -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_put_atomic_ping_pong_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_put_atomic_ping_pong_latency.cu -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_put_bw.args: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_put_bw.args -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_put_bw.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_put_bw.cu -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_put_latency.args: -------------------------------------------------------------------------------- 1 | -e 64K -t 1024 -n 200 -w 20 -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_put_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_put_latency.cu -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_put_ping_pong_latency.args: -------------------------------------------------------------------------------- 1 | -e 1M -n 500 -w 50 -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_put_ping_pong_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_put_ping_pong_latency.cu -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_put_signal_ping_pong_latency.args: -------------------------------------------------------------------------------- 1 | -e 1M -n 500 -w 50 -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_put_signal_ping_pong_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_put_signal_ping_pong_latency.cu -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_signal_ping_pong_latency.args: -------------------------------------------------------------------------------- 1 | -n 500 -w 50 -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_signal_ping_pong_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_signal_ping_pong_latency.cu -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_st_bw.args: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_st_bw.args -------------------------------------------------------------------------------- /perftest/device/pt-to-pt/shmem_st_bw.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/pt-to-pt/shmem_st_bw.cu -------------------------------------------------------------------------------- /perftest/device/tile/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/tile/CMakeLists.txt -------------------------------------------------------------------------------- /perftest/device/tile/tile_allgather_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/tile/tile_allgather_latency.cu -------------------------------------------------------------------------------- /perftest/device/tile/tile_allreduce_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/tile/tile_allreduce_latency.cu -------------------------------------------------------------------------------- /perftest/device/tile/tile_coll_test.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/device/tile/tile_coll_test.h -------------------------------------------------------------------------------- /perftest/host/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/CMakeLists.txt -------------------------------------------------------------------------------- /perftest/host/coll/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/coll/CMakeLists.txt -------------------------------------------------------------------------------- /perftest/host/coll/alltoall_on_stream.args: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/coll/alltoall_on_stream.args -------------------------------------------------------------------------------- /perftest/host/coll/alltoall_on_stream.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/coll/alltoall_on_stream.cpp -------------------------------------------------------------------------------- /perftest/host/coll/barrier_all_on_stream.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/coll/barrier_all_on_stream.cpp -------------------------------------------------------------------------------- /perftest/host/coll/barrier_on_stream.args: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/coll/barrier_on_stream.args -------------------------------------------------------------------------------- /perftest/host/coll/barrier_on_stream.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/coll/barrier_on_stream.cpp -------------------------------------------------------------------------------- /perftest/host/coll/broadcast_on_stream.args: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/coll/broadcast_on_stream.args -------------------------------------------------------------------------------- /perftest/host/coll/broadcast_on_stream.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/coll/broadcast_on_stream.cpp -------------------------------------------------------------------------------- /perftest/host/coll/coll_test.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/coll/coll_test.h -------------------------------------------------------------------------------- /perftest/host/coll/fcollect_on_stream.args: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/coll/fcollect_on_stream.args -------------------------------------------------------------------------------- /perftest/host/coll/fcollect_on_stream.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/coll/fcollect_on_stream.cpp -------------------------------------------------------------------------------- /perftest/host/coll/reducescatter_on_stream.args: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/coll/reducescatter_on_stream.args -------------------------------------------------------------------------------- /perftest/host/coll/reducescatter_on_stream.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/coll/reducescatter_on_stream.cpp -------------------------------------------------------------------------------- /perftest/host/coll/reduction_on_stream.args: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/coll/reduction_on_stream.args -------------------------------------------------------------------------------- /perftest/host/coll/reduction_on_stream.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/coll/reduction_on_stream.cpp -------------------------------------------------------------------------------- /perftest/host/coll/sync_all_on_stream.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/coll/sync_all_on_stream.cpp -------------------------------------------------------------------------------- /perftest/host/coll/sync_on_stream.args: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/coll/sync_on_stream.args -------------------------------------------------------------------------------- /perftest/host/coll/sync_on_stream.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/coll/sync_on_stream.cpp -------------------------------------------------------------------------------- /perftest/host/init/CMakeLists.txt: -------------------------------------------------------------------------------- 1 | nvshmem_add_perftest(malloc.cpp) 2 | -------------------------------------------------------------------------------- /perftest/host/init/malloc.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/init/malloc.cpp -------------------------------------------------------------------------------- /perftest/host/pt-to-pt/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/pt-to-pt/CMakeLists.txt -------------------------------------------------------------------------------- /perftest/host/pt-to-pt/bw.args: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/pt-to-pt/bw.args -------------------------------------------------------------------------------- /perftest/host/pt-to-pt/bw.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/pt-to-pt/bw.cpp -------------------------------------------------------------------------------- /perftest/host/pt-to-pt/latency.args: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/pt-to-pt/latency.args -------------------------------------------------------------------------------- /perftest/host/pt-to-pt/latency.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/pt-to-pt/latency.cpp -------------------------------------------------------------------------------- /perftest/host/pt-to-pt/stream_latency.args: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /perftest/host/pt-to-pt/stream_latency.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/host/pt-to-pt/stream_latency.cu -------------------------------------------------------------------------------- /perftest/perfTestRunnerSlurm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/perfTestRunnerSlurm.py -------------------------------------------------------------------------------- /perftest/perftest-ib.list: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/perftest-ib.list -------------------------------------------------------------------------------- /perftest/perftest-mmap-full.list: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/perftest-mmap-full.list -------------------------------------------------------------------------------- /perftest/perftest-mmap-sanity.list: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/perftest-mmap-sanity.list -------------------------------------------------------------------------------- /perftest/perftest-p2p-cudagraph.list: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/perftest-p2p-cudagraph.list -------------------------------------------------------------------------------- /perftest/perftest-p2p-nvlink.list: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/perftest-p2p-nvlink.list -------------------------------------------------------------------------------- /perftest/perftest-p2p-pcie.list: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/perftest-p2p-pcie.list -------------------------------------------------------------------------------- /perftest/perftestCommon.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/perftestCommon.py -------------------------------------------------------------------------------- /perftest/perftestRunner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/perftest/perftestRunner.py -------------------------------------------------------------------------------- /pkg/nvshmem_package_description.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/pkg/nvshmem_package_description.txt -------------------------------------------------------------------------------- /scripts/bitcode_lib_cleanup.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/scripts/bitcode_lib_cleanup.sh -------------------------------------------------------------------------------- /scripts/install_hydra.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/scripts/install_hydra.sh -------------------------------------------------------------------------------- /src/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/CMakeLists.txt -------------------------------------------------------------------------------- /src/bin/nvshmem-info.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/bin/nvshmem-info.cpp -------------------------------------------------------------------------------- /src/device/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/device/CMakeLists.txt -------------------------------------------------------------------------------- /src/device/init/init_device.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/device/init/init_device.cu -------------------------------------------------------------------------------- /src/device/launch/collective_launch.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/device/launch/collective_launch.cpp -------------------------------------------------------------------------------- /src/host/bootstrap/bootstrap.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/bootstrap/bootstrap.cpp -------------------------------------------------------------------------------- /src/host/bootstrap/bootstrap_loader.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/bootstrap/bootstrap_loader.cpp -------------------------------------------------------------------------------- /src/host/coll/alltoall/alltoall.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/coll/alltoall/alltoall.cpp -------------------------------------------------------------------------------- /src/host/coll/alltoall/alltoall.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/coll/alltoall/alltoall.h -------------------------------------------------------------------------------- /src/host/coll/alltoall/alltoall_on_stream.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/coll/alltoall/alltoall_on_stream.cpp -------------------------------------------------------------------------------- /src/host/coll/barrier/barrier.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/coll/barrier/barrier.cpp -------------------------------------------------------------------------------- /src/host/coll/barrier/barrier.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/coll/barrier/barrier.h -------------------------------------------------------------------------------- /src/host/coll/barrier/barrier_on_stream.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/coll/barrier/barrier_on_stream.cpp -------------------------------------------------------------------------------- /src/host/coll/broadcast/broadcast.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/coll/broadcast/broadcast.cpp -------------------------------------------------------------------------------- /src/host/coll/broadcast/broadcast.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/coll/broadcast/broadcast.h -------------------------------------------------------------------------------- /src/host/coll/broadcast/broadcast_on_stream.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/coll/broadcast/broadcast_on_stream.cpp -------------------------------------------------------------------------------- /src/host/coll/cpu_coll.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/coll/cpu_coll.cpp -------------------------------------------------------------------------------- /src/host/coll/cpu_coll.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/coll/cpu_coll.h -------------------------------------------------------------------------------- /src/host/coll/fcollect/fcollect.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/coll/fcollect/fcollect.cpp -------------------------------------------------------------------------------- /src/host/coll/fcollect/fcollect.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/coll/fcollect/fcollect.h -------------------------------------------------------------------------------- /src/host/coll/fcollect/fcollect_on_stream.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/coll/fcollect/fcollect_on_stream.cpp -------------------------------------------------------------------------------- /src/host/coll/fcollect/fcollect_on_stream.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/coll/fcollect/fcollect_on_stream.h -------------------------------------------------------------------------------- /src/host/coll/rdxn/rdxn.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/coll/rdxn/rdxn.cpp -------------------------------------------------------------------------------- /src/host/coll/rdxn/rdxn.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/coll/rdxn/rdxn.h -------------------------------------------------------------------------------- /src/host/coll/rdxn/rdxn_on_stream.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/coll/rdxn/rdxn_on_stream.cpp -------------------------------------------------------------------------------- /src/host/coll/reducescatter/reducescatter.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/coll/reducescatter/reducescatter.cpp -------------------------------------------------------------------------------- /src/host/coll/reducescatter/reducescatter.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/coll/reducescatter/reducescatter.h -------------------------------------------------------------------------------- /src/host/coll/reducescatter/reducescatter_on_stream.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/coll/reducescatter/reducescatter_on_stream.cpp -------------------------------------------------------------------------------- /src/host/comm/amo.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/comm/amo.cpp -------------------------------------------------------------------------------- /src/host/comm/fence.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/comm/fence.cpp -------------------------------------------------------------------------------- /src/host/comm/putget.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/comm/putget.cpp -------------------------------------------------------------------------------- /src/host/comm/quiet.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/comm/quiet.cpp -------------------------------------------------------------------------------- /src/host/comm/rma.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/comm/rma.cu -------------------------------------------------------------------------------- /src/host/comm/sync.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/comm/sync.cpp -------------------------------------------------------------------------------- /src/host/init/cudawrap.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/init/cudawrap.cpp -------------------------------------------------------------------------------- /src/host/init/init.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/init/init.cu -------------------------------------------------------------------------------- /src/host/init/init_nvtx.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/init/init_nvtx.cpp -------------------------------------------------------------------------------- /src/host/init/nvmlwrap.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/init/nvmlwrap.cpp -------------------------------------------------------------------------------- /src/host/init/query_host.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/init/query_host.cpp -------------------------------------------------------------------------------- /src/host/mem/custom_malloc.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/mem/custom_malloc.cpp -------------------------------------------------------------------------------- /src/host/mem/dlmalloc.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/mem/dlmalloc.cpp -------------------------------------------------------------------------------- /src/host/mem/dlmalloc.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/mem/dlmalloc.h -------------------------------------------------------------------------------- /src/host/mem/mem.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/mem/mem.cpp -------------------------------------------------------------------------------- /src/host/mem/mem_heap.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/mem/mem_heap.cpp -------------------------------------------------------------------------------- /src/host/mem/mem_transport.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/mem/mem_transport.cpp -------------------------------------------------------------------------------- /src/host/proxy/proxy.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/proxy/proxy.cpp -------------------------------------------------------------------------------- /src/host/proxy/proxy_host.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/proxy/proxy_host.h -------------------------------------------------------------------------------- /src/host/stream/coll/alltoall/alltoall.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/coll/alltoall/alltoall.cu -------------------------------------------------------------------------------- /src/host/stream/coll/barrier/barrier.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/coll/barrier/barrier.cu -------------------------------------------------------------------------------- /src/host/stream/coll/broadcast/broadcast.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/coll/broadcast/broadcast.cu -------------------------------------------------------------------------------- /src/host/stream/coll/fcollect/fcollect.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/coll/fcollect/fcollect.cu -------------------------------------------------------------------------------- /src/host/stream/coll/rdxn/reduce_and.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/coll/rdxn/reduce_and.cu -------------------------------------------------------------------------------- /src/host/stream/coll/rdxn/reduce_common.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/coll/rdxn/reduce_common.cuh -------------------------------------------------------------------------------- /src/host/stream/coll/rdxn/reduce_max.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/coll/rdxn/reduce_max.cu -------------------------------------------------------------------------------- /src/host/stream/coll/rdxn/reduce_min.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/coll/rdxn/reduce_min.cu -------------------------------------------------------------------------------- /src/host/stream/coll/rdxn/reduce_or.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/coll/rdxn/reduce_or.cu -------------------------------------------------------------------------------- /src/host/stream/coll/rdxn/reduce_prod.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/coll/rdxn/reduce_prod.cu -------------------------------------------------------------------------------- /src/host/stream/coll/rdxn/reduce_sum.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/coll/rdxn/reduce_sum.cu -------------------------------------------------------------------------------- /src/host/stream/coll/rdxn/reduce_team.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/coll/rdxn/reduce_team.cu -------------------------------------------------------------------------------- /src/host/stream/coll/rdxn/reduce_xor.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/coll/rdxn/reduce_xor.cu -------------------------------------------------------------------------------- /src/host/stream/coll/reducescatter/reducescatter_and.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/coll/reducescatter/reducescatter_and.cu -------------------------------------------------------------------------------- /src/host/stream/coll/reducescatter/reducescatter_common.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/coll/reducescatter/reducescatter_common.cuh -------------------------------------------------------------------------------- /src/host/stream/coll/reducescatter/reducescatter_max.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/coll/reducescatter/reducescatter_max.cu -------------------------------------------------------------------------------- /src/host/stream/coll/reducescatter/reducescatter_min.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/coll/reducescatter/reducescatter_min.cu -------------------------------------------------------------------------------- /src/host/stream/coll/reducescatter/reducescatter_or.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/coll/reducescatter/reducescatter_or.cu -------------------------------------------------------------------------------- /src/host/stream/coll/reducescatter/reducescatter_prod.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/coll/reducescatter/reducescatter_prod.cu -------------------------------------------------------------------------------- /src/host/stream/coll/reducescatter/reducescatter_sum.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/coll/reducescatter/reducescatter_sum.cu -------------------------------------------------------------------------------- /src/host/stream/coll/reducescatter/reducescatter_xor.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/coll/reducescatter/reducescatter_xor.cu -------------------------------------------------------------------------------- /src/host/stream/comm/cuda_interface_sync.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/comm/cuda_interface_sync.cu -------------------------------------------------------------------------------- /src/host/stream/comm/quiet_on_stream.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/stream/comm/quiet_on_stream.cu -------------------------------------------------------------------------------- /src/host/team/team.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/team/team.cu -------------------------------------------------------------------------------- /src/host/team/team_internal.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/team/team_internal.cpp -------------------------------------------------------------------------------- /src/host/team/team_internal.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/team/team_internal.h -------------------------------------------------------------------------------- /src/host/team/team_internal_cuda.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/team/team_internal_cuda.cu -------------------------------------------------------------------------------- /src/host/team/team_internal_nvls.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/team/team_internal_nvls.cpp -------------------------------------------------------------------------------- /src/host/topo/topo.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/topo/topo.cpp -------------------------------------------------------------------------------- /src/host/topo/topo.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/topo/topo.h -------------------------------------------------------------------------------- /src/host/transport/p2p/p2p.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/transport/p2p/p2p.cpp -------------------------------------------------------------------------------- /src/host/transport/p2p/p2p.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/transport/p2p/p2p.h -------------------------------------------------------------------------------- /src/host/transport/transport.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/transport/transport.cpp -------------------------------------------------------------------------------- /src/host/util/cs.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/util/cs.cpp -------------------------------------------------------------------------------- /src/host/util/debug.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/util/debug.cpp -------------------------------------------------------------------------------- /src/host/util/env_vars.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/util/env_vars.cpp -------------------------------------------------------------------------------- /src/host/util/shared_memory.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/util/shared_memory.cpp -------------------------------------------------------------------------------- /src/host/util/sockets.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/util/sockets.cpp -------------------------------------------------------------------------------- /src/host/util/util.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/host/util/util.cpp -------------------------------------------------------------------------------- /src/include/bootstrap_device_host/nvshmem_uniqueid.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/bootstrap_device_host/nvshmem_uniqueid.h -------------------------------------------------------------------------------- /src/include/bootstrap_host_transport/env_defs_internal.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/bootstrap_host_transport/env_defs_internal.h -------------------------------------------------------------------------------- /src/include/device/nvshmem_coll_defines.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/device/nvshmem_coll_defines.cuh -------------------------------------------------------------------------------- /src/include/device/nvshmem_defines.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/device/nvshmem_defines.h -------------------------------------------------------------------------------- /src/include/device/nvshmem_device_macros.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/device/nvshmem_device_macros.h -------------------------------------------------------------------------------- /src/include/device/nvshmemx_coll_defines.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/device/nvshmemx_coll_defines.cuh -------------------------------------------------------------------------------- /src/include/device/nvshmemx_collective_launch_apis.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/device/nvshmemx_collective_launch_apis.h -------------------------------------------------------------------------------- /src/include/device/nvshmemx_defines.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/device/nvshmemx_defines.h -------------------------------------------------------------------------------- /src/include/device/tile/nvshmemx_tile_api.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/device/tile/nvshmemx_tile_api.hpp -------------------------------------------------------------------------------- /src/include/device/tile/nvshmemx_tile_api_defines.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/device/tile/nvshmemx_tile_api_defines.cuh -------------------------------------------------------------------------------- /src/include/device_host/nvshmem_common.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/device_host/nvshmem_common.cuh -------------------------------------------------------------------------------- /src/include/device_host/nvshmem_proxy_channel.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/device_host/nvshmem_proxy_channel.h -------------------------------------------------------------------------------- /src/include/device_host/nvshmem_tensor.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/device_host/nvshmem_tensor.h -------------------------------------------------------------------------------- /src/include/device_host/nvshmem_types.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/device_host/nvshmem_types.h -------------------------------------------------------------------------------- /src/include/device_host_transport/nvshmem_common_ibgda.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/device_host_transport/nvshmem_common_ibgda.h -------------------------------------------------------------------------------- /src/include/device_host_transport/nvshmem_common_transport.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/device_host_transport/nvshmem_common_transport.h -------------------------------------------------------------------------------- /src/include/device_host_transport/nvshmem_constants.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/device_host_transport/nvshmem_constants.h -------------------------------------------------------------------------------- /src/include/host/env/env_defs.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/host/env/env_defs.h -------------------------------------------------------------------------------- /src/include/host/nvshmem_api.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/host/nvshmem_api.h -------------------------------------------------------------------------------- /src/include/host/nvshmem_coll_api.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/host/nvshmem_coll_api.h -------------------------------------------------------------------------------- /src/include/host/nvshmem_macros.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/host/nvshmem_macros.h -------------------------------------------------------------------------------- /src/include/host/nvshmemx_api.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/host/nvshmemx_api.h -------------------------------------------------------------------------------- /src/include/host/nvshmemx_coll_api.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/host/nvshmemx_coll_api.h -------------------------------------------------------------------------------- /src/include/internal/bootstrap_host/nvshmemi_bootstrap.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/bootstrap_host/nvshmemi_bootstrap.h -------------------------------------------------------------------------------- /src/include/internal/bootstrap_host_transport/nvshmemi_bootstrap_defines.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/bootstrap_host_transport/nvshmemi_bootstrap_defines.h -------------------------------------------------------------------------------- /src/include/internal/common/error_codes_internal.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/common/error_codes_internal.h -------------------------------------------------------------------------------- /src/include/internal/device/nvshmemi_device.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/device/nvshmemi_device.h -------------------------------------------------------------------------------- /src/include/internal/host/cuda_interface_sync.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/host/cuda_interface_sync.h -------------------------------------------------------------------------------- /src/include/internal/host/custom_malloc.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/host/custom_malloc.h -------------------------------------------------------------------------------- /src/include/internal/host/debug.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/host/debug.h -------------------------------------------------------------------------------- /src/include/internal/host/error_codes_internal.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/host/error_codes_internal.h -------------------------------------------------------------------------------- /src/include/internal/host/nvmlwrap.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/host/nvmlwrap.h -------------------------------------------------------------------------------- /src/include/internal/host/nvshmem_internal.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/host/nvshmem_internal.h -------------------------------------------------------------------------------- /src/include/internal/host/nvshmem_nvtx.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/host/nvshmem_nvtx.hpp -------------------------------------------------------------------------------- /src/include/internal/host/nvshmemi_bootstrap_library.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/host/nvshmemi_bootstrap_library.h -------------------------------------------------------------------------------- /src/include/internal/host/nvshmemi_coll.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/host/nvshmemi_coll.h -------------------------------------------------------------------------------- /src/include/internal/host/nvshmemi_mem_transport.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/host/nvshmemi_mem_transport.hpp -------------------------------------------------------------------------------- /src/include/internal/host/nvshmemi_nvls_rsc.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/host/nvshmemi_nvls_rsc.hpp -------------------------------------------------------------------------------- /src/include/internal/host/nvshmemi_symmetric_heap.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/host/nvshmemi_symmetric_heap.hpp -------------------------------------------------------------------------------- /src/include/internal/host/nvshmemi_team.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/host/nvshmemi_team.h -------------------------------------------------------------------------------- /src/include/internal/host/nvshmemi_types.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/host/nvshmemi_types.h -------------------------------------------------------------------------------- /src/include/internal/host/nvtx3.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/host/nvtx3.hpp -------------------------------------------------------------------------------- /src/include/internal/host/shared_memory.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/host/shared_memory.h -------------------------------------------------------------------------------- /src/include/internal/host/sockets.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/host/sockets.h -------------------------------------------------------------------------------- /src/include/internal/host/util.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/host/util.h -------------------------------------------------------------------------------- /src/include/internal/host_transport/cudawrap.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/host_transport/cudawrap.h -------------------------------------------------------------------------------- /src/include/internal/host_transport/nvshmemi_transport_defines.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/host_transport/nvshmemi_transport_defines.h -------------------------------------------------------------------------------- /src/include/internal/host_transport/transport.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/host_transport/transport.h -------------------------------------------------------------------------------- /src/include/internal/non_abi/nvshmemi_h_to_d_coll_defs.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/non_abi/nvshmemi_h_to_d_coll_defs.cuh -------------------------------------------------------------------------------- /src/include/internal/non_abi/nvshmemi_h_to_d_rma_defs.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/non_abi/nvshmemi_h_to_d_rma_defs.cuh -------------------------------------------------------------------------------- /src/include/internal/non_abi/nvshmemi_h_to_d_sync_defs.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/internal/non_abi/nvshmemi_h_to_d_sync_defs.cuh -------------------------------------------------------------------------------- /src/include/non_abi/device/coll/alltoall.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/device/coll/alltoall.cuh -------------------------------------------------------------------------------- /src/include/non_abi/device/coll/barrier.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/device/coll/barrier.cuh -------------------------------------------------------------------------------- /src/include/non_abi/device/coll/broadcast.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/device/coll/broadcast.cuh -------------------------------------------------------------------------------- /src/include/non_abi/device/coll/defines.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/device/coll/defines.cuh -------------------------------------------------------------------------------- /src/include/non_abi/device/coll/fcollect.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/device/coll/fcollect.cuh -------------------------------------------------------------------------------- /src/include/non_abi/device/coll/reduce.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/device/coll/reduce.cuh -------------------------------------------------------------------------------- /src/include/non_abi/device/coll/reducescatter.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/device/coll/reducescatter.cuh -------------------------------------------------------------------------------- /src/include/non_abi/device/coll/utils.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/device/coll/utils.cuh -------------------------------------------------------------------------------- /src/include/non_abi/device/common/nvshmemi_common_device.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/device/common/nvshmemi_common_device.cuh -------------------------------------------------------------------------------- /src/include/non_abi/device/common/nvshmemi_tile_utils.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/device/common/nvshmemi_tile_utils.cuh -------------------------------------------------------------------------------- /src/include/non_abi/device/pt-to-pt/ibgda_device.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/device/pt-to-pt/ibgda_device.cuh -------------------------------------------------------------------------------- /src/include/non_abi/device/pt-to-pt/nvshmemi_transfer_api.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/device/pt-to-pt/nvshmemi_transfer_api.cuh -------------------------------------------------------------------------------- /src/include/non_abi/device/pt-to-pt/proxy_device.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/device/pt-to-pt/proxy_device.cuh -------------------------------------------------------------------------------- /src/include/non_abi/device/pt-to-pt/tile.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/device/pt-to-pt/tile.cuh -------------------------------------------------------------------------------- /src/include/non_abi/device/pt-to-pt/transfer_device.cuh.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/device/pt-to-pt/transfer_device.cuh.in -------------------------------------------------------------------------------- /src/include/non_abi/device/pt-to-pt/utils_device.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/device/pt-to-pt/utils_device.h -------------------------------------------------------------------------------- /src/include/non_abi/device/team/nvshmemi_team_defines.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/device/team/nvshmemi_team_defines.cuh -------------------------------------------------------------------------------- /src/include/non_abi/device/threadgroup/nvshmemi_common_device_defines.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/device/threadgroup/nvshmemi_common_device_defines.cuh -------------------------------------------------------------------------------- /src/include/non_abi/device/wait/nvshmemi_wait_until_apis.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/device/wait/nvshmemi_wait_until_apis.cuh -------------------------------------------------------------------------------- /src/include/non_abi/nvshmem_build_options.h.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/nvshmem_build_options.h.in -------------------------------------------------------------------------------- /src/include/non_abi/nvshmem_version.h.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/nvshmem_version.h.in -------------------------------------------------------------------------------- /src/include/non_abi/nvshmemx_error.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/non_abi/nvshmemx_error.h -------------------------------------------------------------------------------- /src/include/nvshmem.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/nvshmem.h -------------------------------------------------------------------------------- /src/include/nvshmem_host.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/nvshmem_host.h -------------------------------------------------------------------------------- /src/include/nvshmemx.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/include/nvshmemx.h -------------------------------------------------------------------------------- /src/modules/bootstrap/CMakeLists.txt.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/CMakeLists.txt.in -------------------------------------------------------------------------------- /src/modules/bootstrap/common/CMakeLists.txt.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/common/CMakeLists.txt.in -------------------------------------------------------------------------------- /src/modules/bootstrap/common/bootstrap_util.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/common/bootstrap_util.cpp -------------------------------------------------------------------------------- /src/modules/bootstrap/common/bootstrap_util.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/common/bootstrap_util.h -------------------------------------------------------------------------------- /src/modules/bootstrap/common/env_defs.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/common/env_defs.h -------------------------------------------------------------------------------- /src/modules/bootstrap/mpi/CMakeLists.txt.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/mpi/CMakeLists.txt.in -------------------------------------------------------------------------------- /src/modules/bootstrap/mpi/bootstrap_mpi.c: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/mpi/bootstrap_mpi.c -------------------------------------------------------------------------------- /src/modules/bootstrap/pmi/CMakeLists.txt.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/pmi/CMakeLists.txt.in -------------------------------------------------------------------------------- /src/modules/bootstrap/pmi/bootstrap_pmi.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/pmi/bootstrap_pmi.cpp -------------------------------------------------------------------------------- /src/modules/bootstrap/pmi/pmi-2/COPYRIGHT: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/pmi/pmi-2/COPYRIGHT -------------------------------------------------------------------------------- /src/modules/bootstrap/pmi/pmi-2/pmi2.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/pmi/pmi-2/pmi2.h -------------------------------------------------------------------------------- /src/modules/bootstrap/pmi/pmi-2/pmi2_api.c: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/pmi/pmi-2/pmi2_api.c -------------------------------------------------------------------------------- /src/modules/bootstrap/pmi/pmi-2/pmi2_util.c: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/pmi/pmi-2/pmi2_util.c -------------------------------------------------------------------------------- /src/modules/bootstrap/pmi/pmi-2/pmi2_util.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/pmi/pmi-2/pmi2_util.h -------------------------------------------------------------------------------- /src/modules/bootstrap/pmi/simple-pmi/pmi_internal.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/pmi/simple-pmi/pmi_internal.h -------------------------------------------------------------------------------- /src/modules/bootstrap/pmi/simple-pmi/simple_pmi.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/pmi/simple-pmi/simple_pmi.cpp -------------------------------------------------------------------------------- /src/modules/bootstrap/pmi/simple-pmi/simple_pmiutil.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/pmi/simple-pmi/simple_pmiutil.cpp -------------------------------------------------------------------------------- /src/modules/bootstrap/pmi/simple-pmi/simple_pmiutil.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/pmi/simple-pmi/simple_pmiutil.h -------------------------------------------------------------------------------- /src/modules/bootstrap/pmix/CMakeLists.txt.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/pmix/CMakeLists.txt.in -------------------------------------------------------------------------------- /src/modules/bootstrap/pmix/bootstrap_pmix.c: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/pmix/bootstrap_pmix.c -------------------------------------------------------------------------------- /src/modules/bootstrap/shmem/CMakeLists.txt.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/shmem/CMakeLists.txt.in -------------------------------------------------------------------------------- /src/modules/bootstrap/shmem/bootstrap_shmem.c: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/shmem/bootstrap_shmem.c -------------------------------------------------------------------------------- /src/modules/bootstrap/uid/CMakeLists.txt.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/uid/CMakeLists.txt.in -------------------------------------------------------------------------------- /src/modules/bootstrap/uid/bootstrap_uid.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/uid/bootstrap_uid.cpp -------------------------------------------------------------------------------- /src/modules/bootstrap/uid/bootstrap_uid_remap.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/uid/bootstrap_uid_remap.h -------------------------------------------------------------------------------- /src/modules/bootstrap/uid/bootstrap_uid_types.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/uid/bootstrap_uid_types.hpp -------------------------------------------------------------------------------- /src/modules/bootstrap/uid/ncclSocket/commit_info.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/uid/ncclSocket/commit_info.txt -------------------------------------------------------------------------------- /src/modules/bootstrap/uid/ncclSocket/ncclsocket_checks.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/uid/ncclSocket/ncclsocket_checks.h -------------------------------------------------------------------------------- /src/modules/bootstrap/uid/ncclSocket/ncclsocket_debug.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/uid/ncclSocket/ncclsocket_debug.h -------------------------------------------------------------------------------- /src/modules/bootstrap/uid/ncclSocket/ncclsocket_nccl.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/uid/ncclSocket/ncclsocket_nccl.h -------------------------------------------------------------------------------- /src/modules/bootstrap/uid/ncclSocket/ncclsocket_param.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/uid/ncclSocket/ncclsocket_param.h -------------------------------------------------------------------------------- /src/modules/bootstrap/uid/ncclSocket/ncclsocket_socket.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/uid/ncclSocket/ncclsocket_socket.cpp -------------------------------------------------------------------------------- /src/modules/bootstrap/uid/ncclSocket/ncclsocket_socket.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/uid/ncclSocket/ncclsocket_socket.hpp -------------------------------------------------------------------------------- /src/modules/bootstrap/uid/ncclSocket/ncclsocket_utils.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/bootstrap/uid/ncclSocket/ncclsocket_utils.h -------------------------------------------------------------------------------- /src/modules/transport/CMakeLists.txt.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/CMakeLists.txt.in -------------------------------------------------------------------------------- /src/modules/transport/common/CMakeLists.txt.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/common/CMakeLists.txt.in -------------------------------------------------------------------------------- /src/modules/transport/common/env_defs.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/common/env_defs.h -------------------------------------------------------------------------------- /src/modules/transport/common/mlx5_ifc.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/common/mlx5_ifc.h -------------------------------------------------------------------------------- /src/modules/transport/common/mlx5_prm.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/common/mlx5_prm.h -------------------------------------------------------------------------------- /src/modules/transport/common/transport_common.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/common/transport_common.cpp -------------------------------------------------------------------------------- /src/modules/transport/common/transport_common.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/common/transport_common.h -------------------------------------------------------------------------------- /src/modules/transport/common/transport_gdr_common.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/common/transport_gdr_common.cpp -------------------------------------------------------------------------------- /src/modules/transport/common/transport_gdr_common.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/common/transport_gdr_common.h -------------------------------------------------------------------------------- /src/modules/transport/common/transport_ib_common.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/common/transport_ib_common.cpp -------------------------------------------------------------------------------- /src/modules/transport/common/transport_ib_common.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/common/transport_ib_common.h -------------------------------------------------------------------------------- /src/modules/transport/common/transport_mlx5_common.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/common/transport_mlx5_common.cpp -------------------------------------------------------------------------------- /src/modules/transport/common/transport_mlx5_common.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/common/transport_mlx5_common.h -------------------------------------------------------------------------------- /src/modules/transport/ibdevx/CMakeLists.txt.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/ibdevx/CMakeLists.txt.in -------------------------------------------------------------------------------- /src/modules/transport/ibdevx/ibdevx.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/ibdevx/ibdevx.cpp -------------------------------------------------------------------------------- /src/modules/transport/ibdevx/ibdevx.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/ibdevx/ibdevx.h -------------------------------------------------------------------------------- /src/modules/transport/ibgda/CMakeLists.txt.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/ibgda/CMakeLists.txt.in -------------------------------------------------------------------------------- /src/modules/transport/ibgda/ibgda.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/ibgda/ibgda.cpp -------------------------------------------------------------------------------- /src/modules/transport/ibrc/CMakeLists.txt.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/ibrc/CMakeLists.txt.in -------------------------------------------------------------------------------- /src/modules/transport/ibrc/ibrc.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/ibrc/ibrc.cpp -------------------------------------------------------------------------------- /src/modules/transport/libfabric/CMakeLists.txt.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/libfabric/CMakeLists.txt.in -------------------------------------------------------------------------------- /src/modules/transport/libfabric/libfabric.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/libfabric/libfabric.cpp -------------------------------------------------------------------------------- /src/modules/transport/libfabric/libfabric.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/libfabric/libfabric.h -------------------------------------------------------------------------------- /src/modules/transport/ucx/CMakeLists.txt.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/ucx/CMakeLists.txt.in -------------------------------------------------------------------------------- /src/modules/transport/ucx/ucx.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/ucx/ucx.cpp -------------------------------------------------------------------------------- /src/modules/transport/ucx/ucx.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/nvshmem/HEAD/src/modules/transport/ucx/ucx.h --------------------------------------------------------------------------------