├── .gitignore ├── CONTRIBUTING.md ├── LICENSE.txt ├── README.md ├── SECURITY.md ├── autoscaling ├── .DS_Store ├── clusters │ └── README ├── credentials │ └── key.sh ├── crontab │ └── autoscale_slurm.sh ├── provider_inst_prin.tpl ├── provider_user.tpl └── tf_init │ ├── cluster-network-configuration.tf │ ├── cluster-network.tf │ ├── compute-cluster.tf │ ├── compute-nodes.tf │ ├── config.controller │ ├── config.hpc │ ├── controller_update.tf │ ├── data.tf │ ├── instance-pool-configuration.tf │ ├── instance-pool.tf │ ├── inventory.tpl │ ├── locals.tf │ ├── marketplace.tf │ ├── network.tf │ ├── outputs.tf │ ├── user_data.tf │ └── versions.tf ├── bin ├── cleanup.sh ├── configure.sh ├── configure_as.sh ├── controller.sh ├── create_cluster.sh ├── delete_cluster.sh ├── find_reachable_hosts.sh ├── initial_monitoring.sh ├── rdma_metrics_collection_config.conf ├── remove_nodes_prompt.txt ├── resize.sh ├── resize │ ├── ociobj.py │ ├── reconfigure.py │ ├── resize.py │ └── utils.py ├── slurm_config.sh ├── upload_rdma_nic_metrics.sh └── wait_for_hosts.sh ├── cluster-network-configuration.tf ├── cluster-network.tf ├── compute-cluster.tf ├── compute-nodes.tf ├── conf ├── queues.conf.example └── variables.tpl ├── config.controller ├── config.hpc ├── configure.tpl ├── controller.tf ├── data.tf ├── fss.tf ├── initial_mon.tpl ├── instance-pool-configuration.tf ├── instance-pool.tf ├── inventory.tpl ├── locals.tf ├── login.tf ├── logs └── README ├── lustre.tf ├── marketplace.tf ├── monitoring.tf ├── mysql.tf ├── network.tf ├── oci_images.tf ├── outputs.tf ├── playbooks ├── destroy.yml ├── group_vars │ └── all.yml ├── monitoring.yml ├── new_nodes.yml ├── resize_add.yml ├── resize_remove.yml ├── resize_remove_unreachable.yml ├── roles │ ├── autoscaling_mon │ │ ├── defaults │ │ │ └── main.yml │ │ ├── files │ │ │ ├── dashboard.json │ │ │ ├── initial.sh │ │ │ ├── initial.sql │ │ │ ├── monitor_oci.sh │ │ │ └── monitor_slurm.sh │ │ ├── tasks │ │ │ ├── el.yml │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ │ └── templates │ │ │ ├── env.j2 │ │ │ └── mysql_service_initial.j2 │ ├── boot-volume │ │ └── tasks │ │ │ ├── el.yml │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ ├── cloud-agent_update │ │ └── tasks │ │ │ ├── el.yml │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ ├── cluster-cli │ │ ├── files │ │ │ └── cluster │ │ └── tasks │ │ │ ├── debian.yml │ │ │ ├── el7.yml │ │ │ ├── el8.yml │ │ │ └── main.yml │ ├── cron │ │ └── tasks │ │ │ ├── el.yml │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ ├── destroy_unreachable │ │ └── tasks │ │ │ ├── common.yml │ │ │ ├── main.yml │ │ │ ├── slurm-rack-aware.yml │ │ │ └── slurm.yml │ ├── disable_core_dumps │ │ └── tasks │ │ │ └── main.yml │ ├── docker │ │ ├── tasks │ │ │ ├── main.yml │ │ │ ├── oraclelinux.yml │ │ │ └── ubuntu.yml │ │ └── templates │ │ │ └── templates.j2 │ ├── etc-hosts │ │ ├── tasks │ │ │ ├── common.yml │ │ │ └── main.yml │ │ └── templates │ │ │ ├── etc-hosts-controller.j2 │ │ │ └── etc-hosts.j2 │ ├── firewall │ │ ├── files │ │ │ └── off-iptables.sh │ │ └── tasks │ │ │ ├── el.yml │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ ├── fix_broken │ │ ├── README.md │ │ └── tasks │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ ├── fix_ldap │ │ └── tasks │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ ├── fss-home │ │ └── tasks │ │ │ ├── el.yml │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ ├── grafana │ │ ├── defaults │ │ │ └── main.yml │ │ ├── files │ │ │ ├── alert-rules.yaml │ │ │ ├── cluster-dashboard.jsonnet │ │ │ ├── cluster-level-variables.libsonnet │ │ │ ├── cluster-level.jsonnet │ │ │ ├── cluster-variables.libsonnet │ │ │ ├── cluster.json │ │ │ ├── cluster_amd.json │ │ │ ├── cluster_prometheus.json │ │ │ ├── cluster_prometheus_v2.json │ │ │ ├── command-center-variables.libsonnet │ │ │ ├── command-center.jsonnet │ │ │ ├── delete-rules.yaml │ │ │ ├── g.libsonnet │ │ │ ├── gauge-panel-util.libsonnet │ │ │ ├── gauge-panel.libsonnet │ │ │ ├── gpu-health.jsonnet │ │ │ ├── gpu-metrics-single-variables.libsonnet │ │ │ ├── gpu-metrics-single.jsonnet │ │ │ ├── host-metrics-single-variables.libsonnet │ │ │ ├── host-metrics-single.jsonnet │ │ │ ├── main.jsonnet │ │ │ ├── multi-node-variables.libsonnet │ │ │ ├── multi-node.jsonnet │ │ │ ├── nccl-traces.jsonnet │ │ │ ├── node_exporter.json │ │ │ ├── oci-dashboard.jsonnet │ │ │ ├── oci-variables.libsonnet │ │ │ ├── raw_message_template.txt │ │ │ ├── rdma-hw-counters.json │ │ │ ├── slurm-dashboard.jsonnet │ │ │ ├── slurm-variables.libsonnet │ │ │ ├── stat-health-panel.libsonnet │ │ │ ├── stat-panel-single.libsonnet │ │ │ ├── stat-panel.libsonnet │ │ │ ├── statetimeline-panel.libsonnet │ │ │ ├── storage-metrics-variables.libsonnet │ │ │ ├── storage-metrics.jsonnet │ │ │ ├── table-panel.libsonnet │ │ │ ├── timeseries-panel.libsonnet │ │ │ └── variables.libsonnet │ │ ├── tasks │ │ │ ├── dashboard.yml │ │ │ ├── el.yml │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ │ └── templates │ │ │ ├── ons-webhook.service.j2 │ │ │ └── ons_webhook.py.j2 │ ├── healthchecks │ │ ├── defaults │ │ │ └── main.yml │ │ ├── files │ │ │ ├── check_gpu_setup.py │ │ │ ├── gpu_bw_test.py │ │ │ ├── meshpinger_readme.md │ │ │ ├── rdma_link_flapping.py │ │ │ ├── run_meshpinger.sh │ │ │ ├── shared_logging.py │ │ │ └── xid_checker.py │ │ └── tasks │ │ │ └── main.yml │ ├── home_nfs │ │ └── tasks │ │ │ ├── el.yml │ │ │ └── main.yml │ ├── hostname │ │ └── tasks │ │ │ ├── el.yml │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ ├── hyperthreading │ │ ├── files │ │ │ ├── control_hyperthreading.sh │ │ │ ├── control_hyperthreading_ubuntu.sh │ │ │ ├── disable-hyperthreading.service │ │ │ └── disable-hyperthreading_ubuntu.service │ │ └── tasks │ │ │ ├── el.yml │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ ├── influxdb │ │ ├── defaults │ │ │ └── main.yml │ │ ├── handlers │ │ │ └── main.yml │ │ ├── tasks │ │ │ ├── config_influxdb.yml │ │ │ ├── el.yml │ │ │ ├── el_install_influxdb.yml │ │ │ ├── main.yml │ │ │ ├── ubuntu.yml │ │ │ └── ubuntu_install_influxdb.yml │ │ └── templates │ │ │ └── influxdb.conf.j2 │ ├── iscsi │ │ └── tasks │ │ │ ├── debian.yml │ │ │ ├── el.yml │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ ├── latency_check │ │ ├── tasks │ │ │ ├── el.yml │ │ │ └── main.yml │ │ └── templates │ │ │ └── latency_check.sh.j2 │ ├── limits │ │ ├── tasks │ │ │ ├── common.yml │ │ │ └── main.yml │ │ └── templates │ │ │ └── limits.j2 │ ├── localdisk │ │ ├── defaults │ │ │ └── main.yml │ │ └── tasks │ │ │ ├── common.yml │ │ │ ├── debian.yml │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ ├── lustre-client │ │ ├── defaults │ │ │ └── main.yml │ │ ├── files │ │ │ └── install_lustre_ubuntu.sh │ │ └── tasks │ │ │ ├── el.yml │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ ├── metrics-exporter │ │ ├── defaults │ │ │ └── main.yml │ │ ├── files │ │ │ ├── custom_metric_common.py │ │ │ ├── dcgm-counters.csv │ │ │ ├── nccl_profiler_exporter.py │ │ │ ├── node_exporter.service │ │ │ ├── nvidia-allow-prof.conf │ │ │ ├── nvlink_counters_exporter.py │ │ │ ├── nvml_metrics_exporter.py │ │ │ ├── pcie_faults_exporter.py │ │ │ ├── rdma_counters_exporter.py │ │ │ ├── rdma_link_flapping.py │ │ │ ├── shared_logging.py │ │ │ └── xid_checker.py │ │ ├── tasks │ │ │ ├── custom_metrics.yml │ │ │ ├── dcgm_exporter.yml │ │ │ ├── main.yml │ │ │ ├── nccl_profiler.yml │ │ │ ├── node_exporter_el.yml │ │ │ ├── node_exporter_ubuntu.yml │ │ │ ├── nvlink_exporter.yml │ │ │ ├── nvml_exporter.yml │ │ │ ├── pcie_faults.yml │ │ │ └── rdma_exporter.yml │ │ ├── templates │ │ │ ├── customMetrics.service.j2 │ │ │ ├── custom_metrics.py.j2 │ │ │ ├── dcgm-exporter.service.j2 │ │ │ ├── nccl-profiler-exporter.service.j2 │ │ │ ├── nvlink-exporter.service.j2 │ │ │ ├── nvml-exporter.service.j2 │ │ │ ├── pcie-faults-exporter.service.j2 │ │ │ ├── prometheus.yml.j2 │ │ │ └── rdma-exporter.service.j2 │ │ └── vars │ │ │ └── main.yml │ ├── mpi-hostfiles │ │ ├── tasks │ │ │ ├── common.yml │ │ │ └── main.yml │ │ └── templates │ │ │ ├── hostfile_rdma.j2 │ │ │ └── hostfile_tcp.j2 │ ├── mpivars │ │ ├── defaults │ │ │ └── main.yml │ │ ├── tasks │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ │ ├── templates │ │ │ └── mpivars.j2 │ │ └── vars │ │ │ └── main.yml │ ├── multiple-mount-target │ │ ├── defaults │ │ │ └── main.yml │ │ ├── files │ │ │ └── mmt.py │ │ └── tasks │ │ │ ├── debian.yml │ │ │ ├── el.yml │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ ├── mysql │ │ ├── files │ │ │ └── innodb.cnf │ │ ├── handlers │ │ │ └── main.yml │ │ ├── tasks │ │ │ ├── centos.yml │ │ │ ├── debian.yml │ │ │ ├── el.yml │ │ │ └── main.yml │ │ ├── templates │ │ │ ├── debian_mariadb_etc_my.cnf.j2 │ │ │ ├── debian_my.cnf.j2 │ │ │ ├── mariadb_etc_my.cnf.j2 │ │ │ ├── my.cnf.j2 │ │ │ └── mysqld_etc_my.cnf.j2 │ │ └── vars │ │ │ ├── ol_vars.yml │ │ │ ├── ubuntu-2204_vars.yml │ │ │ └── ubuntu_vars.yml │ ├── nccl-conf │ │ ├── tasks │ │ │ └── main.yml │ │ └── templates │ │ │ ├── a100_b4.8 │ │ │ ├── b200 │ │ │ ├── bm.gpu4.8 │ │ │ ├── h100 │ │ │ └── h200 │ ├── nfs-client │ │ ├── defaults │ │ │ └── main.yml │ │ ├── meta │ │ │ └── main.yml │ │ ├── tasks │ │ │ ├── debian.yml │ │ │ ├── el.yml │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ │ └── vars │ │ │ └── main.yml │ ├── nfs-server │ │ ├── defaults │ │ │ └── main.yml │ │ ├── handlers │ │ │ └── main.yml │ │ ├── meta │ │ │ └── main.yml │ │ ├── tasks │ │ │ ├── debian.yml │ │ │ ├── el.yml │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ │ ├── templates │ │ │ └── exports.j2 │ │ └── vars │ │ │ └── main.yml │ ├── no_instance_principal │ │ ├── defaults │ │ │ └── main.yml │ │ ├── meta │ │ │ └── main.yml │ │ ├── tasks │ │ │ ├── common.yml │ │ │ └── main.yml │ │ ├── templates │ │ │ └── config.j2 │ │ └── vars │ │ │ └── main.yml │ ├── nvidia-container │ │ ├── defaults │ │ │ └── main.yml │ │ ├── tasks │ │ │ ├── main.yml │ │ │ ├── oraclelinux-7.yml │ │ │ └── ubuntu.yml │ │ ├── templates │ │ │ └── templates.j2 │ │ └── vars │ │ │ └── main.yml │ ├── nvidia-enroot │ │ └── tasks │ │ │ ├── main.yml │ │ │ ├── oraclelinux.yml │ │ │ └── ubuntu.yml │ ├── nvidia_peermem │ │ ├── defaults │ │ │ └── main.yml │ │ ├── tasks │ │ │ ├── common.yml │ │ │ └── main.yml │ │ └── vars │ │ │ └── main.yml │ ├── oci-cloud-agent-updater │ │ └── tasks │ │ │ ├── el.yml │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ ├── oci-cloud-agent │ │ └── tasks │ │ │ ├── el.yml │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ ├── oci-cn-auth │ │ ├── defaults │ │ │ └── main.yml │ │ └── tasks │ │ │ ├── el.yml │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ ├── oci-hostname │ │ └── tasks │ │ │ ├── el.yml │ │ │ └── main.yml │ ├── oci-legacy │ │ └── tasks │ │ │ ├── el.yml │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ ├── oci-metrics │ │ ├── files │ │ │ ├── oci-fss-metrics-exporter.py │ │ │ ├── oci-lustre-metrics-exporter.py │ │ │ └── oci-rdma-faults-exporter.py │ │ ├── tasks │ │ │ └── main.yml │ │ └── templates │ │ │ ├── oci-fss-exporter.service.j2 │ │ │ ├── oci-lustre-exporter.service.j2 │ │ │ └── oci-rdma-faults-exporter.service.j2 │ ├── oom-adjust │ │ ├── defaults │ │ │ └── main.yml │ │ ├── files │ │ │ └── oom-adjust.conf │ │ └── tasks │ │ │ └── main.yml │ ├── openldap │ │ ├── defaults │ │ │ └── main.yml │ │ ├── files │ │ │ ├── autoinc.ldif │ │ │ ├── debian_memberof.ldif │ │ │ ├── debian_ppolicy.ldif │ │ │ ├── el_memberof.ldif │ │ │ ├── el_memberof_ol8.ldif │ │ │ ├── el_ppolicy.ldif │ │ │ ├── el_ppolicy_ol8.ldif │ │ │ ├── local_schema.ldif │ │ │ ├── rfc2307bis.ldif │ │ │ └── slapd │ │ ├── handlers │ │ │ └── main.yml │ │ ├── meta │ │ │ └── main.yml │ │ ├── tasks │ │ │ ├── debian.yml │ │ │ ├── el.yml │ │ │ └── main.yml │ │ ├── templates │ │ │ ├── config.ldif.j2 │ │ │ ├── debian_local.ldif.j2 │ │ │ ├── el_local.ldif.j2 │ │ │ └── el_local_ol8.ldif.j2 │ │ └── vars │ │ │ ├── debian_vars.yml │ │ │ └── el_vars.yml │ ├── packages │ │ └── tasks │ │ │ ├── centos-7.yml │ │ │ ├── debian.yml │ │ │ ├── el-7.yml │ │ │ ├── main.yml │ │ │ ├── ol-7.yml │ │ │ ├── ol-8.yml │ │ │ ├── ubuntu-2204.yml │ │ │ └── ubuntu.yml │ ├── passwords │ │ └── tasks │ │ │ └── main.yml │ ├── privilege_group │ │ └── tasks │ │ │ ├── common.yml │ │ │ ├── el.yml │ │ │ └── main.yml │ ├── prometheus │ │ ├── defaults │ │ │ └── main.yml │ │ ├── files │ │ │ └── recording_rules.yml │ │ ├── tasks │ │ │ ├── cleanup_targets.yml │ │ │ ├── create_target.yml │ │ │ ├── gather_info.yml │ │ │ ├── main.yml │ │ │ └── setup_prometheus.yml │ │ └── templates │ │ │ ├── prometheus.conf.j2 │ │ │ ├── prometheus.service.j2 │ │ │ ├── prometheus.yml.j2 │ │ │ └── prometheus_target.json.j2 │ ├── rack-aware │ │ ├── files │ │ │ └── node_ordering_by_rack.py │ │ └── tasks │ │ │ ├── el.yml │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ ├── rdma-interface │ │ ├── defaults │ │ │ └── main.yml │ │ ├── handlers │ │ │ └── main.yml │ │ ├── tasks │ │ │ ├── debian.yml │ │ │ ├── el.yml │ │ │ └── main.yml │ │ ├── templates │ │ │ ├── ifcfg.j2 │ │ │ └── interface.j2 │ │ └── vars │ │ │ └── main.yml │ ├── rttcc │ │ └── tasks │ │ │ └── main.yml │ ├── safe_yum │ │ └── tasks │ │ │ ├── el.yml │ │ │ ├── main.yml │ │ │ └── ubuntu.yml │ ├── slurm │ │ ├── defaults │ │ │ └── main.yml │ │ ├── files │ │ │ ├── cgroup.conf │ │ │ ├── healthchecks.sh │ │ │ └── sshd │ │ ├── handlers │ │ │ └── main.yml │ │ ├── tasks │ │ │ ├── backup_server.yml │ │ │ ├── cleanup.yml │ │ │ ├── common.yml │ │ │ ├── common_pmix.yml │ │ │ ├── common_pyxis.yml │ │ │ ├── compute-rack-aware.yml │ │ │ ├── compute.yml │ │ │ ├── compute_pam.yml │ │ │ ├── controller.yml │ │ │ ├── destroy-rack-aware.yml │ │ │ ├── destroy.yml │ │ │ ├── download.yml │ │ │ ├── el7.yml │ │ │ ├── el8.yml │ │ │ ├── login.yml │ │ │ ├── main.yml │ │ │ ├── move-topology.yml │ │ │ ├── server.yml │ │ │ └── ubuntu.yml │ │ ├── templates │ │ │ ├── gres.conf.j2 │ │ │ ├── pyxis.sh.j2 │ │ │ ├── slurm.conf.j2 │ │ │ ├── slurmdbd.conf.j2 │ │ │ ├── systemd │ │ │ │ ├── munge.service.d │ │ │ │ │ └── unit.conf.j2 │ │ │ │ ├── sackd.service.d │ │ │ │ │ └── unit.conf.j2 │ │ │ │ ├── sackd.service.j2 │ │ │ │ ├── slurm_env.j2 │ │ │ │ ├── slurmctld.service.d │ │ │ │ │ └── unit.conf.j2 │ │ │ │ ├── slurmctld.service.j2 │ │ │ │ ├── slurmctld_backup.service.d │ │ │ │ │ └── unit.conf.j2 │ │ │ │ ├── slurmd.service.d │ │ │ │ │ └── unit.conf.j2 │ │ │ │ ├── slurmd.service.j2 │ │ │ │ ├── slurmdbd.service.d │ │ │ │ │ └── unit.conf.j2 │ │ │ │ └── slurmdbd.service.j2 │ │ │ └── topology.conf.j2 │ │ └── vars │ │ │ ├── centos_vars.yml │ │ │ ├── el_vars.yml │ │ │ └── ubuntu_vars.yml │ ├── slurm_rest_api │ │ ├── defaults │ │ │ └── main.yml │ │ ├── handlers │ │ │ └── main.yml │ │ ├── tasks │ │ │ ├── main.yml │ │ │ ├── slurm_exporter.yml │ │ │ ├── slurm_restd.yml │ │ │ └── slurm_sdk.yml │ │ └── templates │ │ │ ├── slurm-exporter.py.j2 │ │ │ ├── slurm-exporter.service.j2 │ │ │ └── slurmrestd.service.j2 │ ├── spack │ │ ├── defaults │ │ │ └── main.yml │ │ ├── tasks │ │ │ ├── debian.yml │ │ │ ├── el.yml │ │ │ └── main.yml │ │ └── templates │ │ │ └── spack.j2 │ ├── ssh │ │ ├── files │ │ │ └── ssh_config │ │ └── tasks │ │ │ ├── common.yml │ │ │ └── main.yml │ ├── ssl │ │ ├── defaults │ │ │ └── main.yml │ │ ├── tasks │ │ │ ├── debian.yml │ │ │ ├── el.yml │ │ │ └── main.yml │ │ └── templates │ │ │ └── san.conf.j2 │ ├── sssd │ │ ├── handlers │ │ │ └── main.yml │ │ ├── tasks │ │ │ ├── debian.yml │ │ │ ├── el-7.yml │ │ │ ├── el-8.yml │ │ │ └── main.yml │ │ ├── templates │ │ │ ├── sssd.conf.j2 │ │ │ └── sssd_ubuntu.conf.j2 │ │ └── vars │ │ │ └── main.yml │ ├── telegraf │ │ ├── defaults │ │ │ └── main.yml │ │ ├── files │ │ │ ├── telegraf.conf │ │ │ ├── telegraf_amd_gpu.conf │ │ │ └── telegraf_nvidia_gpu.conf │ │ ├── handlers │ │ │ └── main.yml │ │ ├── meta │ │ │ └── main.yml │ │ ├── tasks │ │ │ ├── common.yml │ │ │ └── main.yml │ │ └── templates │ │ │ ├── amd_gpu.conf.j2 │ │ │ ├── custom.cnf.j2 │ │ │ ├── ethtool_counters.conf.j2 │ │ │ ├── infiniband.conf.j2 │ │ │ ├── infiniband_mlx5_0_hw_counters.conf.j2 │ │ │ ├── infiniband_mlx5_10_hw_counters.conf.j2 │ │ │ ├── infiniband_mlx5_11_hw_counters.conf.j2 │ │ │ ├── infiniband_mlx5_12_hw_counters.conf.j2 │ │ │ ├── infiniband_mlx5_13_hw_counters.conf.j2 │ │ │ ├── infiniband_mlx5_14_hw_counters.conf.j2 │ │ │ ├── infiniband_mlx5_15_hw_counters.conf.j2 │ │ │ ├── infiniband_mlx5_16_hw_counters.conf.j2 │ │ │ ├── infiniband_mlx5_1_hw_counters.conf.j2 │ │ │ ├── infiniband_mlx5_2_hw_counters.conf.j2 │ │ │ ├── infiniband_mlx5_3_hw_counters.conf.j2 │ │ │ ├── infiniband_mlx5_4_hw_counters.conf.j2 │ │ │ ├── infiniband_mlx5_5_hw_counters.conf.j2 │ │ │ ├── infiniband_mlx5_6_hw_counters.conf.j2 │ │ │ ├── infiniband_mlx5_7_hw_counters.conf.j2 │ │ │ ├── infiniband_mlx5_8_hw_counters.conf.j2 │ │ │ ├── infiniband_mlx5_9_hw_counters.conf.j2 │ │ │ ├── influxdb.conf.j2 │ │ │ ├── net.conf.j2 │ │ │ ├── nvidia_gpu.conf.j2 │ │ │ └── prometheus.conf.j2 │ ├── tuned │ │ ├── files │ │ │ └── tuned.conf │ │ └── tasks │ │ │ ├── el-7.yml │ │ │ └── main.yml │ ├── weka_client │ │ └── tasks │ │ │ └── main.yml │ └── yaml │ │ └── tasks │ │ ├── el.yml │ │ ├── main.yml │ │ └── ubuntu.yml ├── site.yml ├── slurm_config.yml └── slurm_config_as.yml ├── provider.tf ├── queues.conf ├── samples ├── NCCL_readme ├── disable_ht.sh ├── gpu │ ├── H100-topology-kubernetes.xml │ ├── H100-topology.xml │ ├── ifdown.sh │ ├── ifup.sh │ ├── nccl_run_allreduce.sbatch │ ├── nccl_run_allreduce.sh │ ├── nccl_run_allreduce_H100_200.sbatch │ ├── nccl_run_allreduce_H100_200.sh │ ├── nccl_run_allreduce_containers_H100_H200.sbatch │ ├── nccl_run_allreduce_containers_with_ordering.sbatch │ ├── nccl_run_allreduce_srun.sbatch │ ├── nccl_run_allreduce_srun.sh │ ├── nccl_run_allreduce_tuner.sbatch │ ├── nccl_run_allreduce_tuner.sh │ ├── nccl_run_alltoall.sh │ ├── no_ncclparam_nccl_run_allreduce.sbatch │ ├── no_ncclparam_nccl_run_allreduce.sh │ ├── no_ncclparam_nccl_run_allreduce_H100_H200.sbatch │ ├── no_ncclparam_nccl_run_allreduce_H100_H200.sh │ ├── notes.txt │ ├── ping.sh │ ├── qfabv1_nccl_run_allreduce.sbatch │ ├── qfabv1_nccl_run_allreduce.sh │ ├── qfabv1_nccl_run_alltoall.sh │ ├── rccl_run_allreduce.sbatch │ ├── srun_examples_with_container.txt │ ├── topo-flattened-b4.xml │ ├── topo-flattened.xml │ ├── update_arp_settings.sh │ └── update_netmask.sh ├── nccl_compile │ └── compile.sh ├── nfs │ ├── README.txt │ └── fix_nfs.sh ├── open-ldap │ ├── add-ldap-users.yml │ └── add-linux-group.yml ├── prep_sample_files.sh ├── rdma-tuning │ ├── check_pcie_max_read.sh │ ├── pcie_max_read.sh │ ├── pcie_max_read_default.sh │ ├── rdma-nic-tuning-1.sh │ ├── rdma-nic-tuning-2.sh │ └── rdma-nic-tuning-validate.sh └── submit │ ├── sleep.sbatch │ └── sleep_gpu.sbatch ├── schema.yaml ├── scripts ├── check_firmware_version.sh ├── collect_logs.py ├── collect_metadata │ ├── collect_metadata.py │ └── requirements.txt ├── create_instance_config.py ├── gpu_throttle.sh ├── h100_script.py ├── ib_write_bw.sh ├── ib_write_lat.sh ├── max_nodes_partition.py ├── ncclscout.py ├── pcie.sh ├── runNCCL_on_hostPair.sh └── validation.py ├── slurm_ha.tf ├── user_data.tf ├── variables.tf └── versions.tf /.gitignore: -------------------------------------------------------------------------------- 1 | .DS_Store 2 | -------------------------------------------------------------------------------- /CONTRIBUTING.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/CONTRIBUTING.md -------------------------------------------------------------------------------- /LICENSE.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/LICENSE.txt -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/README.md -------------------------------------------------------------------------------- /SECURITY.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/SECURITY.md -------------------------------------------------------------------------------- /autoscaling/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/autoscaling/.DS_Store -------------------------------------------------------------------------------- /autoscaling/clusters/README: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/autoscaling/clusters/README -------------------------------------------------------------------------------- /autoscaling/credentials/key.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/autoscaling/credentials/key.sh -------------------------------------------------------------------------------- /autoscaling/crontab/autoscale_slurm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/autoscaling/crontab/autoscale_slurm.sh -------------------------------------------------------------------------------- /autoscaling/provider_inst_prin.tpl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/autoscaling/provider_inst_prin.tpl -------------------------------------------------------------------------------- /autoscaling/provider_user.tpl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/autoscaling/provider_user.tpl -------------------------------------------------------------------------------- /autoscaling/tf_init/cluster-network-configuration.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/autoscaling/tf_init/cluster-network-configuration.tf -------------------------------------------------------------------------------- /autoscaling/tf_init/cluster-network.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/autoscaling/tf_init/cluster-network.tf -------------------------------------------------------------------------------- /autoscaling/tf_init/compute-cluster.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/autoscaling/tf_init/compute-cluster.tf -------------------------------------------------------------------------------- /autoscaling/tf_init/compute-nodes.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/autoscaling/tf_init/compute-nodes.tf -------------------------------------------------------------------------------- /autoscaling/tf_init/config.controller: -------------------------------------------------------------------------------- 1 | #cloud-config 2 | -------------------------------------------------------------------------------- /autoscaling/tf_init/config.hpc: -------------------------------------------------------------------------------- 1 | #cloud-config 2 | -------------------------------------------------------------------------------- /autoscaling/tf_init/controller_update.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/autoscaling/tf_init/controller_update.tf -------------------------------------------------------------------------------- /autoscaling/tf_init/data.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/autoscaling/tf_init/data.tf -------------------------------------------------------------------------------- /autoscaling/tf_init/instance-pool-configuration.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/autoscaling/tf_init/instance-pool-configuration.tf -------------------------------------------------------------------------------- /autoscaling/tf_init/instance-pool.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/autoscaling/tf_init/instance-pool.tf -------------------------------------------------------------------------------- /autoscaling/tf_init/inventory.tpl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/autoscaling/tf_init/inventory.tpl -------------------------------------------------------------------------------- /autoscaling/tf_init/locals.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/autoscaling/tf_init/locals.tf -------------------------------------------------------------------------------- /autoscaling/tf_init/marketplace.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/autoscaling/tf_init/marketplace.tf -------------------------------------------------------------------------------- /autoscaling/tf_init/network.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/autoscaling/tf_init/network.tf -------------------------------------------------------------------------------- /autoscaling/tf_init/outputs.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/autoscaling/tf_init/outputs.tf -------------------------------------------------------------------------------- /autoscaling/tf_init/user_data.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/autoscaling/tf_init/user_data.tf -------------------------------------------------------------------------------- /autoscaling/tf_init/versions.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/autoscaling/tf_init/versions.tf -------------------------------------------------------------------------------- /bin/cleanup.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/bin/cleanup.sh -------------------------------------------------------------------------------- /bin/configure.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/bin/configure.sh -------------------------------------------------------------------------------- /bin/configure_as.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/bin/configure_as.sh -------------------------------------------------------------------------------- /bin/controller.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/bin/controller.sh -------------------------------------------------------------------------------- /bin/create_cluster.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/bin/create_cluster.sh -------------------------------------------------------------------------------- /bin/delete_cluster.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/bin/delete_cluster.sh -------------------------------------------------------------------------------- /bin/find_reachable_hosts.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/bin/find_reachable_hosts.sh -------------------------------------------------------------------------------- /bin/initial_monitoring.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/bin/initial_monitoring.sh -------------------------------------------------------------------------------- /bin/rdma_metrics_collection_config.conf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/bin/rdma_metrics_collection_config.conf -------------------------------------------------------------------------------- /bin/remove_nodes_prompt.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/bin/remove_nodes_prompt.txt -------------------------------------------------------------------------------- /bin/resize.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/bin/resize.sh -------------------------------------------------------------------------------- /bin/resize/ociobj.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/bin/resize/ociobj.py -------------------------------------------------------------------------------- /bin/resize/reconfigure.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/bin/resize/reconfigure.py -------------------------------------------------------------------------------- /bin/resize/resize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/bin/resize/resize.py -------------------------------------------------------------------------------- /bin/resize/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/bin/resize/utils.py -------------------------------------------------------------------------------- /bin/slurm_config.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/bin/slurm_config.sh -------------------------------------------------------------------------------- /bin/upload_rdma_nic_metrics.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/bin/upload_rdma_nic_metrics.sh -------------------------------------------------------------------------------- /bin/wait_for_hosts.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/bin/wait_for_hosts.sh -------------------------------------------------------------------------------- /cluster-network-configuration.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/cluster-network-configuration.tf -------------------------------------------------------------------------------- /cluster-network.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/cluster-network.tf -------------------------------------------------------------------------------- /compute-cluster.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/compute-cluster.tf -------------------------------------------------------------------------------- /compute-nodes.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/compute-nodes.tf -------------------------------------------------------------------------------- /conf/queues.conf.example: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/conf/queues.conf.example -------------------------------------------------------------------------------- /conf/variables.tpl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/conf/variables.tpl -------------------------------------------------------------------------------- /config.controller: -------------------------------------------------------------------------------- 1 | #cloud-config 2 | -------------------------------------------------------------------------------- /config.hpc: -------------------------------------------------------------------------------- 1 | #cloud-config 2 | -------------------------------------------------------------------------------- /configure.tpl: -------------------------------------------------------------------------------- 1 | ${configure} -------------------------------------------------------------------------------- /controller.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/controller.tf -------------------------------------------------------------------------------- /data.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/data.tf -------------------------------------------------------------------------------- /fss.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/fss.tf -------------------------------------------------------------------------------- /initial_mon.tpl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/initial_mon.tpl -------------------------------------------------------------------------------- /instance-pool-configuration.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/instance-pool-configuration.tf -------------------------------------------------------------------------------- /instance-pool.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/instance-pool.tf -------------------------------------------------------------------------------- /inventory.tpl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/inventory.tpl -------------------------------------------------------------------------------- /locals.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/locals.tf -------------------------------------------------------------------------------- /login.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/login.tf -------------------------------------------------------------------------------- /logs/README: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/logs/README -------------------------------------------------------------------------------- /lustre.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/lustre.tf -------------------------------------------------------------------------------- /marketplace.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/marketplace.tf -------------------------------------------------------------------------------- /monitoring.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/monitoring.tf -------------------------------------------------------------------------------- /mysql.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/mysql.tf -------------------------------------------------------------------------------- /network.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/network.tf -------------------------------------------------------------------------------- /oci_images.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/oci_images.tf -------------------------------------------------------------------------------- /outputs.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/outputs.tf -------------------------------------------------------------------------------- /playbooks/destroy.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/destroy.yml -------------------------------------------------------------------------------- /playbooks/group_vars/all.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/group_vars/all.yml -------------------------------------------------------------------------------- /playbooks/monitoring.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/monitoring.yml -------------------------------------------------------------------------------- /playbooks/new_nodes.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/new_nodes.yml -------------------------------------------------------------------------------- /playbooks/resize_add.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/resize_add.yml -------------------------------------------------------------------------------- /playbooks/resize_remove.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/resize_remove.yml -------------------------------------------------------------------------------- /playbooks/resize_remove_unreachable.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/resize_remove_unreachable.yml -------------------------------------------------------------------------------- /playbooks/roles/autoscaling_mon/defaults/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/autoscaling_mon/defaults/main.yml -------------------------------------------------------------------------------- /playbooks/roles/autoscaling_mon/files/dashboard.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/autoscaling_mon/files/dashboard.json -------------------------------------------------------------------------------- /playbooks/roles/autoscaling_mon/files/initial.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/autoscaling_mon/files/initial.sh -------------------------------------------------------------------------------- /playbooks/roles/autoscaling_mon/files/initial.sql: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/autoscaling_mon/files/initial.sql -------------------------------------------------------------------------------- /playbooks/roles/autoscaling_mon/files/monitor_oci.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/autoscaling_mon/files/monitor_oci.sh -------------------------------------------------------------------------------- /playbooks/roles/autoscaling_mon/files/monitor_slurm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/autoscaling_mon/files/monitor_slurm.sh -------------------------------------------------------------------------------- /playbooks/roles/autoscaling_mon/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/autoscaling_mon/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/autoscaling_mon/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/autoscaling_mon/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/autoscaling_mon/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/autoscaling_mon/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/autoscaling_mon/templates/env.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/autoscaling_mon/templates/env.j2 -------------------------------------------------------------------------------- /playbooks/roles/autoscaling_mon/templates/mysql_service_initial.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/autoscaling_mon/templates/mysql_service_initial.j2 -------------------------------------------------------------------------------- /playbooks/roles/boot-volume/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/boot-volume/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/boot-volume/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/boot-volume/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/boot-volume/tasks/ubuntu.yml: -------------------------------------------------------------------------------- 1 | # no extra steps required for ubuntu. 2 | -------------------------------------------------------------------------------- /playbooks/roles/cloud-agent_update/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/cloud-agent_update/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/cloud-agent_update/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/cloud-agent_update/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/cloud-agent_update/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/cloud-agent_update/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/cluster-cli/files/cluster: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/cluster-cli/files/cluster -------------------------------------------------------------------------------- /playbooks/roles/cluster-cli/tasks/debian.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/cluster-cli/tasks/debian.yml -------------------------------------------------------------------------------- /playbooks/roles/cluster-cli/tasks/el7.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/cluster-cli/tasks/el7.yml -------------------------------------------------------------------------------- /playbooks/roles/cluster-cli/tasks/el8.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/cluster-cli/tasks/el8.yml -------------------------------------------------------------------------------- /playbooks/roles/cluster-cli/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/cluster-cli/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/cron/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/cron/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/cron/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/cron/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/cron/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/cron/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/destroy_unreachable/tasks/common.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/destroy_unreachable/tasks/common.yml -------------------------------------------------------------------------------- /playbooks/roles/destroy_unreachable/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/destroy_unreachable/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/destroy_unreachable/tasks/slurm-rack-aware.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/destroy_unreachable/tasks/slurm-rack-aware.yml -------------------------------------------------------------------------------- /playbooks/roles/destroy_unreachable/tasks/slurm.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/destroy_unreachable/tasks/slurm.yml -------------------------------------------------------------------------------- /playbooks/roles/disable_core_dumps/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/disable_core_dumps/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/docker/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/docker/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/docker/tasks/oraclelinux.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/docker/tasks/oraclelinux.yml -------------------------------------------------------------------------------- /playbooks/roles/docker/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/docker/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/docker/templates/templates.j2: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /playbooks/roles/etc-hosts/tasks/common.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/etc-hosts/tasks/common.yml -------------------------------------------------------------------------------- /playbooks/roles/etc-hosts/tasks/main.yml: -------------------------------------------------------------------------------- 1 | - include_tasks: common.yml 2 | -------------------------------------------------------------------------------- /playbooks/roles/etc-hosts/templates/etc-hosts-controller.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/etc-hosts/templates/etc-hosts-controller.j2 -------------------------------------------------------------------------------- /playbooks/roles/etc-hosts/templates/etc-hosts.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/etc-hosts/templates/etc-hosts.j2 -------------------------------------------------------------------------------- /playbooks/roles/firewall/files/off-iptables.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/firewall/files/off-iptables.sh -------------------------------------------------------------------------------- /playbooks/roles/firewall/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/firewall/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/firewall/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/firewall/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/firewall/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/firewall/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/fix_broken/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/fix_broken/README.md -------------------------------------------------------------------------------- /playbooks/roles/fix_broken/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/fix_broken/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/fix_broken/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/fix_broken/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/fix_ldap/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/fix_ldap/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/fix_ldap/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/fix_ldap/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/fss-home/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/fss-home/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/fss-home/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/fss-home/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/fss-home/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/fss-home/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/grafana/defaults/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/defaults/main.yml -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/alert-rules.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/alert-rules.yaml -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/cluster-dashboard.jsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/cluster-dashboard.jsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/cluster-level-variables.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/cluster-level-variables.libsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/cluster-level.jsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/cluster-level.jsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/cluster-variables.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/cluster-variables.libsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/cluster.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/cluster.json -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/cluster_amd.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/cluster_amd.json -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/cluster_prometheus.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/cluster_prometheus.json -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/cluster_prometheus_v2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/cluster_prometheus_v2.json -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/command-center-variables.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/command-center-variables.libsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/command-center.jsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/command-center.jsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/delete-rules.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/delete-rules.yaml -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/g.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/g.libsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/gauge-panel-util.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/gauge-panel-util.libsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/gauge-panel.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/gauge-panel.libsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/gpu-health.jsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/gpu-health.jsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/gpu-metrics-single-variables.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/gpu-metrics-single-variables.libsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/gpu-metrics-single.jsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/gpu-metrics-single.jsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/host-metrics-single-variables.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/host-metrics-single-variables.libsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/host-metrics-single.jsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/host-metrics-single.jsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/main.jsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/main.jsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/multi-node-variables.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/multi-node-variables.libsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/multi-node.jsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/multi-node.jsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/nccl-traces.jsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/nccl-traces.jsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/node_exporter.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/node_exporter.json -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/oci-dashboard.jsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/oci-dashboard.jsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/oci-variables.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/oci-variables.libsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/raw_message_template.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/raw_message_template.txt -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/rdma-hw-counters.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/rdma-hw-counters.json -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/slurm-dashboard.jsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/slurm-dashboard.jsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/slurm-variables.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/slurm-variables.libsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/stat-health-panel.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/stat-health-panel.libsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/stat-panel-single.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/stat-panel-single.libsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/stat-panel.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/stat-panel.libsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/statetimeline-panel.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/statetimeline-panel.libsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/storage-metrics-variables.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/storage-metrics-variables.libsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/storage-metrics.jsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/storage-metrics.jsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/table-panel.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/table-panel.libsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/timeseries-panel.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/timeseries-panel.libsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/files/variables.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/files/variables.libsonnet -------------------------------------------------------------------------------- /playbooks/roles/grafana/tasks/dashboard.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/tasks/dashboard.yml -------------------------------------------------------------------------------- /playbooks/roles/grafana/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/grafana/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/grafana/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/grafana/templates/ons-webhook.service.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/templates/ons-webhook.service.j2 -------------------------------------------------------------------------------- /playbooks/roles/grafana/templates/ons_webhook.py.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/grafana/templates/ons_webhook.py.j2 -------------------------------------------------------------------------------- /playbooks/roles/healthchecks/defaults/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/healthchecks/defaults/main.yml -------------------------------------------------------------------------------- /playbooks/roles/healthchecks/files/check_gpu_setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/healthchecks/files/check_gpu_setup.py -------------------------------------------------------------------------------- /playbooks/roles/healthchecks/files/gpu_bw_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/healthchecks/files/gpu_bw_test.py -------------------------------------------------------------------------------- /playbooks/roles/healthchecks/files/meshpinger_readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/healthchecks/files/meshpinger_readme.md -------------------------------------------------------------------------------- /playbooks/roles/healthchecks/files/rdma_link_flapping.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/healthchecks/files/rdma_link_flapping.py -------------------------------------------------------------------------------- /playbooks/roles/healthchecks/files/run_meshpinger.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/healthchecks/files/run_meshpinger.sh -------------------------------------------------------------------------------- /playbooks/roles/healthchecks/files/shared_logging.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/healthchecks/files/shared_logging.py -------------------------------------------------------------------------------- /playbooks/roles/healthchecks/files/xid_checker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/healthchecks/files/xid_checker.py -------------------------------------------------------------------------------- /playbooks/roles/healthchecks/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/healthchecks/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/home_nfs/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/home_nfs/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/home_nfs/tasks/main.yml: -------------------------------------------------------------------------------- 1 | - include_tasks: el.yml 2 | when: ansible_os_family == 'RedHat' 3 | -------------------------------------------------------------------------------- /playbooks/roles/hostname/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/hostname/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/hostname/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/hostname/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/hostname/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/hostname/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/hyperthreading/files/control_hyperthreading.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/hyperthreading/files/control_hyperthreading.sh -------------------------------------------------------------------------------- /playbooks/roles/hyperthreading/files/control_hyperthreading_ubuntu.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/hyperthreading/files/control_hyperthreading_ubuntu.sh -------------------------------------------------------------------------------- /playbooks/roles/hyperthreading/files/disable-hyperthreading.service: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/hyperthreading/files/disable-hyperthreading.service -------------------------------------------------------------------------------- /playbooks/roles/hyperthreading/files/disable-hyperthreading_ubuntu.service: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/hyperthreading/files/disable-hyperthreading_ubuntu.service -------------------------------------------------------------------------------- /playbooks/roles/hyperthreading/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/hyperthreading/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/hyperthreading/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/hyperthreading/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/hyperthreading/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/hyperthreading/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/influxdb/defaults/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/influxdb/defaults/main.yml -------------------------------------------------------------------------------- /playbooks/roles/influxdb/handlers/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/influxdb/handlers/main.yml -------------------------------------------------------------------------------- /playbooks/roles/influxdb/tasks/config_influxdb.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/influxdb/tasks/config_influxdb.yml -------------------------------------------------------------------------------- /playbooks/roles/influxdb/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/influxdb/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/influxdb/tasks/el_install_influxdb.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/influxdb/tasks/el_install_influxdb.yml -------------------------------------------------------------------------------- /playbooks/roles/influxdb/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/influxdb/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/influxdb/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/influxdb/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/influxdb/tasks/ubuntu_install_influxdb.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/influxdb/tasks/ubuntu_install_influxdb.yml -------------------------------------------------------------------------------- /playbooks/roles/influxdb/templates/influxdb.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/influxdb/templates/influxdb.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/iscsi/tasks/debian.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/iscsi/tasks/debian.yml -------------------------------------------------------------------------------- /playbooks/roles/iscsi/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/iscsi/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/iscsi/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/iscsi/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/iscsi/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/iscsi/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/latency_check/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/latency_check/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/latency_check/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/latency_check/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/latency_check/templates/latency_check.sh.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/latency_check/templates/latency_check.sh.j2 -------------------------------------------------------------------------------- /playbooks/roles/limits/tasks/common.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/limits/tasks/common.yml -------------------------------------------------------------------------------- /playbooks/roles/limits/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/limits/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/limits/templates/limits.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/limits/templates/limits.j2 -------------------------------------------------------------------------------- /playbooks/roles/localdisk/defaults/main.yml: -------------------------------------------------------------------------------- 1 | nvme_path: "/scratch" 2 | -------------------------------------------------------------------------------- /playbooks/roles/localdisk/tasks/common.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/localdisk/tasks/common.yml -------------------------------------------------------------------------------- /playbooks/roles/localdisk/tasks/debian.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/localdisk/tasks/debian.yml -------------------------------------------------------------------------------- /playbooks/roles/localdisk/tasks/main.yml: -------------------------------------------------------------------------------- 1 | - include_tasks: common.yml 2 | -------------------------------------------------------------------------------- /playbooks/roles/localdisk/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/localdisk/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/lustre-client/defaults/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/lustre-client/defaults/main.yml -------------------------------------------------------------------------------- /playbooks/roles/lustre-client/files/install_lustre_ubuntu.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/lustre-client/files/install_lustre_ubuntu.sh -------------------------------------------------------------------------------- /playbooks/roles/lustre-client/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/lustre-client/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/lustre-client/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/lustre-client/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/lustre-client/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/lustre-client/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/defaults/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/defaults/main.yml -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/files/custom_metric_common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/files/custom_metric_common.py -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/files/dcgm-counters.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/files/dcgm-counters.csv -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/files/nccl_profiler_exporter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/files/nccl_profiler_exporter.py -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/files/node_exporter.service: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/files/node_exporter.service -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/files/nvidia-allow-prof.conf: -------------------------------------------------------------------------------- 1 | options nvidia NVreg_RestrictProfilingToAdminUsers=0 2 | -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/files/nvlink_counters_exporter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/files/nvlink_counters_exporter.py -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/files/nvml_metrics_exporter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/files/nvml_metrics_exporter.py -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/files/pcie_faults_exporter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/files/pcie_faults_exporter.py -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/files/rdma_counters_exporter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/files/rdma_counters_exporter.py -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/files/rdma_link_flapping.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/files/rdma_link_flapping.py -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/files/shared_logging.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/files/shared_logging.py -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/files/xid_checker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/files/xid_checker.py -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/tasks/custom_metrics.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/tasks/custom_metrics.yml -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/tasks/dcgm_exporter.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/tasks/dcgm_exporter.yml -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/tasks/nccl_profiler.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/tasks/nccl_profiler.yml -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/tasks/node_exporter_el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/tasks/node_exporter_el.yml -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/tasks/node_exporter_ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/tasks/node_exporter_ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/tasks/nvlink_exporter.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/tasks/nvlink_exporter.yml -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/tasks/nvml_exporter.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/tasks/nvml_exporter.yml -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/tasks/pcie_faults.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/tasks/pcie_faults.yml -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/tasks/rdma_exporter.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/tasks/rdma_exporter.yml -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/templates/customMetrics.service.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/templates/customMetrics.service.j2 -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/templates/custom_metrics.py.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/templates/custom_metrics.py.j2 -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/templates/dcgm-exporter.service.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/templates/dcgm-exporter.service.j2 -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/templates/nccl-profiler-exporter.service.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/templates/nccl-profiler-exporter.service.j2 -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/templates/nvlink-exporter.service.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/templates/nvlink-exporter.service.j2 -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/templates/nvml-exporter.service.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/templates/nvml-exporter.service.j2 -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/templates/pcie-faults-exporter.service.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/templates/pcie-faults-exporter.service.j2 -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/templates/prometheus.yml.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/templates/prometheus.yml.j2 -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/templates/rdma-exporter.service.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/templates/rdma-exporter.service.j2 -------------------------------------------------------------------------------- /playbooks/roles/metrics-exporter/vars/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/metrics-exporter/vars/main.yml -------------------------------------------------------------------------------- /playbooks/roles/mpi-hostfiles/tasks/common.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/mpi-hostfiles/tasks/common.yml -------------------------------------------------------------------------------- /playbooks/roles/mpi-hostfiles/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/mpi-hostfiles/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/mpi-hostfiles/templates/hostfile_rdma.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/mpi-hostfiles/templates/hostfile_rdma.j2 -------------------------------------------------------------------------------- /playbooks/roles/mpi-hostfiles/templates/hostfile_tcp.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/mpi-hostfiles/templates/hostfile_tcp.j2 -------------------------------------------------------------------------------- /playbooks/roles/mpivars/defaults/main.yml: -------------------------------------------------------------------------------- 1 | --- 2 | # defaults file for mpivars 3 | -------------------------------------------------------------------------------- /playbooks/roles/mpivars/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/mpivars/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/mpivars/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/mpivars/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/mpivars/templates/mpivars.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/mpivars/templates/mpivars.j2 -------------------------------------------------------------------------------- /playbooks/roles/mpivars/vars/main.yml: -------------------------------------------------------------------------------- 1 | --- 2 | # vars file for mpivars -------------------------------------------------------------------------------- /playbooks/roles/multiple-mount-target/defaults/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/multiple-mount-target/defaults/main.yml -------------------------------------------------------------------------------- /playbooks/roles/multiple-mount-target/files/mmt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/multiple-mount-target/files/mmt.py -------------------------------------------------------------------------------- /playbooks/roles/multiple-mount-target/tasks/debian.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/multiple-mount-target/tasks/debian.yml -------------------------------------------------------------------------------- /playbooks/roles/multiple-mount-target/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/multiple-mount-target/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/multiple-mount-target/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/multiple-mount-target/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/multiple-mount-target/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/multiple-mount-target/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/mysql/files/innodb.cnf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/mysql/files/innodb.cnf -------------------------------------------------------------------------------- /playbooks/roles/mysql/handlers/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/mysql/handlers/main.yml -------------------------------------------------------------------------------- /playbooks/roles/mysql/tasks/centos.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/mysql/tasks/centos.yml -------------------------------------------------------------------------------- /playbooks/roles/mysql/tasks/debian.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/mysql/tasks/debian.yml -------------------------------------------------------------------------------- /playbooks/roles/mysql/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/mysql/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/mysql/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/mysql/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/mysql/templates/debian_mariadb_etc_my.cnf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/mysql/templates/debian_mariadb_etc_my.cnf.j2 -------------------------------------------------------------------------------- /playbooks/roles/mysql/templates/debian_my.cnf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/mysql/templates/debian_my.cnf.j2 -------------------------------------------------------------------------------- /playbooks/roles/mysql/templates/mariadb_etc_my.cnf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/mysql/templates/mariadb_etc_my.cnf.j2 -------------------------------------------------------------------------------- /playbooks/roles/mysql/templates/my.cnf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/mysql/templates/my.cnf.j2 -------------------------------------------------------------------------------- /playbooks/roles/mysql/templates/mysqld_etc_my.cnf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/mysql/templates/mysqld_etc_my.cnf.j2 -------------------------------------------------------------------------------- /playbooks/roles/mysql/vars/ol_vars.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/mysql/vars/ol_vars.yml -------------------------------------------------------------------------------- /playbooks/roles/mysql/vars/ubuntu-2204_vars.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/mysql/vars/ubuntu-2204_vars.yml -------------------------------------------------------------------------------- /playbooks/roles/mysql/vars/ubuntu_vars.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/mysql/vars/ubuntu_vars.yml -------------------------------------------------------------------------------- /playbooks/roles/nccl-conf/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nccl-conf/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/nccl-conf/templates/a100_b4.8: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nccl-conf/templates/a100_b4.8 -------------------------------------------------------------------------------- /playbooks/roles/nccl-conf/templates/b200: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nccl-conf/templates/b200 -------------------------------------------------------------------------------- /playbooks/roles/nccl-conf/templates/bm.gpu4.8: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nccl-conf/templates/bm.gpu4.8 -------------------------------------------------------------------------------- /playbooks/roles/nccl-conf/templates/h100: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nccl-conf/templates/h100 -------------------------------------------------------------------------------- /playbooks/roles/nccl-conf/templates/h200: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nccl-conf/templates/h200 -------------------------------------------------------------------------------- /playbooks/roles/nfs-client/defaults/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nfs-client/defaults/main.yml -------------------------------------------------------------------------------- /playbooks/roles/nfs-client/meta/main.yml: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /playbooks/roles/nfs-client/tasks/debian.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nfs-client/tasks/debian.yml -------------------------------------------------------------------------------- /playbooks/roles/nfs-client/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nfs-client/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/nfs-client/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nfs-client/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/nfs-client/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nfs-client/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/nfs-client/vars/main.yml: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /playbooks/roles/nfs-server/defaults/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nfs-server/defaults/main.yml -------------------------------------------------------------------------------- /playbooks/roles/nfs-server/handlers/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nfs-server/handlers/main.yml -------------------------------------------------------------------------------- /playbooks/roles/nfs-server/meta/main.yml: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /playbooks/roles/nfs-server/tasks/debian.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nfs-server/tasks/debian.yml -------------------------------------------------------------------------------- /playbooks/roles/nfs-server/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nfs-server/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/nfs-server/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nfs-server/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/nfs-server/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nfs-server/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/nfs-server/templates/exports.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nfs-server/templates/exports.j2 -------------------------------------------------------------------------------- /playbooks/roles/nfs-server/vars/main.yml: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /playbooks/roles/no_instance_principal/defaults/main.yml: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /playbooks/roles/no_instance_principal/meta/main.yml: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /playbooks/roles/no_instance_principal/tasks/common.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/no_instance_principal/tasks/common.yml -------------------------------------------------------------------------------- /playbooks/roles/no_instance_principal/tasks/main.yml: -------------------------------------------------------------------------------- 1 | - include_tasks: common.yml 2 | 3 | 4 | -------------------------------------------------------------------------------- /playbooks/roles/no_instance_principal/templates/config.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/no_instance_principal/templates/config.j2 -------------------------------------------------------------------------------- /playbooks/roles/no_instance_principal/vars/main.yml: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /playbooks/roles/nvidia-container/defaults/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nvidia-container/defaults/main.yml -------------------------------------------------------------------------------- /playbooks/roles/nvidia-container/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nvidia-container/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/nvidia-container/tasks/oraclelinux-7.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nvidia-container/tasks/oraclelinux-7.yml -------------------------------------------------------------------------------- /playbooks/roles/nvidia-container/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nvidia-container/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/nvidia-container/templates/templates.j2: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /playbooks/roles/nvidia-container/vars/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nvidia-container/vars/main.yml -------------------------------------------------------------------------------- /playbooks/roles/nvidia-enroot/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nvidia-enroot/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/nvidia-enroot/tasks/oraclelinux.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nvidia-enroot/tasks/oraclelinux.yml -------------------------------------------------------------------------------- /playbooks/roles/nvidia-enroot/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nvidia-enroot/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/nvidia_peermem/defaults/main.yml: -------------------------------------------------------------------------------- 1 | --- 2 | # defaults file for nvidia_peermem 3 | -------------------------------------------------------------------------------- /playbooks/roles/nvidia_peermem/tasks/common.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nvidia_peermem/tasks/common.yml -------------------------------------------------------------------------------- /playbooks/roles/nvidia_peermem/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/nvidia_peermem/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/nvidia_peermem/vars/main.yml: -------------------------------------------------------------------------------- 1 | --- 2 | # vars file for nvidia_peermem 3 | -------------------------------------------------------------------------------- /playbooks/roles/oci-cloud-agent-updater/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oci-cloud-agent-updater/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/oci-cloud-agent-updater/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oci-cloud-agent-updater/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/oci-cloud-agent-updater/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oci-cloud-agent-updater/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/oci-cloud-agent/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oci-cloud-agent/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/oci-cloud-agent/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oci-cloud-agent/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/oci-cloud-agent/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oci-cloud-agent/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/oci-cn-auth/defaults/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oci-cn-auth/defaults/main.yml -------------------------------------------------------------------------------- /playbooks/roles/oci-cn-auth/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oci-cn-auth/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/oci-cn-auth/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oci-cn-auth/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/oci-cn-auth/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oci-cn-auth/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/oci-hostname/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oci-hostname/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/oci-hostname/tasks/main.yml: -------------------------------------------------------------------------------- 1 | - include_tasks: el.yml 2 | when: ansible_os_family == 'RedHat' 3 | -------------------------------------------------------------------------------- /playbooks/roles/oci-legacy/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oci-legacy/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/oci-legacy/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oci-legacy/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/oci-legacy/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oci-legacy/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/oci-metrics/files/oci-fss-metrics-exporter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oci-metrics/files/oci-fss-metrics-exporter.py -------------------------------------------------------------------------------- /playbooks/roles/oci-metrics/files/oci-lustre-metrics-exporter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oci-metrics/files/oci-lustre-metrics-exporter.py -------------------------------------------------------------------------------- /playbooks/roles/oci-metrics/files/oci-rdma-faults-exporter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oci-metrics/files/oci-rdma-faults-exporter.py -------------------------------------------------------------------------------- /playbooks/roles/oci-metrics/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oci-metrics/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/oci-metrics/templates/oci-fss-exporter.service.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oci-metrics/templates/oci-fss-exporter.service.j2 -------------------------------------------------------------------------------- /playbooks/roles/oci-metrics/templates/oci-lustre-exporter.service.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oci-metrics/templates/oci-lustre-exporter.service.j2 -------------------------------------------------------------------------------- /playbooks/roles/oci-metrics/templates/oci-rdma-faults-exporter.service.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oci-metrics/templates/oci-rdma-faults-exporter.service.j2 -------------------------------------------------------------------------------- /playbooks/roles/oom-adjust/defaults/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oom-adjust/defaults/main.yml -------------------------------------------------------------------------------- /playbooks/roles/oom-adjust/files/oom-adjust.conf: -------------------------------------------------------------------------------- 1 | [Service] 2 | OOMScoreAdjust=-500 3 | 4 | -------------------------------------------------------------------------------- /playbooks/roles/oom-adjust/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/oom-adjust/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/openldap/defaults/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/openldap/defaults/main.yml -------------------------------------------------------------------------------- /playbooks/roles/openldap/files/autoinc.ldif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/openldap/files/autoinc.ldif -------------------------------------------------------------------------------- /playbooks/roles/openldap/files/debian_memberof.ldif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/openldap/files/debian_memberof.ldif -------------------------------------------------------------------------------- /playbooks/roles/openldap/files/debian_ppolicy.ldif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/openldap/files/debian_ppolicy.ldif -------------------------------------------------------------------------------- /playbooks/roles/openldap/files/el_memberof.ldif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/openldap/files/el_memberof.ldif -------------------------------------------------------------------------------- /playbooks/roles/openldap/files/el_memberof_ol8.ldif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/openldap/files/el_memberof_ol8.ldif -------------------------------------------------------------------------------- /playbooks/roles/openldap/files/el_ppolicy.ldif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/openldap/files/el_ppolicy.ldif -------------------------------------------------------------------------------- /playbooks/roles/openldap/files/el_ppolicy_ol8.ldif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/openldap/files/el_ppolicy_ol8.ldif -------------------------------------------------------------------------------- /playbooks/roles/openldap/files/local_schema.ldif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/openldap/files/local_schema.ldif -------------------------------------------------------------------------------- /playbooks/roles/openldap/files/rfc2307bis.ldif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/openldap/files/rfc2307bis.ldif -------------------------------------------------------------------------------- /playbooks/roles/openldap/files/slapd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/openldap/files/slapd -------------------------------------------------------------------------------- /playbooks/roles/openldap/handlers/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/openldap/handlers/main.yml -------------------------------------------------------------------------------- /playbooks/roles/openldap/meta/main.yml: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /playbooks/roles/openldap/tasks/debian.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/openldap/tasks/debian.yml -------------------------------------------------------------------------------- /playbooks/roles/openldap/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/openldap/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/openldap/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/openldap/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/openldap/templates/config.ldif.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/openldap/templates/config.ldif.j2 -------------------------------------------------------------------------------- /playbooks/roles/openldap/templates/debian_local.ldif.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/openldap/templates/debian_local.ldif.j2 -------------------------------------------------------------------------------- /playbooks/roles/openldap/templates/el_local.ldif.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/openldap/templates/el_local.ldif.j2 -------------------------------------------------------------------------------- /playbooks/roles/openldap/templates/el_local_ol8.ldif.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/openldap/templates/el_local_ol8.ldif.j2 -------------------------------------------------------------------------------- /playbooks/roles/openldap/vars/debian_vars.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/openldap/vars/debian_vars.yml -------------------------------------------------------------------------------- /playbooks/roles/openldap/vars/el_vars.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/openldap/vars/el_vars.yml -------------------------------------------------------------------------------- /playbooks/roles/packages/tasks/centos-7.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/packages/tasks/centos-7.yml -------------------------------------------------------------------------------- /playbooks/roles/packages/tasks/debian.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/packages/tasks/debian.yml -------------------------------------------------------------------------------- /playbooks/roles/packages/tasks/el-7.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/packages/tasks/el-7.yml -------------------------------------------------------------------------------- /playbooks/roles/packages/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/packages/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/packages/tasks/ol-7.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/packages/tasks/ol-7.yml -------------------------------------------------------------------------------- /playbooks/roles/packages/tasks/ol-8.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/packages/tasks/ol-8.yml -------------------------------------------------------------------------------- /playbooks/roles/packages/tasks/ubuntu-2204.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/packages/tasks/ubuntu-2204.yml -------------------------------------------------------------------------------- /playbooks/roles/packages/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/packages/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/passwords/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/passwords/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/privilege_group/tasks/common.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/privilege_group/tasks/common.yml -------------------------------------------------------------------------------- /playbooks/roles/privilege_group/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/privilege_group/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/privilege_group/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/privilege_group/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/prometheus/defaults/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/prometheus/defaults/main.yml -------------------------------------------------------------------------------- /playbooks/roles/prometheus/files/recording_rules.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/prometheus/files/recording_rules.yml -------------------------------------------------------------------------------- /playbooks/roles/prometheus/tasks/cleanup_targets.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/prometheus/tasks/cleanup_targets.yml -------------------------------------------------------------------------------- /playbooks/roles/prometheus/tasks/create_target.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/prometheus/tasks/create_target.yml -------------------------------------------------------------------------------- /playbooks/roles/prometheus/tasks/gather_info.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/prometheus/tasks/gather_info.yml -------------------------------------------------------------------------------- /playbooks/roles/prometheus/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/prometheus/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/prometheus/tasks/setup_prometheus.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/prometheus/tasks/setup_prometheus.yml -------------------------------------------------------------------------------- /playbooks/roles/prometheus/templates/prometheus.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/prometheus/templates/prometheus.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/prometheus/templates/prometheus.service.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/prometheus/templates/prometheus.service.j2 -------------------------------------------------------------------------------- /playbooks/roles/prometheus/templates/prometheus.yml.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/prometheus/templates/prometheus.yml.j2 -------------------------------------------------------------------------------- /playbooks/roles/prometheus/templates/prometheus_target.json.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/prometheus/templates/prometheus_target.json.j2 -------------------------------------------------------------------------------- /playbooks/roles/rack-aware/files/node_ordering_by_rack.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/rack-aware/files/node_ordering_by_rack.py -------------------------------------------------------------------------------- /playbooks/roles/rack-aware/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/rack-aware/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/rack-aware/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/rack-aware/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/rack-aware/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/rack-aware/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/rdma-interface/defaults/main.yml: -------------------------------------------------------------------------------- 1 | pci_id: '0000:5e:00.0' 2 | -------------------------------------------------------------------------------- /playbooks/roles/rdma-interface/handlers/main.yml: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /playbooks/roles/rdma-interface/tasks/debian.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/rdma-interface/tasks/debian.yml -------------------------------------------------------------------------------- /playbooks/roles/rdma-interface/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/rdma-interface/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/rdma-interface/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/rdma-interface/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/rdma-interface/templates/ifcfg.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/rdma-interface/templates/ifcfg.j2 -------------------------------------------------------------------------------- /playbooks/roles/rdma-interface/templates/interface.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/rdma-interface/templates/interface.j2 -------------------------------------------------------------------------------- /playbooks/roles/rdma-interface/vars/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/rdma-interface/vars/main.yml -------------------------------------------------------------------------------- /playbooks/roles/rttcc/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/rttcc/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/safe_yum/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/safe_yum/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/safe_yum/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/safe_yum/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/safe_yum/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/safe_yum/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/defaults/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/defaults/main.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/files/cgroup.conf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/files/cgroup.conf -------------------------------------------------------------------------------- /playbooks/roles/slurm/files/healthchecks.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/files/healthchecks.sh -------------------------------------------------------------------------------- /playbooks/roles/slurm/files/sshd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/files/sshd -------------------------------------------------------------------------------- /playbooks/roles/slurm/handlers/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/handlers/main.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/tasks/backup_server.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/tasks/backup_server.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/tasks/cleanup.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/tasks/cleanup.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/tasks/common.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/tasks/common.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/tasks/common_pmix.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/tasks/common_pmix.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/tasks/common_pyxis.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/tasks/common_pyxis.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/tasks/compute-rack-aware.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/tasks/compute-rack-aware.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/tasks/compute.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/tasks/compute.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/tasks/compute_pam.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/tasks/compute_pam.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/tasks/controller.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/tasks/controller.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/tasks/destroy-rack-aware.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/tasks/destroy-rack-aware.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/tasks/destroy.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/tasks/destroy.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/tasks/download.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/tasks/download.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/tasks/el7.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/tasks/el7.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/tasks/el8.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/tasks/el8.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/tasks/login.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/tasks/login.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/tasks/move-topology.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/tasks/move-topology.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/tasks/server.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/tasks/server.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/templates/gres.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/templates/gres.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/slurm/templates/pyxis.sh.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/templates/pyxis.sh.j2 -------------------------------------------------------------------------------- /playbooks/roles/slurm/templates/slurm.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/templates/slurm.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/slurm/templates/slurmdbd.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/templates/slurmdbd.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/slurm/templates/systemd/munge.service.d/unit.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/templates/systemd/munge.service.d/unit.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/slurm/templates/systemd/sackd.service.d/unit.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/templates/systemd/sackd.service.d/unit.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/slurm/templates/systemd/sackd.service.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/templates/systemd/sackd.service.j2 -------------------------------------------------------------------------------- /playbooks/roles/slurm/templates/systemd/slurm_env.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/templates/systemd/slurm_env.j2 -------------------------------------------------------------------------------- /playbooks/roles/slurm/templates/systemd/slurmctld.service.d/unit.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/templates/systemd/slurmctld.service.d/unit.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/slurm/templates/systemd/slurmctld.service.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/templates/systemd/slurmctld.service.j2 -------------------------------------------------------------------------------- /playbooks/roles/slurm/templates/systemd/slurmctld_backup.service.d/unit.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/templates/systemd/slurmctld_backup.service.d/unit.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/slurm/templates/systemd/slurmd.service.d/unit.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/templates/systemd/slurmd.service.d/unit.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/slurm/templates/systemd/slurmd.service.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/templates/systemd/slurmd.service.j2 -------------------------------------------------------------------------------- /playbooks/roles/slurm/templates/systemd/slurmdbd.service.d/unit.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/templates/systemd/slurmdbd.service.d/unit.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/slurm/templates/systemd/slurmdbd.service.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/templates/systemd/slurmdbd.service.j2 -------------------------------------------------------------------------------- /playbooks/roles/slurm/templates/topology.conf.j2: -------------------------------------------------------------------------------- 1 | ### Topology File -------------------------------------------------------------------------------- /playbooks/roles/slurm/vars/centos_vars.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/vars/centos_vars.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/vars/el_vars.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/vars/el_vars.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm/vars/ubuntu_vars.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm/vars/ubuntu_vars.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm_rest_api/defaults/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm_rest_api/defaults/main.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm_rest_api/handlers/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm_rest_api/handlers/main.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm_rest_api/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm_rest_api/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm_rest_api/tasks/slurm_exporter.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm_rest_api/tasks/slurm_exporter.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm_rest_api/tasks/slurm_restd.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm_rest_api/tasks/slurm_restd.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm_rest_api/tasks/slurm_sdk.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm_rest_api/tasks/slurm_sdk.yml -------------------------------------------------------------------------------- /playbooks/roles/slurm_rest_api/templates/slurm-exporter.py.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm_rest_api/templates/slurm-exporter.py.j2 -------------------------------------------------------------------------------- /playbooks/roles/slurm_rest_api/templates/slurm-exporter.service.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm_rest_api/templates/slurm-exporter.service.j2 -------------------------------------------------------------------------------- /playbooks/roles/slurm_rest_api/templates/slurmrestd.service.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/slurm_rest_api/templates/slurmrestd.service.j2 -------------------------------------------------------------------------------- /playbooks/roles/spack/defaults/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/spack/defaults/main.yml -------------------------------------------------------------------------------- /playbooks/roles/spack/tasks/debian.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/spack/tasks/debian.yml -------------------------------------------------------------------------------- /playbooks/roles/spack/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/spack/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/spack/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/spack/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/spack/templates/spack.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/spack/templates/spack.j2 -------------------------------------------------------------------------------- /playbooks/roles/ssh/files/ssh_config: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/ssh/files/ssh_config -------------------------------------------------------------------------------- /playbooks/roles/ssh/tasks/common.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/ssh/tasks/common.yml -------------------------------------------------------------------------------- /playbooks/roles/ssh/tasks/main.yml: -------------------------------------------------------------------------------- 1 | - include_tasks: common.yml 2 | -------------------------------------------------------------------------------- /playbooks/roles/ssl/defaults/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/ssl/defaults/main.yml -------------------------------------------------------------------------------- /playbooks/roles/ssl/tasks/debian.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/ssl/tasks/debian.yml -------------------------------------------------------------------------------- /playbooks/roles/ssl/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/ssl/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/ssl/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/ssl/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/ssl/templates/san.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/ssl/templates/san.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/sssd/handlers/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/sssd/handlers/main.yml -------------------------------------------------------------------------------- /playbooks/roles/sssd/tasks/debian.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/sssd/tasks/debian.yml -------------------------------------------------------------------------------- /playbooks/roles/sssd/tasks/el-7.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/sssd/tasks/el-7.yml -------------------------------------------------------------------------------- /playbooks/roles/sssd/tasks/el-8.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/sssd/tasks/el-8.yml -------------------------------------------------------------------------------- /playbooks/roles/sssd/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/sssd/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/sssd/templates/sssd.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/sssd/templates/sssd.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/sssd/templates/sssd_ubuntu.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/sssd/templates/sssd_ubuntu.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/sssd/vars/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/sssd/vars/main.yml -------------------------------------------------------------------------------- /playbooks/roles/telegraf/defaults/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/defaults/main.yml -------------------------------------------------------------------------------- /playbooks/roles/telegraf/files/telegraf.conf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/files/telegraf.conf -------------------------------------------------------------------------------- /playbooks/roles/telegraf/files/telegraf_amd_gpu.conf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/files/telegraf_amd_gpu.conf -------------------------------------------------------------------------------- /playbooks/roles/telegraf/files/telegraf_nvidia_gpu.conf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/files/telegraf_nvidia_gpu.conf -------------------------------------------------------------------------------- /playbooks/roles/telegraf/handlers/main.yml: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /playbooks/roles/telegraf/meta/main.yml: -------------------------------------------------------------------------------- 1 | --- 2 | -------------------------------------------------------------------------------- /playbooks/roles/telegraf/tasks/common.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/tasks/common.yml -------------------------------------------------------------------------------- /playbooks/roles/telegraf/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/amd_gpu.conf.j2: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/custom.cnf.j2: -------------------------------------------------------------------------------- 1 | [[inputs.exec]] 2 | commands = ["echo {}"] 3 | data_format = "json" -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/ethtool_counters.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/ethtool_counters.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/infiniband.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/infiniband.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/infiniband_mlx5_0_hw_counters.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/infiniband_mlx5_0_hw_counters.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/infiniband_mlx5_10_hw_counters.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/infiniband_mlx5_10_hw_counters.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/infiniband_mlx5_11_hw_counters.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/infiniband_mlx5_11_hw_counters.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/infiniband_mlx5_12_hw_counters.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/infiniband_mlx5_12_hw_counters.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/infiniband_mlx5_13_hw_counters.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/infiniband_mlx5_13_hw_counters.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/infiniband_mlx5_14_hw_counters.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/infiniband_mlx5_14_hw_counters.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/infiniband_mlx5_15_hw_counters.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/infiniband_mlx5_15_hw_counters.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/infiniband_mlx5_16_hw_counters.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/infiniband_mlx5_16_hw_counters.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/infiniband_mlx5_1_hw_counters.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/infiniband_mlx5_1_hw_counters.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/infiniband_mlx5_2_hw_counters.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/infiniband_mlx5_2_hw_counters.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/infiniband_mlx5_3_hw_counters.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/infiniband_mlx5_3_hw_counters.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/infiniband_mlx5_4_hw_counters.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/infiniband_mlx5_4_hw_counters.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/infiniband_mlx5_5_hw_counters.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/infiniband_mlx5_5_hw_counters.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/infiniband_mlx5_6_hw_counters.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/infiniband_mlx5_6_hw_counters.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/infiniband_mlx5_7_hw_counters.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/infiniband_mlx5_7_hw_counters.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/infiniband_mlx5_8_hw_counters.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/infiniband_mlx5_8_hw_counters.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/infiniband_mlx5_9_hw_counters.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/infiniband_mlx5_9_hw_counters.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/influxdb.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/influxdb.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/net.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/net.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/nvidia_gpu.conf.j2: -------------------------------------------------------------------------------- 1 | [[inputs.nvidia_smi]] -------------------------------------------------------------------------------- /playbooks/roles/telegraf/templates/prometheus.conf.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/telegraf/templates/prometheus.conf.j2 -------------------------------------------------------------------------------- /playbooks/roles/tuned/files/tuned.conf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/tuned/files/tuned.conf -------------------------------------------------------------------------------- /playbooks/roles/tuned/tasks/el-7.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/tuned/tasks/el-7.yml -------------------------------------------------------------------------------- /playbooks/roles/tuned/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/tuned/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/weka_client/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/weka_client/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/yaml/tasks/el.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/yaml/tasks/el.yml -------------------------------------------------------------------------------- /playbooks/roles/yaml/tasks/main.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/yaml/tasks/main.yml -------------------------------------------------------------------------------- /playbooks/roles/yaml/tasks/ubuntu.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/roles/yaml/tasks/ubuntu.yml -------------------------------------------------------------------------------- /playbooks/site.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/site.yml -------------------------------------------------------------------------------- /playbooks/slurm_config.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/slurm_config.yml -------------------------------------------------------------------------------- /playbooks/slurm_config_as.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/playbooks/slurm_config_as.yml -------------------------------------------------------------------------------- /provider.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/provider.tf -------------------------------------------------------------------------------- /queues.conf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/queues.conf -------------------------------------------------------------------------------- /samples/NCCL_readme: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/NCCL_readme -------------------------------------------------------------------------------- /samples/disable_ht.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/disable_ht.sh -------------------------------------------------------------------------------- /samples/gpu/H100-topology-kubernetes.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/H100-topology-kubernetes.xml -------------------------------------------------------------------------------- /samples/gpu/H100-topology.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/H100-topology.xml -------------------------------------------------------------------------------- /samples/gpu/ifdown.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/ifdown.sh -------------------------------------------------------------------------------- /samples/gpu/ifup.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/ifup.sh -------------------------------------------------------------------------------- /samples/gpu/nccl_run_allreduce.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/nccl_run_allreduce.sbatch -------------------------------------------------------------------------------- /samples/gpu/nccl_run_allreduce.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/nccl_run_allreduce.sh -------------------------------------------------------------------------------- /samples/gpu/nccl_run_allreduce_H100_200.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/nccl_run_allreduce_H100_200.sbatch -------------------------------------------------------------------------------- /samples/gpu/nccl_run_allreduce_H100_200.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/nccl_run_allreduce_H100_200.sh -------------------------------------------------------------------------------- /samples/gpu/nccl_run_allreduce_containers_H100_H200.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/nccl_run_allreduce_containers_H100_H200.sbatch -------------------------------------------------------------------------------- /samples/gpu/nccl_run_allreduce_containers_with_ordering.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/nccl_run_allreduce_containers_with_ordering.sbatch -------------------------------------------------------------------------------- /samples/gpu/nccl_run_allreduce_srun.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/nccl_run_allreduce_srun.sbatch -------------------------------------------------------------------------------- /samples/gpu/nccl_run_allreduce_srun.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/nccl_run_allreduce_srun.sh -------------------------------------------------------------------------------- /samples/gpu/nccl_run_allreduce_tuner.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/nccl_run_allreduce_tuner.sbatch -------------------------------------------------------------------------------- /samples/gpu/nccl_run_allreduce_tuner.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/nccl_run_allreduce_tuner.sh -------------------------------------------------------------------------------- /samples/gpu/nccl_run_alltoall.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/nccl_run_alltoall.sh -------------------------------------------------------------------------------- /samples/gpu/no_ncclparam_nccl_run_allreduce.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/no_ncclparam_nccl_run_allreduce.sbatch -------------------------------------------------------------------------------- /samples/gpu/no_ncclparam_nccl_run_allreduce.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/no_ncclparam_nccl_run_allreduce.sh -------------------------------------------------------------------------------- /samples/gpu/no_ncclparam_nccl_run_allreduce_H100_H200.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/no_ncclparam_nccl_run_allreduce_H100_H200.sbatch -------------------------------------------------------------------------------- /samples/gpu/no_ncclparam_nccl_run_allreduce_H100_H200.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/no_ncclparam_nccl_run_allreduce_H100_H200.sh -------------------------------------------------------------------------------- /samples/gpu/notes.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/notes.txt -------------------------------------------------------------------------------- /samples/gpu/ping.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/ping.sh -------------------------------------------------------------------------------- /samples/gpu/qfabv1_nccl_run_allreduce.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/qfabv1_nccl_run_allreduce.sbatch -------------------------------------------------------------------------------- /samples/gpu/qfabv1_nccl_run_allreduce.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/qfabv1_nccl_run_allreduce.sh -------------------------------------------------------------------------------- /samples/gpu/qfabv1_nccl_run_alltoall.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/qfabv1_nccl_run_alltoall.sh -------------------------------------------------------------------------------- /samples/gpu/rccl_run_allreduce.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/rccl_run_allreduce.sbatch -------------------------------------------------------------------------------- /samples/gpu/srun_examples_with_container.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/srun_examples_with_container.txt -------------------------------------------------------------------------------- /samples/gpu/topo-flattened-b4.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/topo-flattened-b4.xml -------------------------------------------------------------------------------- /samples/gpu/topo-flattened.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/topo-flattened.xml -------------------------------------------------------------------------------- /samples/gpu/update_arp_settings.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/update_arp_settings.sh -------------------------------------------------------------------------------- /samples/gpu/update_netmask.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/gpu/update_netmask.sh -------------------------------------------------------------------------------- /samples/nccl_compile/compile.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/nccl_compile/compile.sh -------------------------------------------------------------------------------- /samples/nfs/README.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/nfs/README.txt -------------------------------------------------------------------------------- /samples/nfs/fix_nfs.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/nfs/fix_nfs.sh -------------------------------------------------------------------------------- /samples/open-ldap/add-ldap-users.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/open-ldap/add-ldap-users.yml -------------------------------------------------------------------------------- /samples/open-ldap/add-linux-group.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/open-ldap/add-linux-group.yml -------------------------------------------------------------------------------- /samples/prep_sample_files.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/prep_sample_files.sh -------------------------------------------------------------------------------- /samples/rdma-tuning/check_pcie_max_read.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/rdma-tuning/check_pcie_max_read.sh -------------------------------------------------------------------------------- /samples/rdma-tuning/pcie_max_read.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/rdma-tuning/pcie_max_read.sh -------------------------------------------------------------------------------- /samples/rdma-tuning/pcie_max_read_default.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/rdma-tuning/pcie_max_read_default.sh -------------------------------------------------------------------------------- /samples/rdma-tuning/rdma-nic-tuning-1.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/rdma-tuning/rdma-nic-tuning-1.sh -------------------------------------------------------------------------------- /samples/rdma-tuning/rdma-nic-tuning-2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/rdma-tuning/rdma-nic-tuning-2.sh -------------------------------------------------------------------------------- /samples/rdma-tuning/rdma-nic-tuning-validate.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/rdma-tuning/rdma-nic-tuning-validate.sh -------------------------------------------------------------------------------- /samples/submit/sleep.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/submit/sleep.sbatch -------------------------------------------------------------------------------- /samples/submit/sleep_gpu.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/samples/submit/sleep_gpu.sbatch -------------------------------------------------------------------------------- /schema.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/schema.yaml -------------------------------------------------------------------------------- /scripts/check_firmware_version.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/scripts/check_firmware_version.sh -------------------------------------------------------------------------------- /scripts/collect_logs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/scripts/collect_logs.py -------------------------------------------------------------------------------- /scripts/collect_metadata/collect_metadata.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/scripts/collect_metadata/collect_metadata.py -------------------------------------------------------------------------------- /scripts/collect_metadata/requirements.txt: -------------------------------------------------------------------------------- 1 | paramiko 2 | -------------------------------------------------------------------------------- /scripts/create_instance_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/scripts/create_instance_config.py -------------------------------------------------------------------------------- /scripts/gpu_throttle.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/scripts/gpu_throttle.sh -------------------------------------------------------------------------------- /scripts/h100_script.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/scripts/h100_script.py -------------------------------------------------------------------------------- /scripts/ib_write_bw.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/scripts/ib_write_bw.sh -------------------------------------------------------------------------------- /scripts/ib_write_lat.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/scripts/ib_write_lat.sh -------------------------------------------------------------------------------- /scripts/max_nodes_partition.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/scripts/max_nodes_partition.py -------------------------------------------------------------------------------- /scripts/ncclscout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/scripts/ncclscout.py -------------------------------------------------------------------------------- /scripts/pcie.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/scripts/pcie.sh -------------------------------------------------------------------------------- /scripts/runNCCL_on_hostPair.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/scripts/runNCCL_on_hostPair.sh -------------------------------------------------------------------------------- /scripts/validation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/scripts/validation.py -------------------------------------------------------------------------------- /slurm_ha.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/slurm_ha.tf -------------------------------------------------------------------------------- /user_data.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/user_data.tf -------------------------------------------------------------------------------- /variables.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/variables.tf -------------------------------------------------------------------------------- /versions.tf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/oracle-quickstart/oci-hpc/HEAD/versions.tf --------------------------------------------------------------------------------