├── .gitignore ├── CHANGELOG.md ├── CODE_OF_CONDUCT.md ├── CONTRIBUTING.md ├── LICENSE ├── NOTICE.txt ├── README.md ├── docs ├── ExamplesCfnTemplates │ ├── Batch-Large-Scale.yaml │ ├── VPC-Large-Scale-singleAZ.yaml │ └── VPC-Large-Scale.yaml ├── architecture.drawio ├── architecture.png └── jobs_transitions.png ├── pyproject.toml ├── src ├── ASGMonitoring │ ├── __init__.py │ ├── app.py │ └── requirements.txt ├── BatchJobsStates │ ├── JobStatesStateMachineServerless.asl.json │ ├── JobStatesToCW │ │ ├── __init__.py │ │ ├── app.py │ │ └── requirements.txt │ └── ParseJobProperties │ │ ├── __init__.py │ │ ├── app.py │ │ └── requirements.txt ├── ECSInstancesRegistration │ ├── ECSInstancesRegistrationStateMachineServerless.asl.json │ └── MetricToCW │ │ ├── __init__.py │ │ ├── app.py │ │ └── requirements.txt └── ECSRunTask │ ├── ECSRunTaskStateMachineServerless.asl.json │ ├── ECSTaskEventsStateMachineServerless.asl.json │ └── RunTaskToCW │ ├── __init__.py │ ├── app.py │ └── requirements.txt ├── template.yaml ├── tests ├── BatchJobStatesTests │ ├── batch-job-state-change-events │ │ ├── batch-event-MNP-CHILD-NODE-FAILED.json │ │ ├── batch-event-MNP-CHILD-NODE.json │ │ ├── batch-event-MNP-MAIN-NODE.json │ │ ├── batch-event-RUNNABLE.json │ │ ├── batch-event-RUNNING.json │ │ ├── batch-event-STARTING.json │ │ └── batch-event-SUCCEEDED.json │ ├── run_tests.py │ ├── test_parse_job_attributes.py │ └── test_state_machine.py ├── README.md └── run_all_tests.py └── uv.lock /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/.gitignore -------------------------------------------------------------------------------- /CHANGELOG.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/CHANGELOG.md -------------------------------------------------------------------------------- /CODE_OF_CONDUCT.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/CODE_OF_CONDUCT.md -------------------------------------------------------------------------------- /CONTRIBUTING.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/CONTRIBUTING.md -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/LICENSE -------------------------------------------------------------------------------- /NOTICE.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/NOTICE.txt -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/README.md -------------------------------------------------------------------------------- /docs/ExamplesCfnTemplates/Batch-Large-Scale.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/docs/ExamplesCfnTemplates/Batch-Large-Scale.yaml -------------------------------------------------------------------------------- /docs/ExamplesCfnTemplates/VPC-Large-Scale-singleAZ.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/docs/ExamplesCfnTemplates/VPC-Large-Scale-singleAZ.yaml -------------------------------------------------------------------------------- /docs/ExamplesCfnTemplates/VPC-Large-Scale.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/docs/ExamplesCfnTemplates/VPC-Large-Scale.yaml -------------------------------------------------------------------------------- /docs/architecture.drawio: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/docs/architecture.drawio -------------------------------------------------------------------------------- /docs/architecture.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/docs/architecture.png -------------------------------------------------------------------------------- /docs/jobs_transitions.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/docs/jobs_transitions.png -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/pyproject.toml -------------------------------------------------------------------------------- /src/ASGMonitoring/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/ASGMonitoring/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/src/ASGMonitoring/app.py -------------------------------------------------------------------------------- /src/ASGMonitoring/requirements.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/BatchJobsStates/JobStatesStateMachineServerless.asl.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/src/BatchJobsStates/JobStatesStateMachineServerless.asl.json -------------------------------------------------------------------------------- /src/BatchJobsStates/JobStatesToCW/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/BatchJobsStates/JobStatesToCW/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/src/BatchJobsStates/JobStatesToCW/app.py -------------------------------------------------------------------------------- /src/BatchJobsStates/JobStatesToCW/requirements.txt: -------------------------------------------------------------------------------- 1 | aws-embedded-metrics 2 | -------------------------------------------------------------------------------- /src/BatchJobsStates/ParseJobProperties/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/BatchJobsStates/ParseJobProperties/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/src/BatchJobsStates/ParseJobProperties/app.py -------------------------------------------------------------------------------- /src/BatchJobsStates/ParseJobProperties/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/src/BatchJobsStates/ParseJobProperties/requirements.txt -------------------------------------------------------------------------------- /src/ECSInstancesRegistration/ECSInstancesRegistrationStateMachineServerless.asl.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/src/ECSInstancesRegistration/ECSInstancesRegistrationStateMachineServerless.asl.json -------------------------------------------------------------------------------- /src/ECSInstancesRegistration/MetricToCW/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/ECSInstancesRegistration/MetricToCW/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/src/ECSInstancesRegistration/MetricToCW/app.py -------------------------------------------------------------------------------- /src/ECSInstancesRegistration/MetricToCW/requirements.txt: -------------------------------------------------------------------------------- 1 | aws-embedded-metrics 2 | -------------------------------------------------------------------------------- /src/ECSRunTask/ECSRunTaskStateMachineServerless.asl.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/src/ECSRunTask/ECSRunTaskStateMachineServerless.asl.json -------------------------------------------------------------------------------- /src/ECSRunTask/ECSTaskEventsStateMachineServerless.asl.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/src/ECSRunTask/ECSTaskEventsStateMachineServerless.asl.json -------------------------------------------------------------------------------- /src/ECSRunTask/RunTaskToCW/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/ECSRunTask/RunTaskToCW/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/src/ECSRunTask/RunTaskToCW/app.py -------------------------------------------------------------------------------- /src/ECSRunTask/RunTaskToCW/requirements.txt: -------------------------------------------------------------------------------- 1 | aws-embedded-metrics 2 | -------------------------------------------------------------------------------- /template.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/template.yaml -------------------------------------------------------------------------------- /tests/BatchJobStatesTests/batch-job-state-change-events/batch-event-MNP-CHILD-NODE-FAILED.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/tests/BatchJobStatesTests/batch-job-state-change-events/batch-event-MNP-CHILD-NODE-FAILED.json -------------------------------------------------------------------------------- /tests/BatchJobStatesTests/batch-job-state-change-events/batch-event-MNP-CHILD-NODE.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/tests/BatchJobStatesTests/batch-job-state-change-events/batch-event-MNP-CHILD-NODE.json -------------------------------------------------------------------------------- /tests/BatchJobStatesTests/batch-job-state-change-events/batch-event-MNP-MAIN-NODE.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/tests/BatchJobStatesTests/batch-job-state-change-events/batch-event-MNP-MAIN-NODE.json -------------------------------------------------------------------------------- /tests/BatchJobStatesTests/batch-job-state-change-events/batch-event-RUNNABLE.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/tests/BatchJobStatesTests/batch-job-state-change-events/batch-event-RUNNABLE.json -------------------------------------------------------------------------------- /tests/BatchJobStatesTests/batch-job-state-change-events/batch-event-RUNNING.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/tests/BatchJobStatesTests/batch-job-state-change-events/batch-event-RUNNING.json -------------------------------------------------------------------------------- /tests/BatchJobStatesTests/batch-job-state-change-events/batch-event-STARTING.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/tests/BatchJobStatesTests/batch-job-state-change-events/batch-event-STARTING.json -------------------------------------------------------------------------------- /tests/BatchJobStatesTests/batch-job-state-change-events/batch-event-SUCCEEDED.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/tests/BatchJobStatesTests/batch-job-state-change-events/batch-event-SUCCEEDED.json -------------------------------------------------------------------------------- /tests/BatchJobStatesTests/run_tests.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/tests/BatchJobStatesTests/run_tests.py -------------------------------------------------------------------------------- /tests/BatchJobStatesTests/test_parse_job_attributes.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/tests/BatchJobStatesTests/test_parse_job_attributes.py -------------------------------------------------------------------------------- /tests/BatchJobStatesTests/test_state_machine.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/tests/BatchJobStatesTests/test_state_machine.py -------------------------------------------------------------------------------- /tests/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/tests/README.md -------------------------------------------------------------------------------- /tests/run_all_tests.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/tests/run_all_tests.py -------------------------------------------------------------------------------- /uv.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-samples/aws-batch-runtime-monitoring/HEAD/uv.lock --------------------------------------------------------------------------------