├── .flake8 ├── .github ├── ISSUE_TEMPLATE │ ├── bug_report.md │ └── feature_request.md └── workflows │ ├── coverage.yml │ ├── release.yml │ └── tests.yml ├── .gitignore ├── .pre-commit-config.yaml ├── ABOUT.md ├── LICENSE ├── README.md ├── imgs └── example.png ├── mypy.ini ├── noxfile.py ├── poetry.lock ├── pyproject.toml ├── src └── reportseff │ ├── __init__.py │ ├── console.py │ ├── db_inquirer.py │ ├── job.py │ ├── job_collection.py │ ├── output_renderer.py │ └── parameters.py └── tests ├── conftest.py ├── test_db_inquirer.py ├── test_job.py ├── test_job_collection.py ├── test_output_renderer.py └── test_reportseff.py /.flake8: -------------------------------------------------------------------------------- 1 | [flake8] 2 | select = ANN,B,B9,BLK,C,D,DAR,E,F,I,W 3 | max-complexity = 10 4 | ignore = E203,W503,E501,ANN101,ANN401 5 | max-line-length = 80 6 | application-import-names= reportseff,tests 7 | import-order-style = google 8 | docstring-convention = google 9 | per-file-ignores = 10 | tests/*:S101,ANN,DAR 11 | noxfile.py:ANN,DAR 12 | src/reportseff/console.py:DAR101 13 | -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/bug_report.md: -------------------------------------------------------------------------------- 1 | --- 2 | name: Bug report 3 | about: Create a report to help us improve 4 | title: '' 5 | labels: bug 6 | assignees: troycomi 7 | 8 | --- 9 | 10 | **Describe the bug** 11 | A clear and concise description of what the bug is. 12 | 13 | **To Reproduce** 14 | Steps to reproduce the behavior: 15 | 1. Go to '...' 16 | 2. Click on '....' 17 | 3. Scroll down to '....' 18 | 4. See error 19 | 20 | **Expected behavior** 21 | A clear and concise description of what you expected to happen. 22 | 23 | **Screenshots** 24 | If applicable, add screenshots to help explain your problem. 25 | 26 | **Desktop (please complete the following information):** 27 | - OS: [e.g. iOS] 28 | - Version [e.g. 
22] 29 | 30 | **Debug Output** 31 | ```bash 32 | reportseff --debug [other options] 33 | # paste result here 34 | ``` 35 | 36 | **Additional context** 37 | Add any other context about the problem here. 38 | -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/feature_request.md: -------------------------------------------------------------------------------- 1 | --- 2 | name: Feature request 3 | about: Suggest an idea for this project 4 | title: '' 5 | labels: enhancement 6 | assignees: troycomi 7 | 8 | --- 9 | 10 | **Is your feature request related to a problem? Please describe.** 11 | A clear and concise description of what the problem is. Ex. I'm always frustrated when [...] 12 | 13 | **Describe the solution you'd like** 14 | A clear and concise description of what you want to happen. 15 | 16 | **Describe alternatives you've considered** 17 | A clear and concise description of any alternative solutions or features you've considered. 18 | 19 | **Additional context** 20 | Add any other context or screenshots about the feature request here. 
21 | -------------------------------------------------------------------------------- /.github/workflows/coverage.yml: -------------------------------------------------------------------------------- 1 | name: Coverage 2 | on: [push, pull_request] 3 | jobs: 4 | coverage: 5 | runs-on: ubuntu-latest 6 | steps: 7 | - uses: actions/checkout@v3 8 | - uses: wntrblm/nox@2022.11.21 9 | with: 10 | python-versions: "3.9, 3.10, 3.11" 11 | - run: pipx install poetry==1.3.1 12 | - run: pipx inject poetry poetry-plugin-export 13 | - run: nox --sessions tests-3.10 coverage 14 | -------------------------------------------------------------------------------- /.github/workflows/release.yml: -------------------------------------------------------------------------------- 1 | name: Release 2 | on: 3 | release: 4 | types: [published] 5 | jobs: 6 | release: 7 | runs-on: ubuntu-latest 8 | steps: 9 | - uses: actions/checkout@v3 10 | - uses: wntrblm/nox@2022.11.21 11 | with: 12 | python-versions: "3.9, 3.10, 3.11" 13 | - run: pipx install poetry==1.3.1 14 | - run: pipx inject poetry poetry-plugin-export 15 | - run: nox 16 | - run: poetry build 17 | - run: poetry publish --username=__token__ --password=${{ secrets.PYPI_TOKEN }} 18 | -------------------------------------------------------------------------------- /.github/workflows/tests.yml: -------------------------------------------------------------------------------- 1 | name: Tests 2 | on: [push, pull_request] 3 | jobs: 4 | tests: 5 | runs-on: ubuntu-latest 6 | steps: 7 | - uses: actions/checkout@v3 8 | - uses: wntrblm/nox@2022.11.21 9 | with: 10 | python-versions: "3.9, 3.10, 3.11" 11 | - run: pipx install poetry==1.3.1 12 | - run: pipx inject poetry poetry-plugin-export 13 | - run: nox 14 | -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- 1 | __pycache__/ 2 | *.egg-info 3 | *.swp 4 | 
-------------------------------------------------------------------------------- /.pre-commit-config.yaml: -------------------------------------------------------------------------------- 1 | repos: 2 | - repo: https://github.com/pre-commit/pre-commit-hooks 3 | rev: "v5.0.0" 4 | hooks: 5 | - id: check-added-large-files 6 | - id: check-case-conflict 7 | - id: check-merge-conflict 8 | - id: check-symlinks 9 | - id: check-yaml 10 | - id: debug-statements 11 | - id: end-of-file-fixer 12 | - id: mixed-line-ending 13 | - id: name-tests-test 14 | args: ["--pytest-test-first"] 15 | - id: requirements-txt-fixer 16 | - id: trailing-whitespace 17 | 18 | - repo: https://github.com/pre-commit/pygrep-hooks 19 | rev: v1.9.0 20 | hooks: 21 | - id: python-check-blanket-noqa 22 | - id: python-no-eval 23 | - id: python-use-type-annotations 24 | - id: python-check-blanket-type-ignore 25 | - id: python-check-mock-methods 26 | 27 | - repo: https://github.com/codespell-project/codespell 28 | rev: v2.1.0 29 | hooks: 30 | - id: codespell 31 | args: [--ignore-words-list, "absense,inout"] 32 | 33 | - repo: https://github.com/shellcheck-py/shellcheck-py 34 | rev: v0.8.0.4 35 | hooks: 36 | - id: shellcheck 37 | 38 | - repo: https://github.com/astral-sh/ruff-pre-commit 39 | rev: v0.5.5 40 | hooks: 41 | - id: ruff 42 | args: [ --fix ] 43 | - id: ruff-format 44 | -------------------------------------------------------------------------------- /ABOUT.md: -------------------------------------------------------------------------------- 1 | # Monitoring slurm efficiency with reportseff 2 | 3 | > Troy Comi 4 | 5 | ## Motivation 6 | 7 | As I started using Snakemake, I had hundreds of jobs which I wanted to get 8 | performance information about. seff gave the efficiency information I wanted, 9 | but for only a single job at a time. `sacct` handles multiple jobs, but couldn't 10 | give the efficiency. 
With the current python implementation, 11 | all job information is obtained from a single 12 | `sacct` call and with click the output is colored to quickly see how things are 13 | running. (But color isn't displayed below due to markdown limitations). 14 | 15 | ## Be good to your scheduler 16 | 17 | ### An introduction to scheduling efficiency 18 | 19 | Have you ever hosted an event that had to provide food? Perhaps you sent out 20 | RSVP's to estimate how many people would attend, guessed a handful of people 21 | would show up but not respond, and ordered some pizza. If you ordered enough 22 | food for 20 people and 18 showed, that would be a pizza efficiency of 90%. 23 | But what if only 2 people showed up? Or 30? As extreme as these numbers seem, 24 | memory and cpu usage efficiencies around 10% are not uncommon. 25 | 26 | The goal of a scheduler is to take the user-provided resource 27 | estimates for many jobs and decide who runs when. Let's say I have a small 28 | cluster with 64 cores, 128 GB of memory and want to run an array job of 29 | single-core processes with an estimated memory usage of 4 GB. The scheduler 30 | will allow only 32 jobs to run at once (128 GB / 4 GB) leaving half of the 31 | cores idling. If I actually only use 1 GB of memory, 64 jobs could be running 32 | instead. 33 | 34 | **Good jobs use the resources they promise to.** 35 | 36 | In practice, many more details of the system and user are incorporated into 37 | the decision to schedule a job. Once the scheduler decides a job will run, 38 | the scheduler has to dispatch the job. The overhead associated with scheduling 39 | only makes sense if the job will run for longer than a few minutes. Instead of 40 | submitting 1000 jobs that perform 1 minute of work, group 100 subprocesses 41 | together as 10 jobs with 100 minutes of work. 
42 | 43 | **Good jobs run long enough to matter.** 44 | 45 | If every job on a cluster is efficient and long-running, the scheduler can 46 | make accurate decisions on execution order and keep usage high. 47 | 48 | ### Why does it matter as a user? 49 | 50 | "But my qos only allows 2 jobs to run at once if the time 51 | is less than 2 hours! Can't I say my 10 minute job will take 2 hours?" Yes, 52 | but it is *rude* to the scheduler. If that doesn't sway you, improperly 53 | estimating resource usage can: 54 | 55 | - Decrease your priority for subsequent jobs. 56 | - Cause your account to be charged for the full, estimated usage. 57 | - Have fewer of your jobs running simultaneously. 58 | - Make it harder to fit your job into the available cluster resources, 59 | increasing the queue time. 60 | 61 | ### Monitoring efficiency 62 | 63 | Before releasing a swarm of jobs, check the estimated vs predicted usage. 64 | Tune your parameters to improve efficiency. 65 | 66 | [Seff](https://github.com/SchedMD/slurm/tree/master/contribs/seff) provides 67 | efficiency estimates for a single job. But to look at your usage 68 | for many jobs or monitor usage, I wrote 69 | [reportseff](https://github.com/troycomi/reportseff). It polls `sacct` 70 | and calculates the same efficiency information as seff, but outputs 71 | a tabular report. 72 | 73 | During testing, I looked at random ranges of jobids on a Princeton cluster. 
74 | Here is some typical output, with jobids modified to protect the innocent: 75 | 76 | ```txt 77 | Name State Time CPU Memory 78 | XXXXX000 COMPLETED 00:01:53 97.3% 14.0% 79 | XXXXX001 COMPLETED 00:02:19 84.2% 14.0% 80 | XXXXX002 COMPLETED 00:06:33 28.2% 14.0% 81 | XXXXX003 COMPLETED 00:04:59 39.1% 14.0% 82 | XXXXX004 COMPLETED 00:02:31 97.4% 9.2% 83 | XXXXX005 COMPLETED 00:02:38 98.1% 9.1% 84 | XXXXX006 COMPLETED 00:02:24 97.2% 9.1% 85 | XXXXX007 COMPLETED 00:02:40 98.1% 9.0% 86 | XXXXX008 COMPLETED 00:02:39 96.2% 9.1% 87 | XXXXX009 COMPLETED 00:02:45 96.4% 9.0% 88 | XXXXX012 COMPLETED 00:00:53 58.5% 10.6% 89 | XXXXX013 COMPLETED 00:02:13 38.3% 10.6% 90 | XXXXX014 COMPLETED 00:37:02 44.9% 10.6% 91 | XXXXX015 COMPLETED 00:44:33 34.0% 10.6% 92 | XXXXX016 COMPLETED 00:38:29 29.6% 10.7% 93 | XXXXX017 COMPLETED 00:19:57 74.5% 10.8% 94 | XXXXX018 COMPLETED 00:14:25 95.0% 10.8% 95 | XXXXX019 COMPLETED 00:35:38 2.6% 10.6% 96 | XXXXX020 COMPLETED 00:02:16 38.2% 10.6% 97 | XXXXX021 COMPLETED 00:02:34 46.1% 10.9% 98 | XXXXX022 COMPLETED 00:20:53 7.1% 10.6% 99 | XXXXX023 COMPLETED 00:01:00 95.0% 11.1% 100 | XXXXX024 COMPLETED 00:09:06 88.5% 10.5% 101 | XXXXX025 COMPLETED 00:08:08 95.3% 10.6% 102 | ``` 103 | 104 | This is from at least 3 different users across departments. 105 | 106 | Notice how short the jobs are (most <5 minutes) and how little memory is used, 107 | about 500 MB of 4 GB in most cases. Another example is jobs with 4 cores using 108 | 25% of CPU. Though batching together short jobs is slightly difficult (nested 109 | for loops with some arithmetic), using the correct number of cores and cutting 110 | memory to improve usage is a simple fix. 111 | 112 | Try it out and see if you have been good to your scheduler! 
113 | -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | MIT License 2 | 3 | Copyright (c) 2019 troycomi 4 | 5 | Permission is hereby granted, free of charge, to any person obtaining a copy 6 | of this software and associated documentation files (the "Software"), to deal 7 | in the Software without restriction, including without limitation the rights 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 9 | copies of the Software, and to permit persons to whom the Software is 10 | furnished to do so, subject to the following conditions: 11 | 12 | The above copyright notice and this permission notice shall be included in all 13 | copies or substantial portions of the Software. 14 | 15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 21 | SOFTWARE. 
22 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | [![Tests](https://github.com/troycomi/reportseff/workflows/Tests/badge.svg)](https://github.com/troycomi/reportseff/actions?workflow=Tests) 2 | [![codecov](https://codecov.io/gh/troycomi/reportseff/branch/main/graph/badge.svg)](https://codecov.io/gh/troycomi/reportseff) 3 | [![PyPI](https://img.shields.io/pypi/v/reportseff.svg)](https://pypi.org/project/reportseff/) 4 | [![DOI](https://img.shields.io/badge/doi-10.1145/3569951.3604396-blue.svg?style=flat&labelColor=whitesmoke&logo=data%3Aimage%2Fpng%3Bbase64%2CiVBORw0KGgoAAAANSUhEUgAAAB8AAAAfCAYAAAAfrhY5AAAJsklEQVR42qWXd1DTaRrHf%2BiB2Hdt5zhrAUKz4IKEYu9IGiGFFJJQ0gkJCAKiWFDWBRdFhCQUF3UVdeVcRQEBxUI3yY9iEnQHb3bdW1fPubnyz%2F11M7lvEHfOQee2ZOYzPyDv%2B3yf9%2Fk95YX4fx%2BltfUt08GcFEuPR4U9hDDZ%2FVngIlhb%2FSiI6InkTgLzgDcgfvtnovhH4BzoVlrbwr55QnhCtBW4QHXnFrZbPBaQoBh4%2FSYH2EnpBEtqcDMVzB93wA%2F8AFwa23XFGcc8CkT3mxz%2BfXWtq9T9IQlLIXYEuHojudb%2BCM7Hgdq8ydi%2FAHiBXyY%2BLjwFlAEnS6Jnar%2FvnQVhvdzasad0eKvWZKe8hvDB2ofLZ%2FZEcWsh%2BhyIuyO5Bxs2iZIE4nRv7NWAb0EO8AC%2FWPxjYAWuOEX2MSXZVgPxzmRL3xKz3ScGpx6p6QnOx4mDIFqO0w6Q4fEhO5IzwxlSwyD2FYHzwAW%2BAZ4fEsf74gCumykwNHskLM7taQxLYjjIyy8MUtraGhTWdkfhkFJqtvuVl%2F9l2ZquDfEyrH8B0W06nnpH3JtIyRGpH1iJ6SfxDIHjRXHJmdQjLpfHeN54gnfFx4W9QRnovx%2FN20aXZeTD2J84hn3%2BqoF2Tqr14VqTPUCIcP%2B5%2Fly4qC%2BUL3sYxSvNj1NwsVYPsWdMUfomsdkYm3Tj0nbV0N1wRKwFe1MgKACDIBdMAhPE%2FwicwNWxll8Ag40w%2BFfhibJkGHmutjYeQ8gVlaN%2BjO51nDysa9TwNUFMqaGbKdRJZFfOJSp6mkRKsv0rRIpEVWjAvyFkxNOEpwvcAVPfEe%2Bl8ojeNTx3nXLBcWRrYGxSRjDEk0VlpxYrbe1ZmaQ5xuT0u3r%2B2qe5j0J5uytiZPGsRL2Jm32AldpxPUNJ3jmmsN4x62z1cXrbedXBQf2yvIFCeZrtyicZZG2U2nrrBJzYorI2EXLrvTfCSB43s41PKEvbZDEfQby6L4JTj%2FfIwam%2B4%2BwucBu%2BDgNK05Nle1rSt9HvR%2FKPC4U6LTfvUIaip1mjIa8fPzykii23h2eanT57zQ7fsyYH5QjywwlooAUcAdOh5QumgTHx6aAO7%2FL52eaQNEShrxfhL6albEDmfhGflrsT4tps8gTHNOJbeDeBlt0WJWDHSgxs6cW6lQqyg1FpD5ZVDfhn1HYF
F1y4Eiaqa18pQf3zzYMBhcanlBjYfgWNayAf%2FASOgklu8bmgD7hADrk4cRlOL7NSOewEcbqSmaivT33QuFdHXj5sdvjlN5yMDrAECmdgDWG2L8P%2BAKLs9ZLZ7dJda%2BB4Xl84t7QvnKfvpXJv9obz2KgK8dXyqISyV0sXGZ0U47hOA%2FAiigbEMECJxC9aoKp86re5O5prxOlHkcksutSQJzxZRlPZmrOKhsQBF5zEZKybUC0vVjG8PqOnhOq46qyDTDnj5gZBriWCk4DvXrudQnXQmnXblebhAC2cCB6zIbM4PYgGl0elPSgIf3iFEA21aLdHYLHUQuVkpgi02SxFdrG862Y8ymYGMvXDzUmiX8DS5vKZyZlGmsSgQqfLub5RyLNS4zfDiZc9Edzh%2FtCE%2BX8j9k%2FqWB071rcZyMImne1SLkL4GRw4UPHMV3jjwEYpPG5uW5fAEot0aTSJnsGAwHJi2nvF1Y5OIqWziVCQd5NT7t6Q8guOSpgS%2Fa1dSRn8JGGaCD3BPXDyQRG4Bqhu8XrgAp0yy8DMSvvyVXDgJcJTcr1wQ2BvFKf65jqhvmxXUuDpGBlRvV36XvGjQzLi8KAKT2lYOnmxQPGorURSV0NhyTIuIyqOmKTMhQ%2BieEsgOgpc4KBbfDM4B3SIgFljvfHF6cef7qpyLBXAiQcXvg5l3Iunp%2FWv4dH6qFziO%2BL9PbrimQ9RY6MQphEfGUpOmma7KkGzuS8sPUFnCtIYcKCaI9EXo4HlQLgGrBjbiK5EqMj2AKWt9QWcIFMtnVvQVDQV9lXJJqdPVtUQpbh6gCI2Ov1nvZts7yYdsnvRgxiWFOtNJcOMVLn1vgptVi6qrNiFOfEjHCDB3J%2BHDLqUB77YgQGwX%2Fb1eYna3hGKdlqJKIyiE4nSbV8VFgxmxR4b5mVkkeUhMgs5YTi4ja2XZ009xJRHdkfwMi%2BfocaancuO7h%2FMlcLOa0V%2FSw6Dq47CumRQAKhgbOP8t%2BMTjuxjJGhXCY6XpmDDFqWlVYbQ1aDJ5Cptdw4oLbf3Ck%2BdWkVP0LpH7s9XLPXI%2FQX8ws%2Bj2In63IcRvOOo%2BTTjiN%2BlssfRsanW%2B3REVKoavBOAPTXABW4AL7e4NygHdpAKBscmlDh9Jysp4wxbnUNna3L3xBvyE1jyrGIkUHaqQMuxhHElV6oj1picvgL1QEuS5PyZTEaivqh5vUCKJqOuIgPFGESns8kyFk7%2FDxyima3cYxi%2FYOQCj%2F%2B9Ms2Ll%2Bhn4FmKnl7JkGXQGDKDAz9rUGL1TIlBpuJr9Be2JjK6qPzyDg495UxXYF7JY1qKimw9jWjF0iV6DRIqE%2B%2FeWG0J2ofmZTk0mLYVd4GLiFCOoKR0Cg727tWq981InYynvCuKW43aXgEjofVbxIqrm0VL76zlH3gQzWP3R3Bv9oXxclrlO7VVtgBRpSP4hMFWJ8BrUSBCJXC07l40X4jWuvtc42ofNCxtlX2JH6bdeojXgTh5TxOBKEyY5wvBE%2BACh8BtOPNPkApjoxi5h%2B%2FFMQQNpWvZaMH7MKFu5Ax8HoCQdmGkJrtnOiLHwD3uS5y8%2F2xTSDrE%2F4PT1yqtt6vGe8ldMBVMEPd6KwqiYECHDlfbvzphcWP%2BJiZuL5swoWQYlS%2Br7Yu5mNUiGD2retxBi9fl6RDGn4Ti9B1oyYy%2BMP5G87D%2FCpRlvdnuy0PY6RC8BzTA40NXqckQ9TaOUDywkYsudxJzPgyDoAWn%2BB6nEFbaVxxC6UXjJiuDkW9TWq7uRBOJocky9iMfUhGpv%2FdQuVVIuGjYqACbXf8aa%2BPeYNIHZsM7l4s5gAQuUAzRUoT51hnH3EWofXf2vkD5HJJ33vwE%2FaEWp36GHr6GpMaH4AAPuqM5eabH%2FhfG9zcCz4nN6cPinuAw6IHwtvyB%2FdO1to
ZciBaPh25U0ducR2PI3Zl7mokyLWKkSnEDOg1x5fCsJE9EKhH7HwFNhWMGMS7%2BqxyYsbHHRUDUH4I%2FAheQY7wujJNnFUH4KdCju83riuQeHU9WEqNzjsJFuF%2FdTDAZ%2FK7%2F1WaAU%2BAWymT59pVMT4g2AxcwNa0XEBDdBDpAPvgDIH73R25teeuAF5ime2Ul0OUIiG4GpSAEJeYW9wDTf43wfwHgHLKJoPznkwAAAABJRU5ErkJggg%3D%3D)](https://doi.org/10.1145/3569951.3604396) 5 | 6 | # `reportseff` 7 | 8 | > A python script for tabular display of slurm efficiency information 9 | 10 | ![Example](https://github.com/troycomi/reportseff/raw/main/imgs/example.png) 11 | 12 | ## About 13 | 14 | ### Motivation 15 | 16 | Whether a sys admin or cluster user, knowing how well you are estimating job 17 | resources can help streamline job scheduling and maximize your priority. If you 18 | have ever tried to use `sacct` you probably had some trouble interpreting the 19 | output. While `seff` or `jobstats` can provide detailed summaries, they don't 20 | scale easily to array jobs or offer a way to see all the jobs from a single 21 | user. `reportseff` aims to fill this role. Read more about the [motivation 22 | for reportseff](https://github.com/troycomi/reportseff/blob/main/ABOUT.md). 23 | 24 | ### Audience 25 | 26 | If you are running more than one slurm job at a time, you should try 27 | `reportseff`. Users of HPC systems can get an idea how well they estimate 28 | resource usage. By tuning these values, you can get scheduled earlier and not 29 | be penalized for unused allocations. Since `reportseff` can parse job ids from 30 | slurm output files, it simplifies the task of identifying which jobs have 31 | failed and why. Sys admins can pipe `reportseff` output to identify users with 32 | poor utilization or produce summaries at the end of a billing cycle. 33 | 34 | ### Implementation 35 | 36 | `reportseff` is a wrapper around `sacct` that provides more complex option 37 | parsing, simpler options, and cleaner, colored outputs. All querying is 38 | performed in a single call to `sacct` and should have similar performance. 
39 | Multi-node and GPU utilization is acquired from information contained in the 40 | `AdminComment` field, as generated by `jobstats`. 41 | 42 | ## Usage 43 | 44 | ### Installation 45 | 46 | `reportseff` runs on python >= 3.6. 47 | The only external dependency is click (>= 6.7). 48 | Calling 49 | 50 | ```sh 51 | pip install --user reportseff 52 | # OR 53 | pipx install reportseff 54 | ``` 55 | 56 | will create command line bindings and install click. 57 | 58 | ### Sample Usage 59 | 60 | Try `reportseff -u $USER` or just `reportseff` in a directory with some slurm 61 | outputs. You may be surprised by your results! 62 | 63 | #### Single job 64 | 65 | Calling `reportseff` with a single jobid will provide equivalent information to 66 | seff for that job. `reportseff 24371789` and `reportseff map_fastq_24371789` 67 | produce the following output: 68 | 69 | ```txt 70 | JobID State Elapsed CPUEff MemEff 71 | 24371789 COMPLETED 03:08:03 71.2% 45.7% 72 | ``` 73 | 74 | #### Single array job 75 | 76 | Providing either the raw job id or the array job id will get efficiency 77 | information for a single element of the array job. `reportseff 24220929_421` 78 | and `reportseff 24221219` generate: 79 | 80 | ```txt 81 | JobID State Elapsed CPUEff MemEff 82 | 24220929_421 COMPLETED 00:09:34 99.0% 34.6% 83 | ``` 84 | 85 | #### Array job group 86 | 87 | If the base job id of an array is provided, all elements of the array will 88 | be added to the output. `reportseff 24220929` 89 | 90 | ```txt 91 | JobID State Elapsed CPUEff MemEff 92 | 24220929_1 COMPLETED 00:10:43 99.2% 33.4% 93 | 24220929_11 COMPLETED 00:10:10 99.2% 37.5% 94 | 24220929_21 COMPLETED 00:09:25 98.8% 36.1% 95 | 24220929_31 COMPLETED 00:09:19 98.9% 33.3% 96 | 24220929_41 COMPLETED 00:09:23 98.9% 33.3% 97 | 24220929_51 COMPLETED 00:08:02 98.5% 36.3% 98 | ... 
99 | 24220929_951 COMPLETED 00:25:12 99.5% 33.5% 100 | 24220929_961 COMPLETED 00:39:26 99.7% 34.1% 101 | 24220929_971 COMPLETED 00:24:11 99.5% 34.2% 102 | 24220929_981 COMPLETED 00:24:50 99.5% 44.3% 103 | 24220929_991 COMPLETED 00:13:05 98.7% 33.7% 104 | ``` 105 | 106 | #### Glob expansion of slurm outputs 107 | 108 | Because slurm output files can act as job id inputs, the following can 109 | get all seff information for a given job name: 110 | 111 | ```txt 112 | slurm_out ❯❯❯ reportseff split_ubam_24* 113 | JobID State Elapsed CPUEff MemEff 114 | split_ubam_24342816 COMPLETED 23:30:32 99.9% 4.5% 115 | split_ubam_24342914 COMPLETED 22:40:51 99.9% 4.6% 116 | split_ubam_24393599 COMPLETED 23:43:36 99.4% 4.4% 117 | split_ubam_24393655 COMPLETED 21:36:58 99.3% 4.5% 118 | split_ubam_24418960 RUNNING 02:53:11 --- --- 119 | split_ubam_24419972 RUNNING 01:26:26 --- --- 120 | ``` 121 | 122 | #### No arguments 123 | 124 | Without arguments, reportseff will try to find slurm output files in the 125 | current directory. Combine with `watch` to monitor job progress: 126 | `watch -cn 300 reportseff --color --modified-sort` 127 | 128 | ```txt 129 | JobID State Elapsed CPUEff MemEff 130 | split_ubam_24418960 RUNNING 02:56:14 --- --- 131 | fastq_to_ubam_24419971 RUNNING 01:29:29 --- --- 132 | split_ubam_24419972 RUNNING 01:29:29 --- --- 133 | fastq_to_ubam_24393600 COMPLETED 1-02:00:47 58.3% 41.1% 134 | map_fastq_24419330 RUNNING 02:14:53 --- --- 135 | map_fastq_24419323 RUNNING 02:15:24 --- --- 136 | map_fastq_24419324 RUNNING 02:15:24 --- --- 137 | map_fastq_24419322 RUNNING 02:15:24 --- --- 138 | mark_adapters_24418437 COMPLETED 01:29:23 99.8% 48.2% 139 | mark_adapters_24418436 COMPLETED 01:29:03 99.9% 47.4% 140 | ``` 141 | 142 | #### Filtering slurm output files 143 | 144 | One useful application of `reportseff` is filtering a directory of slurm output 145 | files based on the state or time since running. 
Additionally, if only the 146 | `jobid` is specified as a format output, the filenames will be returned in a 147 | pipe-friendly manner: 148 | 149 | ```txt 150 | old_runs ❯❯❯ reportseff --since d=4 --state Timeout 151 | 152 | JobID State Elapsed CPUEff MemEff 153 | call_variants_31550458 TIMEOUT 20:05:17 99.5% 0.0% 154 | call_variants_31550474 TIMEOUT 20:05:17 99.6% 0.0% 155 | call_variants_31550500 TIMEOUT 20:05:08 99.7% 0.0% 156 | old_runs ❯❯❯ reportseff --since d=4 --state Timeout --format jobid 157 | call_variants_31550458 158 | call_variants_31550474 159 | call_variants_31550500 160 | ``` 161 | 162 | To find all lines with `output:` in jobs which have timed out or failed 163 | in the last 4 days: 164 | 165 | ```sh 166 | reportseff --since 'd=4' --state TO,F --format jobid | xargs grep output: 167 | ``` 168 | 169 | ### Arguments 170 | 171 | Jobs can be passed as arguments in the following ways: 172 | 173 | - Job ID such as 1234567. If the id is part of an array job, only the element 174 | for that ID will be displayed. If the id is the base part of an array job, 175 | all elements in the array will be displayed. 176 | - Array Job ID such as 1234567\_89. Will display only the element specified. 177 | - Slurm output file. Format must be BASE\_%A\_%a. BASE is optional as is a 178 | '.out' suffix. Unix glob expansions can also be used to filter which jobs 179 | are displayed. 180 | - From current directory. If no argument is supplied, `reportseff` will attempt 181 | to find slurm output files in the current directory as described above. 182 | If a user is provided, instead `reportseff` will show recent jobs for that user. 183 | If only `since` is set, all recent jobs for all users will be shown (if allowed). 184 | - Supplying a directory as a single argument will override the current 185 | directory to check for slurm outputs. 186 | 187 | ### Options 188 | 189 | - `--color/--no-color`: Force color output or not. By default, will force color 190 | output. 
With the no-color flag, click will strip color codes for everything 191 | besides stdout. 192 | - `--modified-sort`: Instead of sorting by filename/jobid, sort by last 193 | modification time of the slurm output file. 194 | - `--debug`: Write sacct result to stderr. 195 | - `--user/-u`: Ignore job arguments and instead query sacct with provided user. 196 | Returns all jobs from the last week. 197 | - `--state/-s`: Output only jobs with states matching one of the provided options. 198 | Accepts comma separated values of job codes (e.g. 'R') or full names 199 | (e.g. RUNNING). Case insensitive. 200 | - `--not-state/-S`: Output only jobs with states not matching any of the provided options. 201 | Accepts comma separated values of job codes (e.g. 'R') or full names 202 | (e.g. RUNNING). Case insensitive. 203 | - `--format`: Provide a comma separated list of columns to produce. Prefixing the 204 | argument with `+` adds the specified values to the defaults. Values can 205 | be any valid column name to sacct and the custom efficiency values: TimeEff, 206 | cpuEff, MemEff. Can also optionally set alignment (<, ^, >) and maximum width. 207 | Default is center-aligned with a width of the maximum column entry. For 208 | example, `--format 'jobid%>,state%10,memeff%<5'` produces 3 columns with: 209 | - JobId aligned right, width set automatically 210 | - State with width 10 (center aligned by default) 211 | - MemEff aligned left, width 5 212 | - `--slurm-format`: The filename pattern passed to sbatch during job submission. 213 | Overrides the default regex for job id parsing from filenames. E.g. to match 214 | filenames like `123456.out` set `--slurm-format %j.out`. 215 | - `--since`: Limit results to those occurring after the specified time. Accepts 216 | sacct formats and a comma separated list of key/value pairs. To get jobs in 217 | the last hour and a half, can pass `h=1,m=30`. 218 | -`--until`: Limit results to those occurring before the specified time. 
Accepts 219 | sacct formats and a comma separated list of key/value pairs. 220 | Useful in combination with the 'since' option to query a specific range. 221 | - `--partition`: Limit results to a specific partition. 222 | - `--cluster/-M`: Select specific cluster (for multi-cluster systems) 223 | - `--node/-n`: Display information for multi-node jobs; requires additional 224 | sacct fields from jobstats. 225 | - `--node-and-gpu/-g`: Display information for multi-node jobs and GPU information; 226 | requires additional sacct fields from jobstats. 227 | - `--parsable/-p`: Ignore formatting and output as a `|` delimited table. Useful 228 | for piping into more complex analyses. 229 | 230 | ## Status, Contributions, and Support 231 | 232 | `reportseff` is actively maintained but currently feature complete. If there 233 | is a function missing, please open an issue to discuss its merit! 234 | 235 | Bug reports, pull requests, and any feedback are welcome! Prior to submitting 236 | a pull request, be sure any new features have been tested and all unit tests 237 | are passing. In the cloned repo with 238 | [poetry](https://github.com/python-poetry/poetry#installation) installed: 239 | 240 | ```sh 241 | poetry install 242 | poetry run pytest 243 | poetry run pre-commit install 244 | nox 245 | ``` 246 | 247 | ## Troubleshooting 248 | 249 | ### I can't install, what is pip? 250 | 251 | [pip](https://pip.pypa.io/en/stable/) is the package installer for python. If 252 | you get an error that pip isn't found, look for a python/anaconda/conda module. 253 | [pipx](https://pypa.github.io/pipx/) ensures that each application is installed 254 | in an isolated environment. This resolves issues of dependency versions and 255 | allows applications to be run from any environment. 256 | 257 | ### The output has no color with many jobs! 258 | 259 | Click should determine if the output supports color display and react automatically 260 | in a way you expect. 
Check that your terminal is set up to display colors and 261 | that your pager (probably less) will display color by default. Some commands, 262 | e.g. `watch` aren't handled properly even when invoked to support color. Here 263 | are some useful settings for your `.bashrc`: 264 | ``` 265 | # have less display colors by default. Will fix `reportseff` not showing colors 266 | export LESS="-R" 267 | # for watch aliases, include the `--color` option 268 | watch -cn 300 reportseff --color --modified-sort 269 | # ^ ^^^^^^^ 270 | ``` 271 | You can always force display of color (or suppress it) with the `--color/--no-color` 272 | options. 273 | 274 | ### I get an error about broken pipes when chaining to other commands 275 | 276 | Python will report that the consumer of process output has closed the stream 277 | (i.e. the pipe) while still attempting to write. Newer versions of click 278 | should suppress the warning output, but it seems to not always work. Besides 279 | some extra printing on stderr, the output is not affected. 280 | 281 | ### My jobs don't have any information about multiple nodes or GPU efficiency 282 | 283 | Because `sacct` doesn't currently record this information, `reportseff` 284 | retrieves it from a custom field from `jobstats`, developed at Princeton 285 | University. If you are outside a Research Computing cluster, that information 286 | will likely be absent. Node-level reporting is only shown for jobs which use 287 | multiple nodes or GPUs. If you need a list of where jobs were run, you can add 288 | `--format +NodeList`. 289 | 290 | ## Acknowledgments 291 | 292 | The code for calling sacct and parsing the returning information was taken 293 | from [Slurmee](https://github.com/PrincetonUniversity/slurmee). 
294 | 295 | Style and tooling from [hypermodern python](https://cjolowicz.github.io/posts/hypermodern-python-01-setup/) 296 | 297 | Code review provided from a [repo-review](https://researchcomputing.princeton.edu/services/repo-review-consultations) 298 | which vastly improved this readme. 299 | -------------------------------------------------------------------------------- /imgs/example.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/troycomi/reportseff/9dd39ecf52db79cafa5f7c32716f9d2af7d63fa6/imgs/example.png -------------------------------------------------------------------------------- /mypy.ini: -------------------------------------------------------------------------------- 1 | [mypy] 2 | 3 | [mypy-nox.*,pytest] 4 | ignore_missing_imports = True 5 | -------------------------------------------------------------------------------- /noxfile.py: -------------------------------------------------------------------------------- 1 | """Nox sessions.""" 2 | 3 | import tempfile 4 | 5 | import nox 6 | 7 | locations = "src", "tests", "noxfile.py" 8 | nox.options.sessions = "lint", "pip_audit", "mypy", "pytype", "tests", "tests_old_click" 9 | package = "reportseff" 10 | 11 | 12 | def install_with_constraints(session, *args, **kwargs): 13 | """Install packages with poetry's lock file.""" 14 | with tempfile.NamedTemporaryFile() as requirements: 15 | session.run( 16 | "poetry", 17 | "export", 18 | "--with", 19 | "dev", 20 | "--format=requirements.txt", 21 | "--without-hashes", 22 | f"--output={requirements.name}", 23 | external=True, 24 | ) 25 | # strip extras 26 | session.run( 27 | "sed", 28 | "-i", 29 | r"s/\[.*\]//g", 30 | f"{requirements.name}", 31 | external=True, 32 | ) 33 | session.install(f"--constraint={requirements.name}", *args, **kwargs) 34 | 35 | 36 | @nox.session(python=["3.9", "3.10", "3.11"]) 37 | def tests(session): 38 | """Run test suite with pytest and coverage.""" 39 | args = 
session.posargs 40 | session.install(".") 41 | install_with_constraints( 42 | session, "coverage[toml]", "pytest", "pytest-cov", "pytest-mock" 43 | ) 44 | session.run("pytest", "--cov", *args) 45 | 46 | 47 | @nox.session(python=["3.9", "3.10", "3.11"]) 48 | def tests_old_click(session): 49 | """Run test suite with pytest and coverage, using click 6.7.""" 50 | args = session.posargs 51 | session.install(".") 52 | session.run("pip", "install", "click==6.7") 53 | install_with_constraints( 54 | session, "coverage[toml]", "pytest", "pytest-cov", "pytest-mock" 55 | ) 56 | session.run("pytest", "--cov", *args) 57 | 58 | 59 | @nox.session(python="3.10") 60 | def black(session): 61 | """Format code with black.""" 62 | args = session.posargs or locations 63 | install_with_constraints(session, "ruff") 64 | session.run("ruff", "format", *args) 65 | 66 | 67 | @nox.session(python="3.10") 68 | def lint(session): 69 | """Lint code with ruff.""" 70 | args = session.posargs or locations 71 | install_with_constraints( 72 | session, 73 | "ruff", 74 | ) 75 | session.run("ruff", "check", *args) 76 | 77 | 78 | @nox.session(python="3.10") 79 | def pip_audit(session): 80 | """Scan dependencies for insecure packages.""" 81 | with tempfile.NamedTemporaryFile() as requirements: 82 | session.run( 83 | "poetry", 84 | "export", 85 | "--with", 86 | "dev", 87 | "--format=requirements.txt", 88 | "--without-hashes", 89 | f"--output={requirements.name}", 90 | external=True, 91 | ) 92 | install_with_constraints(session, "pip-audit") 93 | session.run( 94 | "pip-audit", 95 | "-r", 96 | requirements.name, 97 | ) 98 | 99 | 100 | @nox.session(python=["3.9", "3.10"]) 101 | def mypy(session): 102 | """Type-check with mypy.""" 103 | args = session.posargs or locations 104 | install_with_constraints(session, "mypy", "types-click") 105 | session.run("mypy", *args) 106 | 107 | 108 | @nox.session(python="3.10") 109 | def pytype(session): 110 | """Run the static type checker pytype.""" 111 | args = session.posargs 
or ["--disable=import-error", *locations] 112 | install_with_constraints(session, "pytype") 113 | session.run("pytype", *args) 114 | 115 | 116 | @nox.session(python="3.10") 117 | def typeguard(session): 118 | """Runtime type checking during unit tests.""" 119 | args = session.posargs 120 | session.run("poetry", "install", "--only", "main", external=True) 121 | install_with_constraints(session, "pytest", "pytest-mock", "typeguard") 122 | session.run("pytest", f"--typeguard-packages={package}", *args) 123 | 124 | 125 | @nox.session(python="3.10") 126 | def coverage(session): 127 | """Upload coverage data.""" 128 | install_with_constraints(session, "coverage[toml]", "codecov") 129 | session.run("coverage", "xml", "--fail-under=0") 130 | session.run("codecov", *session.posargs) 131 | -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- 1 | [tool.poetry] 2 | name = "reportseff" 3 | version = "2.8.3" 4 | description= "Tablular seff output" 5 | authors = ["Troy Comi "] 6 | license = "MIT" 7 | readme = "README.md" 8 | homepage= "https://github.com/troycomi/reportseff" 9 | repository= "https://github.com/troycomi/reportseff" 10 | keywords= ["slurm","seff"] 11 | 12 | [tool.poetry.dependencies] 13 | python = ">=3.9.1,<4.0" 14 | click = ">=6.7" 15 | importlib-metadata = {version = "^4.8.2", python = "<3.8"} 16 | 17 | [tool.poetry.dev-dependencies] 18 | pytest = "^8.2.2" 19 | pytest-mock = "^3.14.0" 20 | coverage = {extras = ["toml"], version = "^7.5.4"} 21 | pytest-cov = "^5.0.0" 22 | mypy = "^1.10.1" 23 | types-click = "^7.1.8" 24 | pytype = "^2024.4.11" 25 | typeguard = "^4.3.0" 26 | darglint = ">=1.8.1" 27 | codecov = ">=2.1.13" 28 | ruff = "^0.5.5" 29 | 30 | [tool.poetry.scripts] 31 | reportseff = "reportseff.console:main" 32 | 33 | [tool.poetry.group.dev-dependencies.dependencies] 34 | pip-audit = "^2.9.0" 35 | 36 | [build-system] 37 | requires = 
["poetry-core>=1.0.0"] 38 | build-backend = "poetry.core.masonry.api" 39 | 40 | # pyproject.toml 41 | [tool.coverage.paths] 42 | source = ["src", "*/site-packages"] 43 | 44 | [tool.coverage.run] 45 | branch = true 46 | source = ["reportseff"] 47 | 48 | [tool.coverage.report] 49 | show_missing = true 50 | fail_under = 100 51 | 52 | [tool.ruff.lint] 53 | select = [ 54 | "A", # builtins 55 | "ANN", # annotations 56 | "ARG", # tidy imports 57 | "B", # bugbear 58 | "BLE", 59 | "C4", # comprehensions 60 | "COM", # commas 61 | "D", # pydocstyle 62 | "E", # pycode style Error 63 | "ERA", # commented out code 64 | "F", # pyflakes 65 | "FA", # error message 66 | "FBT", # boolean trap 67 | "FURB", # refurb 68 | "I", # isort 69 | "ICN", # import conventions 70 | "INT", # gettext 71 | "ISC", # String concatenation 72 | "N", # pep8-naming 73 | "PERF", # perflint 74 | "PIE", # pie 75 | "PL", # pylint 76 | "PT", # pytest style 77 | "PTH", # use pathlib 78 | "Q", # Quotes 79 | "RET", # return 80 | "RSE", # raise 81 | "RUF", # ruff 82 | "S", # bandit 83 | "SIM", # simplify 84 | "SLF", # Self 85 | "T10", # debugger 86 | "T20", # print 87 | "TCH", # type checking 88 | "TD", # todos 89 | "TID", # tidy imports 90 | "TRY", # tryceratops 91 | "UP", # pyupgrade 92 | "W", # pycode style Warning 93 | ] 94 | 95 | ignore = [ 96 | "ANN101", # missing self 97 | "ANN401", # allow Any 98 | "COM812", # allow missing commas on last element 99 | "ISC001", # recommended by format 100 | ] 101 | 102 | 103 | [tool.ruff.lint.per-file-ignores] 104 | "tests/*" = [ 105 | "ANN", # type annotations 106 | "S101", # use assert 107 | "PLR2004", # magic numbers in tests 108 | "SLF001", # allow private methods in tests 109 | ] 110 | 111 | "noxfile.py" = [ 112 | "ANN", # type annotations 113 | ] 114 | 115 | [tool.ruff.lint.pydocstyle] 116 | convention = "google" 117 | -------------------------------------------------------------------------------- /src/reportseff/__init__.py: 
"""Tabular efficiency with reportseff."""

try:
    from importlib.metadata import PackageNotFoundError, version  # type: ignore[import]
except ImportError:  # pragma: no cover
    # Fall back to the importlib-metadata backport declared in pyproject.toml
    # for python < 3.8.  Previously this branch re-imported the stdlib
    # `importlib.metadata`, so the fallback could never succeed where the
    # primary import failed.
    from importlib_metadata import PackageNotFoundError, version  # type: ignore[import]


try:
    # Resolve the installed package version at import time.
    __version__ = version(__name__)
except PackageNotFoundError:  # pragma: no cover
    # Package is not installed (e.g. running from a source checkout).
    __version__ = "unknown"
JobID%>15 aligns job id right with max ' 42 | "width of 15 characters. Generally NAME[[%:][ALIGNMENT][WIDTH[e$]?]]. " 43 | "When an `e` or `$` is present after a width argument, " 44 | "the output will be truncated to the right." 45 | "Prefix with a + to add to the defaults. " 46 | "A single format token will suppress the header line. " 47 | "Wrap in quotes to pass a string literal, " 48 | "otherwise alignment may be misinterpreted.", 49 | ) 50 | @click.option( 51 | "--slurm-format", 52 | default="", 53 | help="Filename pattern passed to sbatch. By default, will handle " 54 | "patterns like slurm_%j.out, %x_%j, or slurm_%A_%a. In particular, the " 55 | "jobid is expected to start with '_'. Setting this to the same entry " 56 | "as used in sbatch will allow parsing slurm outputs like `1234.out`. " 57 | "Array jobs must have %A_%a to properly interface with sacct.", 58 | ) 59 | @click.option( 60 | "--debug", default=False, is_flag=True, help="Print raw db query to stderr" 61 | ) 62 | @click.option( 63 | "-u", 64 | "--user", 65 | default="", 66 | help="Ignore jobs, return all jobs in last week from user", 67 | ) 68 | @click.option( 69 | "--partition", 70 | default="", 71 | help="Only include jobs with the specified partition", 72 | ) 73 | @click.option( 74 | "-M", 75 | "--cluster", 76 | default="", 77 | help="Select specific cluster, for multi-cluster system only", 78 | ) 79 | @click.option( 80 | "--extra-args", 81 | default="", 82 | help="Extra arguments to forward to sacct", 83 | ) 84 | @click.option( 85 | "-s", "--state", default="", help="Only include jobs with the specified states" 86 | ) 87 | @click.option( 88 | "-S", "--not-state", default="", help="Include jobs without the specified states" 89 | ) 90 | @click.option( 91 | "--since", 92 | default="", 93 | help="Only include jobs after this time. Can be valid sacct " 94 | "or as a comma separated list of time deltas, e.g. d=2,h=1 " 95 | "means 2 days, 1 hour before current time. 
Weeks, days, " 96 | "hours, and minutes can use case-insensitive abbreviations. " 97 | "Minutes is the minimum resolution, while weeks is the coarsest.", 98 | ) 99 | @click.option( 100 | "--until", 101 | default="", 102 | help="Only include jobs before this time. Can be valid sacct " 103 | "or as a comma separated list of time deltas, e.g. d=2,h=1 " 104 | "means 2 days, 1 hour before current time. Weeks, days, " 105 | "hours, and minutes can use case-insensitive abbreviations. " 106 | "Minutes is the minimum resolution, while weeks is the coarsest.", 107 | ) 108 | @click.option( 109 | "--node/--no-node", 110 | "-n/-N", 111 | default=False, 112 | help="Report node-level statistics. Adds `jobid` to format for proper display.", 113 | ) 114 | @click.option( 115 | "--node-and-gpu/--no-node-gpu", 116 | "-g/-G", 117 | default=False, 118 | help=( 119 | "Report each GPU for each node. " 120 | "Sets `node` and adds `GPU` to format automatically." 121 | ), 122 | ) 123 | @click.option( 124 | "--parsable", 125 | "-p", 126 | is_flag=True, 127 | default=False, 128 | help="Output will be delmited without a delimiter at the end. " 129 | "Delimiter is by default '|', to change it see --delimiter flag.", 130 | ) 131 | @click.option( 132 | "--delimiter", 133 | "-d", 134 | default="|", 135 | help="Delimiter used for parsable output. The default default " 136 | "delimiter is '|' when --parsable is specified. 
" 137 | "This option is ignored if --parsable or -p is not specified.", 138 | ) 139 | @click.version_option(version=__version__) 140 | @click.argument("jobs", nargs=-1) 141 | def main(**kwargs: Any) -> None: 142 | """Main entry point for reportseff.""" 143 | args = ReportseffParameters(**kwargs) 144 | 145 | output, entries = get_jobs(args) 146 | 147 | if entries > MAX_ENTRIES_TO_ECHO: 148 | click.echo_via_pager(output, color=args.color) 149 | else: 150 | click.echo(output, color=args.color) 151 | 152 | 153 | def get_jobs(args: ReportseffParameters) -> tuple[str, int]: 154 | """Helper method to get jobs from db_inquirer. 155 | 156 | Returns: 157 | The string to display, tabulated and colored 158 | The number of jobs found to use paging properly 159 | 160 | Raises: 161 | Exception: if there is an error processing entries 162 | """ 163 | job_collection = JobCollection() 164 | 165 | if args.slurm_format: 166 | job_collection.set_custom_seff_format(args.slurm_format) 167 | 168 | inquirer, renderer = get_implementation( 169 | args.format_str, 170 | node=args.node, 171 | node_and_gpu=args.node_and_gpu, 172 | parsable=args.parsable, 173 | delimiter=args.delimiter, 174 | ) 175 | 176 | inquirer.set_state(args.state) 177 | inquirer.set_not_state(args.not_state) 178 | 179 | inquirer.set_since(args.since) 180 | inquirer.set_until(args.until) 181 | 182 | inquirer.set_partition(args.partition) 183 | inquirer.set_cluster(args.cluster) 184 | 185 | inquirer.set_extra_args(args.extra_args) 186 | 187 | add_jobs = False 188 | 189 | try: 190 | if args.user: 191 | inquirer.set_user(args.user) 192 | add_jobs = True 193 | elif inquirer.has_since() and not args.jobs: # since is set 194 | inquirer.all_users() 195 | add_jobs = True 196 | else: 197 | job_collection.set_jobs(args.jobs) 198 | 199 | except ValueError as error: 200 | click.secho(str(error), fg="red", err=True) 201 | sys.exit(1) 202 | 203 | job_collection.set_partition_limits(inquirer.get_partition_timelimits()) 204 | db_output = 
get_db_output( 205 | inquirer, 206 | renderer, 207 | job_collection, 208 | debug=args.debug, 209 | ) 210 | entry = None 211 | try: 212 | for entry in db_output: 213 | job_collection.process_entry(entry, add_job=add_jobs) 214 | except Exception: 215 | click.echo(f"Error processing entry: {entry}", err=True) 216 | raise 217 | 218 | found_jobs = job_collection.get_sorted_jobs(change_sort=args.modified_sort) 219 | found_jobs = [j for j in found_jobs if j.state] 220 | 221 | return renderer.format_jobs(found_jobs), len(found_jobs) 222 | 223 | 224 | def get_implementation( 225 | format_str: str, 226 | *, 227 | node: bool = False, 228 | node_and_gpu: bool = False, 229 | parsable: bool = False, 230 | delimiter: str = " ", 231 | ) -> tuple[BaseInquirer, OutputRenderer]: 232 | """Get system-specific objects. 233 | 234 | Args: 235 | format_str: the formatting options specified by user 236 | node: control if node-level stats are displayed 237 | node_and_gpu: control if node and gpu stats are displayed 238 | parsable: produce output with a delimiter separating columns 239 | delimiter: delimiter used for parsable output 240 | 241 | Returns: 242 | A db_inqurirer 243 | An output renderer 244 | """ 245 | if which("sacct") is not None: 246 | inquirer = SacctInquirer() 247 | renderer = OutputRenderer( 248 | inquirer.get_valid_formats(), 249 | RenderOptions( 250 | node=node or node_and_gpu, 251 | gpu=node_and_gpu, 252 | parsable=parsable, 253 | delimiter=delimiter, 254 | ), 255 | format_str, 256 | ) 257 | else: 258 | click.secho("No supported scheduling systems found!", fg="red", err=True) 259 | sys.exit(1) 260 | 261 | return inquirer, renderer 262 | 263 | 264 | def get_db_output( 265 | inquirer: BaseInquirer, 266 | renderer: OutputRenderer, 267 | job_collection: JobCollection, 268 | *, 269 | debug: bool, 270 | ) -> list[dict[str, str]]: 271 | """Get output from inquirer. 
272 | 273 | Returns: 274 | The db inquirer entries for the provided objects 275 | """ 276 | 277 | def print_debug(info: str) -> None: 278 | click.echo(info, err=True) 279 | 280 | debug_cmd = None 281 | if debug: 282 | debug_cmd = print_debug 283 | 284 | try: 285 | result = inquirer.get_db_output( 286 | renderer.query_columns, job_collection.get_jobs(), debug_cmd 287 | ) 288 | except RuntimeError as error: 289 | click.secho(str(error), fg="red", err=True) 290 | sys.exit(1) 291 | 292 | return result 293 | -------------------------------------------------------------------------------- /src/reportseff/db_inquirer.py: -------------------------------------------------------------------------------- 1 | """Abstract and concrete implementations of scheduler databases.""" 2 | 3 | from __future__ import annotations 4 | 5 | import datetime 6 | import re 7 | import shlex 8 | import subprocess 9 | from abc import ABC, abstractmethod 10 | from typing import Callable 11 | 12 | import click 13 | 14 | 15 | class BaseInquirer(ABC): 16 | """Abstract interface for inquiring different schedulers.""" 17 | 18 | @abstractmethod 19 | def __init__(self) -> None: 20 | """Initialize a new inquirer.""" 21 | 22 | @abstractmethod 23 | def get_valid_formats(self) -> list[str]: 24 | """Get the valid formatting options supported by the inquirer. 25 | 26 | Returns: 27 | List of valid format options 28 | """ 29 | 30 | @abstractmethod 31 | def set_sacct_args(self, jobs: list[str]) -> list[str]: 32 | """Set arguments of sacct query. 33 | 34 | Args: 35 | jobs: list of job names 36 | 37 | Returns: 38 | String of sacct arguments 39 | 40 | Raises: 41 | RuntimeError: if sacct doesn't return properly 42 | """ 43 | 44 | @abstractmethod 45 | def get_db_output( 46 | self, 47 | columns: list[str], 48 | jobs: list[str], 49 | debug_cmd: Callable | None, 50 | ) -> list[dict[str, str]]: 51 | """Query the database with the supplied columns. 
52 | 53 | Args: 54 | columns: validated format names as strings 55 | jobs: list of job names 56 | debug_cmd: If specified, the raw output will passed to this function 57 | 58 | Returns: 59 | List of rows, where each row is a dictionary 60 | with the columns as keys and entries as values 61 | Output order is not garunteed to match the jobs list 62 | 63 | """ 64 | 65 | @abstractmethod 66 | def set_user(self, user: str) -> None: 67 | """Set the collection of jobs based on the provided user. 68 | 69 | Args: 70 | user: user name 71 | """ 72 | 73 | @abstractmethod 74 | def set_partition(self, partition: str) -> None: 75 | """Set the collection of jobs based on the provided partition. 76 | 77 | Args: 78 | partition: partition name 79 | """ 80 | 81 | @abstractmethod 82 | def set_cluster(self, cluster: str) -> None: 83 | """Set the collection of jobs based on the provided cluster. 84 | 85 | Args: 86 | cluster: cluster name 87 | """ 88 | 89 | @abstractmethod 90 | def set_extra_args(self, extra_args: str) -> None: 91 | """Set extra arguments to be forwarded to sacct. 92 | 93 | Args: 94 | extra_args: list of arguments 95 | """ 96 | 97 | @abstractmethod 98 | def all_users(self) -> None: 99 | """Ignore provided jobs, query for all users.""" 100 | 101 | @abstractmethod 102 | def set_state(self, state: str) -> None: 103 | """Set the state to include output jobs. 104 | 105 | Args: 106 | state: comma separated list of state names or codes 107 | """ 108 | 109 | @abstractmethod 110 | def set_not_state(self, state: str) -> None: 111 | """Set the state to exclude from output jobs. 112 | 113 | Args: 114 | state: comma separated list of state names or codes 115 | """ 116 | 117 | @abstractmethod 118 | def parse_date(self, d: str) -> str: 119 | """Parse and convert custom string date format. 120 | 121 | Args: 122 | d: the string of date. 
123 | 124 | Returns: 125 | converted string of date 126 | """ 127 | 128 | @abstractmethod 129 | def set_until(self, until: str) -> None: 130 | """Set the filter for time of jobs to consider. 131 | 132 | Args: 133 | until: the string for filtering. If specified as time=amount 134 | will subtract that amount from the current time 135 | """ 136 | 137 | @abstractmethod 138 | def set_since(self, since: str) -> None: 139 | """Set the filter for time of jobs to consider. 140 | 141 | Args: 142 | since: the string for filtering. If specified as time=amount 143 | will subtract that amount from the current time 144 | """ 145 | 146 | @abstractmethod 147 | def has_since(self) -> bool: 148 | """Tests if `since` has been set. 149 | 150 | Returns: 151 | True if set_since has been called on this inquirer 152 | """ 153 | 154 | @abstractmethod 155 | def get_partition_timelimits(self) -> dict: 156 | """Get partition time limits. 157 | 158 | Returns: 159 | dict mapping partition names to maximum timelimits. 160 | """ 161 | 162 | 163 | class SacctInquirer(BaseInquirer): 164 | """Implementation of BaseInquirer for the sacct slurm function.""" 165 | 166 | def __init__(self) -> None: 167 | """Initialize a new inquirer.""" 168 | self.default_args = "sacct --parsable -n --delimiter=^|^".split() 169 | self.user: str | None = None 170 | self.state: set | None = None 171 | self.not_state: set | None = None 172 | self.since: str | None = None 173 | self.until: str | None = None 174 | self.query_all_users: bool = False 175 | self.partition: str | None = None 176 | self.cluster: str | None = None 177 | self.extra_args: str | None = None 178 | 179 | def get_valid_formats(self) -> list[str]: 180 | """Get the valid formatting options supported by the inquirer. 
def set_sacct_args(self, jobs: list[str]) -> list[str]:
    """Build the argument list for an sacct query from the current settings.

    Args:
        jobs: job ids to request when neither a user nor all-users query
            is active

    Returns:
        List of sacct command-line arguments.
    """
    args = []
    if self.user:
        # Default to the last week of jobs when no explicit start was given.
        if not self.since:
            week_ago = datetime.date.today() - datetime.timedelta(days=7)
            self.since = week_ago.strftime("%m%d%y")  # MMDDYY
        args.append(f"--user={self.user}")
    elif self.query_all_users:
        args.append("--allusers")
    else:
        args.append("--jobs=" + ",".join(jobs))

    # Optional filters, emitted only when set, in sacct's expected order.
    optional_flags = (
        ("--starttime", self.since),
        ("--partition", self.partition),
        ("--cluster", self.cluster),
        ("--endtime", self.until),
    )
    args.extend(f"{flag}={value}" for flag, value in optional_flags if value)

    if self.extra_args:
        # Forward verbatim user-supplied arguments, split shell-style.
        args.extend(shlex.split(self.extra_args))
    return args
242 | 243 | Args: 244 | columns: validated format names as strings 245 | jobs: list of job names 246 | debug_cmd: If specified, the raw output will passed to this function 247 | 248 | Returns: 249 | List of rows, where each row is a dictionary 250 | with the columns as keys and entries as values 251 | Output order is not guaranteed to match the jobs list 252 | 253 | Raises: 254 | RuntimeError: if sacct doesn't return properly 255 | """ 256 | args = [*self.default_args, "--format=" + ",".join(columns)] 257 | args += self.set_sacct_args(jobs) 258 | try: 259 | cmd_result = subprocess.run( 260 | args=args, 261 | stdout=subprocess.PIPE, 262 | encoding="utf8", 263 | check=True, 264 | text=True, 265 | shell=False, 266 | ) 267 | cmd_result.check_returncode() 268 | 269 | except subprocess.CalledProcessError as error: 270 | msg = f"Error running sacct!\n{error.stderr}" 271 | raise RuntimeError(msg) from error 272 | 273 | sacct_line_split = re.compile(r"\^\|\^\n") 274 | # convert newlines to printable \n 275 | lines = [ 276 | line.replace("\n", "\\n") 277 | for line in sacct_line_split.split(cmd_result.stdout) 278 | ] 279 | if debug_cmd is not None: 280 | debug_cmd("\n".join(line.replace("\n", "\\n") for line in lines)) 281 | 282 | sacct_split = re.compile(r"\^\|\^") 283 | result = [dict(zip(columns, sacct_split.split(line))) for line in lines if line] 284 | 285 | # Sometimes the main job has a different state than the sub jobs 286 | # e.g. timeouts have a state of canceled for the batch jobs. 287 | # When state filtering is active, need to filter main ids, then retain 288 | # only the jobs with matching job ids 289 | if self.state or self.not_state: 290 | main_jobs = [r for r in result if "." 
not in r["JobID"]] 291 | if self.state: 292 | # split to get first word in entries like "CANCELLED BY X" 293 | main_jobs = [ 294 | r for r in main_jobs if r["State"].split()[0] in self.state 295 | ] 296 | 297 | if self.not_state: 298 | # split to get first word in entries like "CANCELLED BY X" 299 | main_jobs = [ 300 | r for r in main_jobs if r["State"].split()[0] not in self.not_state 301 | ] 302 | 303 | main_job_ids = {r["JobID"] for r in main_jobs} 304 | result = [r for r in result if r["JobID"].split(".")[0] in main_job_ids] 305 | 306 | return result 307 | 308 | def set_user(self, user: str) -> None: 309 | """Set the collection of jobs based on the provided user. 310 | 311 | Args: 312 | user: user name 313 | """ 314 | self.user = user 315 | 316 | def set_partition(self, partition: str) -> None: 317 | """Set the collection of jobs based on the provided partition. 318 | 319 | Args: 320 | partition: partition name 321 | """ 322 | self.partition = partition 323 | 324 | def set_cluster(self, cluster: str) -> None: 325 | """Set the specific cluster in multi-cluster environment. 326 | 327 | Args: 328 | cluster: cluster name 329 | """ 330 | self.cluster = cluster 331 | 332 | def set_extra_args(self, extra_args: str) -> None: 333 | """Set extra arguments to be forwarded to sacct. 334 | 335 | Args: 336 | extra_args: list of arguments 337 | """ 338 | self.extra_args = extra_args 339 | 340 | def all_users(self) -> None: 341 | """Query for all users if `since` is set.""" 342 | self.query_all_users = True 343 | 344 | def set_state(self, state: str) -> None: 345 | """Set the state to include output jobs. 
def parse_date(self, d: str) -> str:
    """Parse and convert custom string date format.

    Args:
        d: comma separated list of time deltas, e.g. ``d=2,h=1`` meaning
            2 days and 1 hour before the current time.  Accepted units are
            weeks, days, hours, and minutes, with case-insensitive
            single-letter abbreviations.  Malformed or unknown entries
            are silently ignored.

    Returns:
        The resulting absolute time as a string formatted for sacct,
        ``YYYY-MM-DDTHH:MM``.
    """
    # Lowercase first so a single-case table covers both abbreviations.
    abbrev_to_key = {
        "w": "weeks",
        "d": "days",
        "h": "hours",
        "m": "minutes",
    }
    valid_args = ("weeks", "days", "hours", "minutes")
    date_args = {}

    for arg in d.split(","):
        if "=" not in arg:
            continue  # skip entries without an amount

        toks = arg.split("=")
        key = toks[0].lower()
        key = abbrev_to_key.get(key, key)

        if key in valid_args:
            try:
                date_args[key] = int(toks[1])
            except ValueError:
                continue  # non-integer amounts are ignored

    date = datetime.datetime.today()
    date -= datetime.timedelta(**date_args)
    # sacct-compatible timestamp, e.g. 2024-01-31T13:45
    return date.strftime("%Y-%m-%dT%H:%M")
422 | 423 | Args: 424 | until: the string for filtering. If specified as time=amount 425 | will subtract that amount from the current time 426 | """ 427 | if not until: 428 | return 429 | if "=" in until: # handle custom format 430 | self.until = self.parse_date(until) 431 | else: 432 | self.until = until 433 | 434 | def set_since(self, since: str) -> None: 435 | """Set the filter for time of jobs to consider. 436 | 437 | Args: 438 | since: the string for filtering. If specified as time=amount 439 | will subtract that amount from the current time 440 | """ 441 | if not since: 442 | return 443 | if "=" in since: # handle custom format 444 | self.since = self.parse_date(since) 445 | else: 446 | self.since = since 447 | 448 | def has_since(self) -> bool: 449 | """Check if since has been set. 450 | 451 | Returns: 452 | True if since has been set properly 453 | """ 454 | return bool(self.since) 455 | 456 | def get_partition_timelimits(self) -> dict: 457 | """Get partition time limits. 458 | 459 | Returns: 460 | dict mapping partition names to maximum timelimits. 461 | 462 | Raises: 463 | RuntimeError: if scontrol raises an error 464 | """ 465 | args = "" 466 | if self.cluster: 467 | args = f"--cluster {self.cluster}" 468 | 469 | command_args = f"scontrol {args} show partition".split() 470 | cmd_result = subprocess.run( 471 | args=command_args, 472 | stdout=subprocess.PIPE, 473 | encoding="utf8", 474 | check=True, 475 | text=True, 476 | shell=False, 477 | ) 478 | if cmd_result.returncode != 0: 479 | msg = "Error retrieving information from scontrol" 480 | raise RuntimeError(msg) 481 | 482 | partition_name = re.compile(r"^PartitionName=(?P\S+)$") 483 | time_limit = re.compile(r"MaxTime=(?P