├── .editorconfig
├── .github
    ├── ISSUE_TEMPLATE
    │   ├── bug_report.md
    │   ├── config.yml
    │   └── feature_request.md
    ├── PULL_REQUEST_TEMPLATE.md
    └── workflows
    │   ├── ci.yml
    │   └── linter.yml
├── .gitignore
├── .golangci.yml
├── CONTRIBUTING.md
├── LICENSE-3rdparty.csv
├── LICENSE.md
├── Makefile
├── NOTICE
├── README.md
├── doc
    └── documentor.1.scd
├── go.mod
├── go.sum
├── internal
    ├── ai
    │   ├── ai.go
    │   ├── anthropic
    │   │   ├── anthropic.go
    │   │   └── request.go
    │   ├── datadog
    │   │   ├── datadog.go
    │   │   ├── request.go
    │   │   └── transport.go
    │   └── openai
    │   │   ├── openai.go
    │   │   └── request.go
    ├── app
    │   ├── app.go
    │   ├── describe.go
    │   ├── draft.go
    │   └── review.go
    ├── errno
    │   ├── errno.go
    │   └── errno_test.go
    ├── meta
    │   └── meta.go
    ├── prompt
    │   ├── data
    │   │   ├── describe-prompt.txt
    │   │   ├── draft-prompt.txt
    │   │   └── review-prompt.txt
    │   └── prompt.go
    ├── validate
    │   ├── validate.go
    │   └── validate_test.go
    └── xbase64
    │   ├── testdata
    │       └── dot.gif
    │   ├── xbase64.go
    │   └── xbase64_test.go
├── license-3rdparty.tpl
└── main.go


/.editorconfig:
--------------------------------------------------------------------------------
 1 | root = true
 2 | 
 3 | [*]
 4 | charset = utf-8
 5 | end_of_line = lf
 6 | insert_final_newline = true
 7 | trim_trailing_whitespace = true
 8 | max_line_length = 80
 9 | indent_style = space
10 | indent_size = 2
11 | tab_width = 4
12 | 
13 | [.git/config]
14 | indent_style = tab
15 | 
16 | [.git/COMMIT_EDITMSG]
17 | max_line_length = 72
18 | 
19 | [*.md]
20 | max_line_length = 72
21 | trim_trailing_whitespace = false
22 | 
23 | [*.go]
24 | indent_style = tab
25 | indent_size = 4
26 | 
27 | [*.scd]
28 | indent_style = tab
29 | indent_size = 4
30 | 
31 | [go.mod]
32 | indent_style = tab
33 | 
34 | [Makefile]
35 | indent_style = tab
36 | indent_size = 4
37 | 


--------------------------------------------------------------------------------
/.github/ISSUE_TEMPLATE/bug_report.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: "Bug report"
 3 | about: "Create a report to help us improve."
 4 | title: ""
 5 | labels: "bug, needs triage"
 6 | assignees: ""
 7 | ---
 8 | 
 9 | **Describe the bug**
10 | A clear and concise description of the bug.
11 | 
12 | **Environment and versions**
13 | A clear and precise description of your setup.
14 | 
15 | - Version of the client in use.
16 | - Services, libraries, languages and tools list and versions.
17 | 
18 | **To reproduce**
19 | Steps to reproduce the behavior:
20 | 
21 | 1. Go to '...'
22 | 2. Click on '...'
23 | 3. Scroll down to '...'
24 | 4. See the error.
25 | 
26 | **Expected behavior**
27 | A clear and concise description of what you expected to happen.
28 | 
29 | **Screenshots**
30 | If applicable, add screenshots to help explain your problem.
31 | 
32 | **Additional context**
33 | Add any other context about the problem here.
34 | 


--------------------------------------------------------------------------------
/.github/ISSUE_TEMPLATE/config.yml:
--------------------------------------------------------------------------------
1 | blank_issues_enabled: false
2 | 


--------------------------------------------------------------------------------
/.github/ISSUE_TEMPLATE/feature_request.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: "Feature request"
 3 | about: "Suggest an idea for this project."
 4 | title: ""
 5 | labels: "enhancement, needs triage"
 6 | assignees: ""
 7 | ---
 8 | 
 9 | **Is your feature request related to a problem? Please describe.**
10 | A clear and concise description of what the problem is.
11 | 
12 | **Describe the solution you'd like**
13 | A clear and concise description of what you want to happen.
14 | 
15 | **Describe alternatives you've considered**
16 | A clear and concise description of any alternative solutions or features you've considered.
17 | 
18 | **Additional context**
19 | Add any other context or screenshots about the feature request here.
20 | 


--------------------------------------------------------------------------------
/.github/PULL_REQUEST_TEMPLATE.md:
--------------------------------------------------------------------------------
 1 | <!--
 2 | **Requirements for Contributing to this repository**
 3 | 
 4 | Fill out the template below. Any pull request that does not include enough information to be reviewed in a timely manner may be closed at the maintainers' discretion.
 5 | 
 6 | For more details, please see [CONTRIBUTING.md](../CONTRIBUTING.md).
 7 | -->
 8 | 
 9 | ### What does this PR do?
10 | 
11 | <!--
12 | 
13 | What inspired you to submit this pull request? Link to the issue describing the bug that you're fixing.
14 | 
15 | If there is not yet an issue for your bug, please open a new issue and then link to that issue in your pull request.
16 | 
17 | If the pull request does not address an existing issue with the "bug" label, the maintainers have the final say on whether the current behavior is a bug.
18 | 
19 | We must be able to understand the design of your change from this description. If we can't get a good idea of what the code will be doing from the description here, the pull request may be closed at the maintainers' discretion.
20 | 
21 | Keep in mind that the maintainer reviewing this PR may not be familiar with or have worked with the code here recently, so please walk us through the concepts.
22 | 
23 | -->
24 | 
25 | ### Additional Notes
26 | 
27 | <!-- Anything else we should know when reviewing? -->
28 | 
29 | ### Review checklist
30 | 
31 | Please check relevant items below:
32 | 
33 | - [ ] The title & description contain a short meaningful summary of work completed.
34 | - [ ] Tests have been updated/created and are passing locally.
35 | - [ ] I've reviewed the [CONTRIBUTING.md](/CONTRIBUTING.md) file.
36 | 


--------------------------------------------------------------------------------
/.github/workflows/ci.yml:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: 'Tests'
 3 | on:
 4 |   push:
 5 |     branches:
 6 |       - 'trunk'
 7 |     paths-ignore:
 8 |       - '.editorconfig'
 9 |       - '.gitignore'
10 |       - '.golangci.yml'
11 |       - 'CONTRIBUTING.md'
12 |       - 'LICENSE-3rdparty.csv'
13 |       - 'LICENSE.md'
14 |       - 'NOTICE'
15 |       - 'README.md'
16 |       - 'license-3rdparty.tpl'
17 |   pull_request:
18 |     branches:
19 |       - 'trunk'
20 |     paths-ignore:
21 |       - '.editorconfig'
22 |       - '.gitignore'
23 |       - '.golangci.yml'
24 |       - 'CONTRIBUTING.md'
25 |       - 'LICENSE-3rdparty.csv'
26 |       - 'LICENSE.md'
27 |       - 'NOTICE'
28 |       - 'README.md'
29 |       - 'license-3rdparty.tpl'
30 | 
31 | jobs:
32 |   test:
33 |     runs-on: 'ubuntu-latest'
34 |     name: 'Tests'
35 |     steps:
36 |       - uses: 'actions/checkout@v4'
37 | 
38 |       - name: 'Setup Go environment'
39 |         uses: 'actions/setup-go@v4'
40 |         with:
41 |           go-version: '1.24.x'
42 | 
43 |       - name: 'Run tests'
44 |         run: 'make test'
45 | 
46 |       - name: 'Run build'
47 |         run: 'make build'
48 | 


--------------------------------------------------------------------------------
/.github/workflows/linter.yml:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: 'Lint'
 3 | on:
 4 |   push:
 5 |     branches:
 6 |       - 'trunk'
 7 |     paths-ignore:
 8 |       - '.editorconfig'
 9 |       - '.gitignore'
10 |       - 'CONTRIBUTING.md'
11 |       - 'LICENSE-3rdparty.csv'
12 |       - 'LICENSE.md'
13 |       - 'NOTICE'
14 |       - 'README.md'
15 |       - 'license-3rdparty.tpl'
16 |   pull_request:
17 |     branches:
18 |       - 'trunk'
19 |     paths-ignore:
20 |       - '.editorconfig'
21 |       - '.gitignore'
22 |       - 'CONTRIBUTING.md'
23 |       - 'LICENSE-3rdparty.csv'
24 |       - 'LICENSE.md'
25 |       - 'NOTICE'
26 |       - 'README.md'
27 |       - 'license-3rdparty.tpl'
28 | 
29 | permissions:
30 |   contents: 'read'
31 | 
32 | jobs:
33 |   go:
34 |     name: 'Lint Go files'
35 |     runs-on: 'ubuntu-latest'
36 |     steps:
37 |       - uses: 'actions/checkout@v4'
38 | 
39 |       - name: 'Setup Go environment'
40 |         uses: 'actions/setup-go@v4'
41 |         with:
42 |           go-version: '1.24.x'
43 | 
44 |       - name: 'Run govulncheck'
45 |         run: 'make vulnerabilities'
46 | 
47 |       - name: 'Run gofumpt'
48 |         run: 'make fmt'
49 | 
50 |       - name: 'Run golangci-lint'
51 |         run: 'make lint'
52 | 


--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
 1 | # Directories and files that may be generated by tooling or your OS.
 2 | .idea
 3 | documentor
 4 | documentor.1
 5 | 
 6 | # Temporary directory that holds temporary files, reading materials, and other
 7 | # things you don't want in the remote repository.
 8 | .tmp
 9 | 
10 | # https://i.cpimg.sh/r6BsGDijfFyl.png
11 | .DS_Store
12 | 


--------------------------------------------------------------------------------
/.golangci.yml:
--------------------------------------------------------------------------------
  1 | linters:
  2 |   disable-all: true
  3 |   enable:
  4 |     - asasalint
  5 |     - asciicheck
  6 |     - bidichk
  7 |     - bodyclose
  8 |     - canonicalheader
  9 |     - containedctx
 10 |     - contextcheck
 11 |     - copyloopvar
 12 |     - decorder
 13 |     - dogsled
 14 |     - durationcheck
 15 |     - err113
 16 |     - errcheck
 17 |     - errchkjson
 18 |     - errname
 19 |     - errorlint
 20 |     - exhaustive
 21 |     - fatcontext
 22 |     - forcetypeassert
 23 |     - gci
 24 |     - gocheckcompilerdirectives
 25 |     - gochecknoglobals
 26 |     - gochecknoinits
 27 |     - gochecksumtype
 28 |     - gocognit
 29 |     - goconst
 30 |     - gocritic
 31 |     - gocyclo
 32 |     - godot
 33 |     - godox
 34 |     - gofumpt
 35 |     - goimports
 36 |     - goprintffuncname
 37 |     - gosec
 38 |     - gosimple
 39 |     - gosmopolitan
 40 |     - govet
 41 |     - inamedparam
 42 |     - ineffassign
 43 |     - interfacebloat
 44 |     - intrange
 45 |     - ireturn
 46 |     - maintidx
 47 |     - makezero
 48 |     - mirror
 49 |     - misspell
 50 |     - musttag
 51 |     - nestif
 52 |     - nilerr
 53 |     - nilnil
 54 |     - noctx
 55 |     - nolintlint
 56 |     - nonamedreturns
 57 |     - nosprintfhostport
 58 |     - paralleltest
 59 |     - perfsprint
 60 |     - prealloc
 61 |     - predeclared
 62 |     - reassign
 63 |     - revive
 64 |     - rowserrcheck
 65 |     - sloglint
 66 |     - sqlclosecheck
 67 |     - staticcheck
 68 |     - stylecheck
 69 |     - testableexamples
 70 |     - testpackage
 71 |     - thelper
 72 |     - tparallel
 73 |     - typecheck
 74 |     - unconvert
 75 |     - unparam
 76 |     - unused
 77 |     - usestdlibvars
 78 |     - wastedassign
 79 |     - wrapcheck
 80 |     - wsl
 81 | 
 82 | linters-settings:
 83 |   decorder:
 84 |     dec-order:
 85 |       - const
 86 |       - var
 87 |       - type
 88 |       - func
 89 |   errcheck:
 90 |     check-type-assertions: true
 91 |     check-blank: true
 92 |     excluded-functions:
 93 |       - encoding/json.Marshal
 94 |       - encoding/json.MarshalIndent
 95 |   errchkjson:
 96 |     check-error-free-encoding: true
 97 |   gocritic:
 98 |     enabled-tags:
 99 |       - diagnostic
100 |       - experimental
101 |       - style
102 |       - performance
103 |       - opinionated
104 |   gofumpt:
105 |     extra-rules: true
106 |   gosimple:
107 |     checks: ["all"]
108 |   govet:
109 |     enable-all: true
110 |     settings:
111 |       shadow:
112 |         strict: true
113 |   makezero:
114 |     always: true
115 |   misspell:
116 |     locale: US
117 |   nolintlint:
118 |     require-explanation: true
119 |     require-specific: true
120 |   prealloc:
121 |     simple: false
122 |     for-loops: true
123 |   revive:
124 |     rules:
125 |       - name: argument-limit
126 |       - name: atomic
127 |       - name: bare-return
128 |       - name: blank-imports
129 |       - name: bool-literal-in-expr
130 |       - name: call-to-gc
131 |       - name: comment-spacings
132 |       - name: confusing-naming
133 |       - name: confusing-results
134 |       - name: constant-logical-expr
135 |       - name: context-as-argument
136 |       - name: context-keys-type
137 |       - name: datarace
138 |       - name: deep-exit
139 |       - name: defer
140 |       - name: dot-imports
141 |       - name: duplicated-imports
142 |       - name: early-return
143 |       - name: empty-block
144 |       - name: empty-lines
145 |       - name: enforce-map-style
146 |         arguments:
147 |           - "make"
148 |       - name: enforce-slice-style
149 |         arguments:
150 |           - "make"
151 |       - name: error-naming
152 |       - name: error-return
153 |       - name: error-strings
154 |       - name: errorf
155 |       - name: exported
156 |       - name: flag-parameter
157 |       - name: function-result-limit
158 |       - name: get-return
159 |       - name: identical-branches
160 |       - name: if-return
161 |       - name: import-shadowing
162 |       - name: increment-decrement
163 |       - name: indent-error-flow
164 |       - name: modifies-parameter
165 |       - name: modifies-value-receiver
166 |       - name: nested-structs
167 |       - name: optimize-operands-order
168 |       - name: package-comments
169 |       - name: range
170 |       - name: range-val-address
171 |       - name: range-val-in-closure
172 |       - name: receiver-naming
173 |       - name: redefines-builtin-id
174 |       - name: redundant-import-alias
175 |       - name: string-of-int
176 |       - name: struct-tag
177 |       - name: superfluous-else
178 |       - name: time-equal
179 |       - name: time-naming
180 |       - name: unchecked-type-assertion
181 |       - name: unconditional-recursion
182 |       - name: unexported-naming
183 |       - name: unexported-return
184 |       - name: unnecessary-stmt
185 |       - name: unreachable-code
186 |       - name: unused-parameter
187 |       - name: unused-receiver
188 |       - name: use-any
189 |       - name: useless-break
190 |       - name: var-declaration
191 |       - name: var-naming
192 |       - name: waitgroup-by-value
193 |   sloglint:
194 |     kv-only: true
195 |     no-global: "default"
196 |     args-on-sep-lines: true
197 |   staticcheck:
198 |     checks: ["all"]
199 |   stylecheck:
200 |     checks: ["all"]
201 |   usestdlibvars:
202 |     time-month: true
203 |     time-layout: true
204 |     crypto-hash: true
205 |     sql-isolation-level: true
206 |     tls-signature-scheme: true
207 |     constant-kind: true
208 |   unparam:
209 |     check-exported: true
210 | 
211 | issues:
212 |   max-issues-per-linter: 0
213 |   max-same-issues: 0
214 |   exclude-rules:
215 |     - path: _test\.go
216 |       linters:
217 |         - containedctx
218 |         - gochecknoglobals
219 |         - nilerr
220 |         - wrapcheck
221 |     - path: _test\.go
222 |       text: "fieldalignment"
223 | 


--------------------------------------------------------------------------------
/CONTRIBUTING.md:
--------------------------------------------------------------------------------
 1 | # Contribution guidelines
 2 | 
 3 | Thank you for your interest in improving `documentor`! Follow these
 4 | guidelines to contribute effectively and get your patches accepted.
 5 | 
 6 | ## Commit sign-off
 7 | 
 8 | Remember to sign-off on your commits by running `git commit --signoff`
 9 | before pushing. To understand what this means, read the [Linux Kernel
10 | Developer's Certificate of
11 | Origin](https://www.kernel.org/doc/html/latest/process/submitting-patches.html#sign-your-work-the-developer-s-certificate-of-origin).
12 | 
13 | ## Submission guidelines
14 | 
15 | Adhere to the following rules when submitting your PR:
16 | 
17 | - **Keep it small**: Avoid changing too many things at once.
18 | - **Individual PRs**: One PR per issue, please.
19 | - **Commit messages**: Write meaningful, clear commit messages.
20 | - **Quality assurance**: [Review your spelling and
21 |   grammar](https://languagetool.org/) before submission.
22 | - **Testing**: Write tests. Ensure your changes do not break any
23 |   existing functionality by running `make test`.
24 | - **Respect the coding style**: Ensure your contributions maintain the
25 |   codebase’s style.
26 | 
27 | ## License
28 | 
29 | All contributions are made under the [Apache-2.0 license](LICENSE.md).
30 | 


--------------------------------------------------------------------------------
/LICENSE-3rdparty.csv:
--------------------------------------------------------------------------------
1 | Origin,License,"License URL",Copyright
2 | git.sr.ht/~jamesponddotco/xstd-go,MIT,https://git.sr.ht/~jamesponddotco/xstd-go/tree/v0.8.0/LICENSE.md,2023 James Pond
3 | github.com/cpuguy83/go-md2man/v2/md2man,MIT,https://github.com/cpuguy83/go-md2man/blob/v2.0.4/LICENSE.md,2014 Brian Goff
4 | github.com/liushuangls/go-anthropic/v2,Apache-2.0,https://github.com/liushuangls/go-anthropic/blob/v2.4.0/LICENSE,2024 Liu Shuang
5 | github.com/russross/blackfriday/v2,BSD-2-Clause,https://github.com/russross/blackfriday/blob/v2.1.0/LICENSE.txt,2011 Russ Ross
6 | github.com/sashabaranov/go-openai,Apache-2.0,https://github.com/sashabaranov/go-openai/blob/v1.27.0/LICENSE,2020 Alex Baranov
7 | github.com/urfave/cli/v2,MIT,https://github.com/urfave/cli/blob/v2.27.2/LICENSE,2023 urfave/cli maintainers
8 | github.com/xrash/smetrics,MIT,https://github.com/xrash/smetrics/blob/5f08fbb34913/LICENSE,2016 Felipe da Cunha Gonçalves
9 | 


--------------------------------------------------------------------------------
/LICENSE.md:
--------------------------------------------------------------------------------
  1 |                               Apache License
  2 |                         Version 2.0, January 2004
  3 |                      http://www.apache.org/licenses/
  4 | 
  5 | TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
  6 | 
  7 | 1. Definitions.
  8 | 
  9 |    "License" shall mean the terms and conditions for use, reproduction,
 10 |    and distribution as defined by Sections 1 through 9 of this document.
 11 | 
 12 |    "Licensor" shall mean the copyright owner or entity authorized by
 13 |    the copyright owner that is granting the License.
 14 | 
 15 |    "Legal Entity" shall mean the union of the acting entity and all
 16 |    other entities that control, are controlled by, or are under common
 17 |    control with that entity. For the purposes of this definition,
 18 |    "control" means (i) the power, direct or indirect, to cause the
 19 |    direction or management of such entity, whether by contract or
 20 |    otherwise, or (ii) ownership of fifty percent (50%) or more of the
 21 |    outstanding shares, or (iii) beneficial ownership of such entity.
 22 | 
 23 |    "You" (or "Your") shall mean an individual or Legal Entity
 24 |    exercising permissions granted by this License.
 25 | 
 26 |    "Source" form shall mean the preferred form for making modifications,
 27 |    including but not limited to software source code, documentation
 28 |    source, and configuration files.
 29 | 
 30 |    "Object" form shall mean any form resulting from mechanical
 31 |    transformation or translation of a Source form, including but
 32 |    not limited to compiled object code, generated documentation,
 33 |    and conversions to other media types.
 34 | 
 35 |    "Work" shall mean the work of authorship, whether in Source or
 36 |    Object form, made available under the License, as indicated by a
 37 |    copyright notice that is included in or attached to the work
 38 |    (an example is provided in the Appendix below).
 39 | 
 40 |    "Derivative Works" shall mean any work, whether in Source or Object
 41 |    form, that is based on (or derived from) the Work and for which the
 42 |    editorial revisions, annotations, elaborations, or other modifications
 43 |    represent, as a whole, an original work of authorship. For the purposes
 44 |    of this License, Derivative Works shall not include works that remain
 45 |    separable from, or merely link (or bind by name) to the interfaces of,
 46 |    the Work and Derivative Works thereof.
 47 | 
 48 |    "Contribution" shall mean any work of authorship, including
 49 |    the original version of the Work and any modifications or additions
 50 |    to that Work or Derivative Works thereof, that is intentionally
 51 |    submitted to Licensor for inclusion in the Work by the copyright owner
 52 |    or by an individual or Legal Entity authorized to submit on behalf of
 53 |    the copyright owner. For the purposes of this definition, "submitted"
 54 |    means any form of electronic, verbal, or written communication sent
 55 |    to the Licensor or its representatives, including but not limited to
 56 |    communication on electronic mailing lists, source code control systems,
 57 |    and issue tracking systems that are managed by, or on behalf of, the
 58 |    Licensor for the purpose of discussing and improving the Work, but
 59 |    excluding communication that is conspicuously marked or otherwise
 60 |    designated in writing by the copyright owner as "Not a Contribution."
 61 | 
 62 |    "Contributor" shall mean Licensor and any individual or Legal Entity
 63 |    on behalf of whom a Contribution has been received by Licensor and
 64 |    subsequently incorporated within the Work.
 65 | 
 66 | 2. Grant of Copyright License. Subject to the terms and conditions of
 67 |    this License, each Contributor hereby grants to You a perpetual,
 68 |    worldwide, non-exclusive, no-charge, royalty-free, irrevocable
 69 |    copyright license to reproduce, prepare Derivative Works of,
 70 |    publicly display, publicly perform, sublicense, and distribute the
 71 |    Work and such Derivative Works in Source or Object form.
 72 | 
 73 | 3. Grant of Patent License. Subject to the terms and conditions of
 74 |    this License, each Contributor hereby grants to You a perpetual,
 75 |    worldwide, non-exclusive, no-charge, royalty-free, irrevocable
 76 |    (except as stated in this section) patent license to make, have made,
 77 |    use, offer to sell, sell, import, and otherwise transfer the Work,
 78 |    where such license applies only to those patent claims licensable
 79 |    by such Contributor that are necessarily infringed by their
 80 |    Contribution(s) alone or by combination of their Contribution(s)
 81 |    with the Work to which such Contribution(s) was submitted. If You
 82 |    institute patent litigation against any entity (including a
 83 |    cross-claim or counterclaim in a lawsuit) alleging that the Work
 84 |    or a Contribution incorporated within the Work constitutes direct
 85 |    or contributory patent infringement, then any patent licenses
 86 |    granted to You under this License for that Work shall terminate
 87 |    as of the date such litigation is filed.
 88 | 
 89 | 4. Redistribution. You may reproduce and distribute copies of the
 90 |    Work or Derivative Works thereof in any medium, with or without
 91 |    modifications, and in Source or Object form, provided that You
 92 |    meet the following conditions:
 93 | 
 94 |    (a) You must give any other recipients of the Work or
 95 |        Derivative Works a copy of this License; and
 96 | 
 97 |    (b) You must cause any modified files to carry prominent notices
 98 |        stating that You changed the files; and
 99 | 
100 |    (c) You must retain, in the Source form of any Derivative Works
101 |        that You distribute, all copyright, patent, trademark, and
102 |        attribution notices from the Source form of the Work,
103 |        excluding those notices that do not pertain to any part of
104 |        the Derivative Works; and
105 | 
106 |    (d) If the Work includes a "NOTICE" text file as part of its
107 |        distribution, then any Derivative Works that You distribute must
108 |        include a readable copy of the attribution notices contained
109 |        within such NOTICE file, excluding those notices that do not
110 |        pertain to any part of the Derivative Works, in at least one
111 |        of the following places: within a NOTICE text file distributed
112 |        as part of the Derivative Works; within the Source form or
113 |        documentation, if provided along with the Derivative Works; or,
114 |        within a display generated by the Derivative Works, if and
115 |        wherever such third-party notices normally appear. The contents
116 |        of the NOTICE file are for informational purposes only and
117 |        do not modify the License. You may add Your own attribution
118 |        notices within Derivative Works that You distribute, alongside
119 |        or as an addendum to the NOTICE text from the Work, provided
120 |        that such additional attribution notices cannot be construed
121 |        as modifying the License.
122 | 
123 |    You may add Your own copyright statement to Your modifications and
124 |    may provide additional or different license terms and conditions
125 |    for use, reproduction, or distribution of Your modifications, or
126 |    for any such Derivative Works as a whole, provided Your use,
127 |    reproduction, and distribution of the Work otherwise complies with
128 |    the conditions stated in this License.
129 | 
130 | 5. Submission of Contributions. Unless You explicitly state otherwise,
131 |    any Contribution intentionally submitted for inclusion in the Work
132 |    by You to the Licensor shall be under the terms and conditions of
133 |    this License, without any additional terms or conditions.
134 |    Notwithstanding the above, nothing herein shall supersede or modify
135 |    the terms of any separate license agreement you may have executed
136 |    with Licensor regarding such Contributions.
137 | 
138 | 6. Trademarks. This License does not grant permission to use the trade
139 |    names, trademarks, service marks, or product names of the Licensor,
140 |    except as required for reasonable and customary use in describing the
141 |    origin of the Work and reproducing the content of the NOTICE file.
142 | 
143 | 7. Disclaimer of Warranty. Unless required by applicable law or
144 |    agreed to in writing, Licensor provides the Work (and each
145 |    Contributor provides its Contributions) on an "AS IS" BASIS,
146 |    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
147 |    implied, including, without limitation, any warranties or conditions
148 |    of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
149 |    PARTICULAR PURPOSE. You are solely responsible for determining the
150 |    appropriateness of using or redistributing the Work and assume any
151 |    risks associated with Your exercise of permissions under this License.
152 | 
153 | 8. Limitation of Liability. In no event and under no legal theory,
154 |    whether in tort (including negligence), contract, or otherwise,
155 |    unless required by applicable law (such as deliberate and grossly
156 |    negligent acts) or agreed to in writing, shall any Contributor be
157 |    liable to You for damages, including any direct, indirect, special,
158 |    incidental, or consequential damages of any character arising as a
159 |    result of this License or out of the use or inability to use the
160 |    Work (including but not limited to damages for loss of goodwill,
161 |    work stoppage, computer failure or malfunction, or any and all
162 |    other commercial damages or losses), even if such Contributor
163 |    has been advised of the possibility of such damages.
164 | 
165 | 9. Accepting Warranty or Additional Liability. While redistributing
166 |    the Work or Derivative Works thereof, You may choose to offer,
167 |    and charge a fee for, acceptance of support, warranty, indemnity,
168 |    or other liability obligations and/or rights consistent with this
169 |    License. However, in accepting such obligations, You may act only
170 |    on Your own behalf and on Your sole responsibility, not on behalf
171 |    of any other Contributor, and only if You agree to indemnify,
172 |    defend, and hold each Contributor harmless for any liability
173 |    incurred by, or claims asserted against, such Contributor by reason
174 |    of your accepting any such warranty or additional liability.
175 | 
176 | END OF TERMS AND CONDITIONS
177 | 


--------------------------------------------------------------------------------
/Makefile:
--------------------------------------------------------------------------------
 1 | .POSIX:
 2 | .SUFFIXES:
 3 | 
 4 | PREFIX=/usr/local
 5 | BINDIR=bin
 6 | MANDIR=share/man
 7 | PKGDIR=./
 8 | 
 9 | GO=go
10 | GIT=git
11 | RM=rm
12 | INSTALL=install
13 | SCDOC=scdoc
14 | 
15 | GOBUILD_OPTS=-trimpath -buildmode=pie -ldflags '-s -w' -mod 'readonly' -modcacherw
16 | 
17 | all: build doc
18 | 
19 | pre-commit: tidy fmt lint vulnerabilities test build clean # Runs all pre-commit checks.
20 | 
21 | commit: pre-commit # Commits the changes to the repository.
22 | 	$(GIT) commit -s
23 | 
24 | push: # Pushes the changes to the repository.
25 | 	$(GIT) push origin trunk
26 | 
27 | build: # Builds an application binary.
28 | 	$(GO) build $(GOBUILD_OPTS) $(PKGDIR)
29 | 
30 | build/linux: # Builds an application binary for Linux.
31 | 	GOOS=linux GOARCH=amd64 $(GO) build $(GOBUILD_OPTS) $(PKGDIR)
32 | 
33 | build/darwin: # Builds an application binary for macOS.
34 | 	GOOS=darwin GOARCH=amd64 $(GO) build $(GOBUILD_OPTS) $(PKGDIR)
35 | 
36 | build/windows: # Builds an application binary for Windows.
37 | 	GOOS=windows GOARCH=amd64 $(GO) build $(GOBUILD_OPTS) $(PKGDIR)
38 | 
39 | doc: # Builds the manpage.
40 | 	$(SCDOC) <doc/documentor.1.scd >documentor.1
41 | 
42 | install: # Installs the release binary.
43 | 	$(INSTALL) -d \
44 | 		$(DESTDIR)$(PREFIX)/$(BINDIR)/ \
45 | 		$(DESTDIR)$(PREFIX)/$(MANDIR)/man1/
46 | 	$(INSTALL) -pm 0755 documentor $(DESTDIR)$(PREFIX)/$(BINDIR)/
47 | 	$(INSTALL) -pm 0644 documentor.1 $(DESTDIR)$(PREFIX)/$(MANDIR)/man1/
48 | 
49 | tidy: # Updates the go.mod file to use the latest versions of all direct and indirect dependencies.
50 | 	$(GO) mod tidy
51 | 
52 | fmt: # Formats Go source files in this repository.
53 | 	$(GO) run mvdan.cc/gofumpt@latest -e -extra -w .
54 | 
55 | lint: # Runs golangci-lint using the config at the root of the repository.
56 | 	$(GO) run github.com/golangci/golangci-lint/cmd/golangci-lint@latest run ./...
57 | 
58 | vulnerabilities: # Analyzes the codebase and looks for vulnerabilities affecting it.
59 | 	$(GO) run golang.org/x/vuln/cmd/govulncheck@latest ./...
60 | 
61 | test: # Runs unit tests.
62 | 	$(GO) test -cover -race -vet all -mod readonly ./...
63 | 
64 | test/coverage: # Generates a coverage profile and open it in a browser.
65 | 	$(GO) test -coverprofile cover.out ./...
66 | 	$(GO) tool cover -html=cover.out
67 | 
68 | licenses: # Runs go-licenses to check the licenses of the dependencies and generate a CSV file.
69 | 	$(GO) run github.com/google/go-licenses@latest report --template 'license-3rdparty.tpl' --ignore 'github.com/DataDog/documentor' 'github.com/DataDog/documentor' > LICENSE-3rdparty.csv
70 | 
71 | clean: # Cleans cache files from tests and deletes any build output.
72 | 	$(RM) -f cover.out documentor documentor.1
73 | 
74 | .PHONY: all pre-commit commit push build doc install tidy fmt lint vulnerabilities test test/coverage licenses clean
75 | 


--------------------------------------------------------------------------------
/NOTICE:
--------------------------------------------------------------------------------
1 | Copyright 2024-Present Datadog, Inc.
2 | 
3 | This product includes software developed at Datadog (<https://www.datadoghq.com/).>
4 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
  1 | # `documentor`
  2 | 
  3 | `documentor` is an easy-to-use, efficient, and powerful command-line
  4 | application that uses the power of AI to review documentation and
  5 | provide feedback on how to improve it, draft new documentation from
  6 | scratch, and more.
  7 | 
  8 | It assists documentation writers in creating better documentation by
  9 | automating parts of the writing and review process, allowing them to
 10 | focus on the content and structure of the document itself.
 11 | 
 12 | ## Installation
 13 | 
 14 | ### From source
 15 | 
 16 | First, ensure that the following dependencies are installed:
 17 | 
 18 | - Go 1.24 or above.
 19 | - make.
 20 | - [scdoc](https://git.sr.ht/~sircmpwn/scdoc).
 21 | 
 22 | Optionally, you can install
 23 | [glow](https://github.com/charmbracelet/glow) to render the Markdown
 24 | output of the `review` command with more style.
 25 | 
 26 | Then, switch to the latest stable tag (`v1.2.0`), compile, and install:
 27 | 
 28 | ```bash
 29 | git checkout v1.2.0
 30 | make
 31 | sudo make install
 32 | ```
 33 | 
 34 | ## Usage
 35 | 
 36 | > [!NOTE] 
 37 | > If you're a Datadog employee, please follow [the documentation in
 38 | > Confluence](https://datadoghq.atlassian.net/wiki/spaces/Cloudcraft/pages/4780427137/Using+Documentor).
 39 | 
 40 | ```bash
 41 | $ documentor --help
 42 | NAME:
 43 |    documentor - improve technical documentation with the power of AI
 44 | 
 45 | USAGE:
 46 |    documentor [global options] command [command options]
 47 | 
 48 | VERSION:
 49 |    1.2.0
 50 | 
 51 | COMMANDS:
 52 |    review, r    review technical documentation
 53 |    describe, d  describe an image and generate alt text
 54 |    draft, D     draft new documentation based on the provided notes
 55 | 
 56 | GLOBAL OPTIONS:
 57 |    --key value, -k value          the API key to use [$DOCUMENTOR_KEY]
 58 |    --provider value, -p value     the AI provider to use (default: "openai") [$DOCUMENTOR_PROVIDER]
 59 |    --endpoint value, -e value     the API endpoint to use (currently only used for the Datadog provider) [$DOCUMENTOR_ENDPOINT]
 60 |    --model value, -m value        the AI model to use (default: "gpt-4o") [$DOCUMENTOR_MODEL]
 61 |    --temperature value, -t value  the temperature to use for the model (default: 0.8) [$DOCUMENTOR_TEMPERATURE]
 62 |    --help, -h                     show help
 63 |    --version, -v                  print the version
 64 | ```
 65 | 
 66 | ### Examples
 67 | 
 68 | **1. Review a documentation file using the default provider, OpenAI:**
 69 | 
 70 | ```bash
 71 | documentor --key 'your-openai-api-key' review '/path/to/file.md'
 72 | ```
 73 | 
 74 | **2. Review a documentation file with the API key set in the environment:**
 75 | 
 76 | ```bash
 77 | export DOCUMENTOR_KEY='your-openai-api-key'
 78 | documentor review '/path/to/file.md'
 79 | ```
 80 | 
 81 | **3. Save the output to a file:**
 82 | 
 83 | ```bash
 84 | documentor review '/path/to/file.md' >> review.md
 85 | ```
 86 | 
 87 | **4. Format the default Markdown output with glow:**
 88 | 
 89 | ```bash
 90 | documentor review '/path/to/file.md' | glow
 91 | ```
 92 | 
 93 | **5. Describe an image:**
 94 | 
 95 | ```bash
 96 | documentor describe '/path/to/image.png'
 97 | ```
 98 | 
 99 | **6. Describe an image with context:**
100 | 
101 | ```bash
102 | documentor describe --context 'This my cat, Mittens.' '/path/to/image.png'
103 | ```
104 | 
105 | **7. Describe an image and generate a filename for the image:**
106 | 
107 | ```bash
108 | documentor describe --filename '/path/to/image.png'
109 | ```
110 | 
111 | **8. Draft a document based on your notes:**
112 | 
113 | ```bash
114 | documentor draft '/path/to/notes/file.md'
115 | ```
116 | 
117 | **9. Draft a document using Anthropic as the AI provider:**
118 | 
119 | ```bash
120 | documentor --provider 'anthropic' --key 'your-anthropic-api-key' draft '/path/to/notes/file.md'
121 | ```
122 | 
123 | **10. Review a document using a different LLM model:**
124 | 
125 | ```bash
126 | documentor --model 'o3-mini' review '/path/to/file.md'
127 | ```
128 | 
129 | Refer to the _documentor(1)_ manpage after installation for more
130 | information.
131 | 
132 | ## Contributing
133 | 
134 | Anyone can help make `documentor` better. Refer to the [contribution
135 | guidelines](CONTRIBUTING.md) for more information.
136 | 
137 | ---
138 | 
139 | This project is released under the [Apache-2.0 License](LICENSE.md).
140 | 


--------------------------------------------------------------------------------
/doc/documentor.1.scd:
--------------------------------------------------------------------------------
  1 | documentor(1)
  2 | 
  3 | # NAME
  4 | 
  5 | documentor - review technical documentation with the power of AI
  6 | 
  7 | # SYNOPSIS
  8 | 
  9 | *documentor* [OPTIONS] COMMAND [ARGUMENTS]
 10 | 
 11 | # DESCRIPTION
 12 | 
 13 | *documentor* is an easy-to-use, efficient, and powerful command-line application
 14 | that uses the power of AI to review technical documentation and provide feedback
 15 | on how to improve it. It can also describe images and generate alt text for
 16 | them.
 17 | 
 18 | # OPTIONS
 19 | 
 20 | *-k*, *--key* <*API_KEY*>
 21 | 	Specifies the API key to use for authentication with the AI provider. Can be
 22 | 	set with the DOCUMENTOR_KEY environment variable.
 23 | 
 24 | *-p*, *--provider* <*PROVIDER*>
 25 | 	Specifies the AI provider to use. Default is "openai".Can be set with the
 26 | 	DOCUMENTOR_PROVIDER environment variable.
 27 | 
 28 | *-e*, *--endpoint* <*ENDPOINT*>
 29 | 	Specifies the API endpoint to use when communicating with the AI provider.
 30 | 	Currently only supported by Datadog. Can be set with the DOCUMENTOR_ENDPOINT
 31 | 	environment variable.
 32 | 
 33 | *-m*, *--model* <*MODEL*>
 34 | 	Specifies the model to use when generating text. Defaults is "gpt-4o" for
 35 | 	OpenAI and Datadog and "claude-3-5-sonnet-latest" for Anthropic. Can be
 36 | 	set with the DOCUMENTOR_MODEL environment variable.
 37 | 
 38 | *-t*, *--temperature* <*TEMPERATURE*>
 39 | 	Specifies the temperature to use when generating text. Default is 0.8. Can
 40 | 	be set with the DOCUMENTOR_TEMPERATURE environment variable.
 41 | 
 42 | *-h*, *--help*
 43 | 	Shows help message and quits.
 44 | 
 45 | *-v*, *--version*
 46 | 	Shows version information and quits.
 47 | 
 48 | # COMMANDS
 49 | 
 50 | *review* <*FILE*>
 51 | 	Reviews the documentation in the specified file.
 52 | 
 53 | *describe* [*OPTIONS*] <*FILE*>
 54 | 	Describes the image and generates alt text for it.
 55 | 
 56 | 	Options are:
 57 | 
 58 | 	*-c*, *--context* <*CONTEXT*>
 59 | 		Specifies the context around the image.
 60 | 
 61 | 	*-f*, *--filename*
 62 | 		Whether to generate a filename based on the image content.
 63 | 
 64 | *draft* <*FILE*>
 65 | 	Generates a document based on the notes provided in the specified file.
 66 | 
 67 | 	For the best results, your notes file should have a clear structure with a
 68 | 	specific request and bullet points for each piece of information.
 69 | 
 70 | 	For example:
 71 | 
 72 | 	```
 73 | 	I need to write technical documentation for a new feature in Datadog. The
 74 | 	feature is called "Cool Feature" and it allows users to do something cool.
 75 | 
 76 | 	- Information about the feature.
 77 | 	- More information about the feature.
 78 | 	- Even more information about the feature.
 79 | 	```
 80 | 
 81 | 	If you are not satisfied with the generated document, tweak the request part
 82 | 	of your notes file and try again.
 83 | 
 84 | # ARGUMENTS
 85 | 
 86 | <*API_KEY*>
 87 | 	The API key to use for authentication with the AI provider starting with the
 88 | 	"sk-" prefix. OpenAI expects a 51-character long key, while Anthropic
 89 | 	expects a 108-character long key.
 90 | 
 91 | <*PROVIDER*>
 92 | 	The AI provider to use. Can be one of the supported providers. Default is
 93 | 	"openai".
 94 | 
 95 | 	*Supported providers*:
 96 | 
 97 | 	- OpenAI: `openai`
 98 | 	- Anthropic: `anthropic`
 99 | 	- Datadog: `datadog`
100 | 
101 | <*MODEL*>
102 | 	The model to use when generating text for each command. The command expects
103 | 	a string like "gpt-4o" or "claude-3-5-sonnet-latest". Refer to the
104 | 	provider's documentation for the available models. Default is "gpt-4o" for
105 | 	OpenAI and Datadog and "claude-3-5-sonnet-latest" for Anthropic.
106 | 
107 | <*TEMPERATURE*>
108 | 	The temperature to use when generating text. The temperature is a float
109 | 	value between 0 and 1 that controls the randomness of the response. A value
110 | 	of 0 will always return the most likely output, while a value of 1 will
111 | 	return a more random token. Default is 0.8.
112 | 
113 | <*FILE*>
114 | 	The path to a documentation file to review, image to describe, or file with
115 | 	notes about a document to draft.
116 | 
117 | <*CONTEXT*>
118 | 	The context around the image to describe. This can be a short description of
119 | 	the purpose of the image, e.g., "Picture of a Cloudcraft diagram", or even
120 | 	the filename of the image.
121 | 
122 | # ENVIROMENT
123 | 
124 | *DOCUMENTOR_KEY*
125 | 	Specifies the OpenAI API key to use for authentication.
126 | 
127 | *DOCUMENTOR_PROVIDER*
128 | 	Specifies the AI provider to use. Default is "openai".
129 | 
130 | *DOCUMENTOR_ENDPOINT*
131 | 	Specifies the API endpoint to use when communicating with the AI provider.
132 | 	Currently only supported by Datadog.
133 | 
134 | *DOCUMENTOR_MODEL*
135 | 	Specifies the model to use when generating text. Defaults is "gpt-4o" for
136 | 	OpenAI and "claude-3-5-sonnet-latest" for Anthropic.
137 | 
138 | *DOCUMENTOR_TEMPERATURE*
139 | 	Specifies the temperature to use when generating text. Default is 0.8.
140 | 
141 | # RETURN VALUES
142 | 
143 | *0*
144 | 	Success.
145 | 
146 | *1*
147 | 	Unknown error.
148 | 
149 | *2*
150 | 	Incorrect usage of the application.
151 | 
152 | *3*
153 | 	I/O error when reading a file.
154 | 
155 | *4*
156 | 	File not found.
157 | 
158 | *5*
159 | 	Permission denied when reading a file.
160 | 
161 | *6*
162 | 	Error when communicating with the OpenAI API.
163 | 
164 | *7*
165 | 	Missing API key.
166 | 
167 | *8*
168 | 	Timed out when communicating with the OpenAI API.
169 | 
170 | *9*
171 | 	Invalid input.
172 | 
173 | # EXAMPLES
174 | 
175 | *1. Review a documentation file*
176 | 	$ documentor --key 'sk-the-rest-of-the-api-key' review documentation.md
177 | 
178 | *2. Review a documentation file with the API key set in the environment*
179 | 	$ documentor review documentation.md
180 | 
181 | *3. Save the output to a file*
182 | 	$ documentor review documentation.md >> review.md
183 | 
184 | *4. Format the default Markdown output with glow*
185 | 	$ documentor review documentation.md | glow
186 | 
187 | *5. Describe an image*
188 | 	$ documentor describe image.png
189 | 
190 | *6. Describe an image with context*
191 | 	$ documentor describe --context 'This my cat, Mittens.' image.png
192 | 
193 | *7. Describe an image and generate a filename*
194 | 	$ documentor describe --filename image.png
195 | 
196 | *8. Draft a document based on notes*
197 | 	$ documentor draft notes.md
198 | 
199 | *9. Draft a document using Anthropic as the AI provider*
200 | 	$ documentor --provider 'anthropic' draft notes.md
201 | 
202 | # AUTHORS
203 | 
204 | Maintained by James Pond <james.pond@datadoghq.com>
205 | 


--------------------------------------------------------------------------------
/go.mod:
--------------------------------------------------------------------------------
 1 | module github.com/DataDog/documentor
 2 | 
 3 | go 1.24
 4 | 
 5 | require (
 6 | 	git.sr.ht/~jamesponddotco/xstd-go v0.8.0
 7 | 	github.com/liushuangls/go-anthropic/v2 v2.13.1
 8 | 	github.com/sashabaranov/go-openai v1.37.0
 9 | 	github.com/urfave/cli/v2 v2.27.5
10 | )
11 | 
12 | require (
13 | 	github.com/cpuguy83/go-md2man/v2 v2.0.5 // indirect
14 | 	github.com/russross/blackfriday/v2 v2.1.0 // indirect
15 | 	github.com/xrash/smetrics v0.0.0-20240521201337-686a1a2994c1 // indirect
16 | )
17 | 


--------------------------------------------------------------------------------
/go.sum:
--------------------------------------------------------------------------------
 1 | git.sr.ht/~jamesponddotco/xstd-go v0.8.0 h1:2FcwEvLunzTL/tSvlcs+pO60O8rlkIcr8bSoJWuT2W0=
 2 | git.sr.ht/~jamesponddotco/xstd-go v0.8.0/go.mod h1:L0SjmhDqcj/gR7oeNof+ed6l9VPk6oHPeNQSoaFBRFk=
 3 | github.com/cpuguy83/go-md2man/v2 v2.0.5 h1:ZtcqGrnekaHpVLArFSe4HK5DoKx1T0rq2DwVB0alcyc=
 4 | github.com/cpuguy83/go-md2man/v2 v2.0.5/go.mod h1:tgQtvFlXSQOSOSIRvRPT7W67SCa46tRHOmNcaadrF8o=
 5 | github.com/liushuangls/go-anthropic/v2 v2.13.1 h1:RiLr5Ec7gDFu3BFiT/I65mdUI3+OxSjSHooqY/VLJ+Y=
 6 | github.com/liushuangls/go-anthropic/v2 v2.13.1/go.mod h1:BG+8VNOl7eoEjwW1yhOzFArWA9rzaG2aouth+PQyZgQ=
 7 | github.com/russross/blackfriday/v2 v2.1.0 h1:JIOH55/0cWyOuilr9/qlrm0BSXldqnqwMsf35Ld67mk=
 8 | github.com/russross/blackfriday/v2 v2.1.0/go.mod h1:+Rmxgy9KzJVeS9/2gXHxylqXiyQDYRxCVz55jmeOWTM=
 9 | github.com/sashabaranov/go-openai v1.37.0 h1:hQQowgYm4OXJ1Z/wTrE+XZaO20BYsL0R3uRPSpfNZkY=
10 | github.com/sashabaranov/go-openai v1.37.0/go.mod h1:lj5b/K+zjTSFxVLijLSTDZuP7adOgerWeFyZLUhAKRg=
11 | github.com/urfave/cli/v2 v2.27.5 h1:WoHEJLdsXr6dDWoJgMq/CboDmyY/8HMMH1fTECbih+w=
12 | github.com/urfave/cli/v2 v2.27.5/go.mod h1:3Sevf16NykTbInEnD0yKkjDAeZDS0A6bzhBH5hrMvTQ=
13 | github.com/xrash/smetrics v0.0.0-20240521201337-686a1a2994c1 h1:gEOO8jv9F4OT7lGCjxCBTO/36wtF6j2nSip77qHd4x4=
14 | github.com/xrash/smetrics v0.0.0-20240521201337-686a1a2994c1/go.mod h1:Ohn+xnUBiLI6FVj/9LpzZWtj1/D6lUovWYBkxHVV3aM=
15 | 


--------------------------------------------------------------------------------
/internal/ai/ai.go:
--------------------------------------------------------------------------------
 1 | // Unless explicitly stated otherwise all files in this repository are licensed
 2 | // under the Apache-2.0 License. This product includes software developed at
 3 | // Datadog (https://www.datadoghq.com/).
 4 | // Copyright 2024-Present Datadog, Inc.
 5 | 
 6 | // Package ai provides an interface for interacting with AI providers.
 7 | package ai
 8 | 
 9 | import "github.com/urfave/cli/v2"
10 | 
11 | // List of supported AI providers.
12 | const (
13 | 	ProviderOpenAI    string = "openai"
14 | 	ProviderAnthropic string = "anthropic"
15 | 	ProviderDatadog   string = "datadog"
16 | )
17 | 
18 | // Provider represents an LLM provider such as OpenAI, Anthropic, Mistral, etc.
19 | type Provider interface {
20 | 	// Name returns the name of the provider.
21 | 	Name() string
22 | 
23 | 	// Do performs a single API request to the provider's API, returning a
24 | 	// response for the provided Request.
25 | 	//
26 | 	// Do should attempt to interpret the response from the provider and return
27 | 	// it as streaming strings to ctx.App.Writer if successful.
28 | 	Do(ctx *cli.Context, req *Request) error
29 | }
30 | 
31 | // Request represents an HTTP request to an AI provider's API.
32 | type Request struct {
33 | 	// Context is a string that provides additional context for the request. It
34 | 	// is only used if Content is a base64-encoded image.
35 | 	Context string
36 | 
37 | 	// Model is the full name of the LLM model to use for the request, e.g.
38 | 	// "gpt-4o-mini" or "claude-3-5-sonnet-20240620".
39 | 	Model string
40 | 
41 | 	// SystemPrompt is a set of instructions for the AI model to follow when
42 | 	// generating a response.
43 | 	SystemPrompt string
44 | 
45 | 	// UserPrompt is a second set of instructions for the AI model to follow
46 | 	// when generating a response.
47 | 	//
48 | 	// This prompt is sent to the AI provider after the system prompt and can be
49 | 	// used to provide additional context or constraints for the response.
50 | 	UserPrompt string
51 | 
52 | 	// Text represents content that is sent to the AI provider together with the
53 | 	// user prompt for generating a response.
54 | 	Text []byte
55 | 
56 | 	// Image represents an image attachment that is sent to the AI provider
57 | 	// together with the user prompt for generating a response.
58 | 	Image []byte
59 | 
60 | 	// Temperature is a float between 0 and 1 that controls the randomness of
61 | 	// the response. A value of 0 will always return the most likely token,
62 | 	// while a value of 1 will sample from the distribution of tokens.
63 | 	Temperature float32
64 | }
65 | 
66 | // NewRequest returns a new Request instance for a text-based user prompt.
67 | func NewRequest(text []byte, model, userPrompt, systemPrompt string, temperature float32) *Request {
68 | 	return &Request{
69 | 		Text:         text,
70 | 		Model:        model,
71 | 		SystemPrompt: systemPrompt,
72 | 		UserPrompt:   userPrompt,
73 | 		Temperature:  temperature,
74 | 	}
75 | }
76 | 
77 | // NewRequestWithImage returns a new Request instance for an user prompt with a
78 | // base64-encoded image attachment.
79 | func NewRequestWithImage(image []byte, model, context, userPrompt, systemPrompt string, temperature float32) *Request {
80 | 	if context != "" {
81 | 		userPrompt += "/n/n Here is some context for the image: " + context
82 | 	}
83 | 
84 | 	return &Request{
85 | 		Image:        image,
86 | 		Context:      context,
87 | 		Model:        model,
88 | 		SystemPrompt: systemPrompt,
89 | 		UserPrompt:   userPrompt,
90 | 		Temperature:  temperature,
91 | 	}
92 | }
93 | 


--------------------------------------------------------------------------------
/internal/ai/anthropic/anthropic.go:
--------------------------------------------------------------------------------
 1 | // Unless explicitly stated otherwise all files in this repository are licensed
 2 | // under the Apache-2.0 License. This product includes software developed at
 3 | // Datadog (https://www.datadoghq.com/).
 4 | // Copyright 2024-Present Datadog, Inc.
 5 | 
 6 | // Package anthropic provides a client wrapper for the Anthropic API that
 7 | // complies with the ai.Provider interface.
 8 | package anthropic
 9 | 
10 | import (
11 | 	"fmt"
12 | 
13 | 	"git.sr.ht/~jamesponddotco/xstd-go/xerrors"
14 | 	"github.com/DataDog/documentor/internal/ai"
15 | 	"github.com/liushuangls/go-anthropic/v2"
16 | 	"github.com/urfave/cli/v2"
17 | )
18 | 
19 | // ErrInvalidRequest is returned when the request provided to the OpenAI API is
20 | // missing both an image and text.
21 | const ErrInvalidRequest xerrors.Error = "invalid request: must provide either an image or text"
22 | 
23 | // DefaultModel is the default model to use when making requests to the
24 | // Anthropic API.
25 | const DefaultModel = "claude-3-5-sonnet-latest"
26 | 
27 | // Client represents an Anthropic API client that complies with the ai.Provider
28 | // interface.
29 | type Client struct {
30 | 	// ai is the proper Anthropic API client.
31 | 	ai *anthropic.Client
32 | }
33 | 
34 | // NewClient returns a new Client instance with the given API key.
35 | func NewClient(key string) *Client {
36 | 	return &Client{
37 | 		ai: anthropic.NewClient(key),
38 | 	}
39 | }
40 | 
41 | // Compile-time check to ensure Client implements the ai.Provider interface.
42 | var _ ai.Provider = (*Client)(nil)
43 | 
44 | // Name returns the name of the provider.
45 | func (*Client) Name() string {
46 | 	return "Anthropic"
47 | }
48 | 
49 | // Do performs a single API request to the Anthropic API, returning a response for
50 | // the provided Request and writing said response to ctx.App.Writer as a stream
51 | // of strings.
52 | func (c *Client) Do(ctx *cli.Context, request *ai.Request) error {
53 | 	var req anthropic.MessagesStreamRequest
54 | 
55 | 	switch {
56 | 	case request.Image != nil:
57 | 		req = NewRequestWithImage(ctx, request)
58 | 	case request.Text != nil:
59 | 		req = NewRequest(ctx, request)
60 | 	default:
61 | 		return ErrInvalidRequest
62 | 	}
63 | 
64 | 	_, err := c.ai.CreateMessagesStream(ctx.Context, req)
65 | 	if err != nil {
66 | 		return fmt.Errorf("%w", err)
67 | 	}
68 | 
69 | 	fmt.Fprintf(ctx.App.Writer, "\n")
70 | 
71 | 	return nil
72 | }
73 | 


--------------------------------------------------------------------------------
/internal/ai/anthropic/request.go:
--------------------------------------------------------------------------------
 1 | // Unless explicitly stated otherwise all files in this repository are licensed
 2 | // under the Apache-2.0 License. This product includes software developed at
 3 | // Datadog (https://www.datadoghq.com/).
 4 | // Copyright 2024-Present Datadog, Inc.
 5 | 
 6 | package anthropic
 7 | 
 8 | import (
 9 | 	"fmt"
10 | 
11 | 	"git.sr.ht/~jamesponddotco/xstd-go/xunsafe"
12 | 	"github.com/DataDog/documentor/internal/ai"
13 | 	"github.com/liushuangls/go-anthropic/v2"
14 | 	"github.com/urfave/cli/v2"
15 | )
16 | 
17 | // NewRequest creates a chat completion request with streaming support for the
18 | // Anthropic API given the provided ai.Request object.
19 | func NewRequest(ctx *cli.Context, req *ai.Request) anthropic.MessagesStreamRequest {
20 | 	text := xunsafe.BytesToString(req.Text)
21 | 
22 | 	return anthropic.MessagesStreamRequest{
23 | 		MessagesRequest: anthropic.MessagesRequest{
24 | 			Model:       anthropic.Model(req.Model),
25 | 			Temperature: &req.Temperature,
26 | 			System:      req.SystemPrompt,
27 | 			MaxTokens:   4096,
28 | 			Stream:      true,
29 | 			Messages: []anthropic.Message{
30 | 				{
31 | 					Role: anthropic.RoleUser,
32 | 					Content: []anthropic.MessageContent{
33 | 						anthropic.NewTextMessageContent(text),
34 | 						anthropic.NewTextMessageContent(req.UserPrompt),
35 | 					},
36 | 				},
37 | 			},
38 | 		},
39 | 		OnContentBlockDelta: func(data anthropic.MessagesEventContentBlockDeltaData) {
40 | 			fmt.Fprintf(ctx.App.Writer, "%s", *data.Delta.Text)
41 | 		},
42 | 	}
43 | }
44 | 
45 | // NewRequestWithImage creates a chat completion request with streaming support
46 | // for the Anthropic API given the provided ai.Request object. The req.Content
47 | // field should be a base64-encoded image.
48 | func NewRequestWithImage(ctx *cli.Context, req *ai.Request) anthropic.MessagesStreamRequest {
49 | 	return anthropic.MessagesStreamRequest{
50 | 		MessagesRequest: anthropic.MessagesRequest{
51 | 			Model:       anthropic.Model(req.Model),
52 | 			Temperature: &req.Temperature,
53 | 			System:      req.SystemPrompt,
54 | 			MaxTokens:   4096,
55 | 			Stream:      true,
56 | 			Messages: []anthropic.Message{
57 | 				{
58 | 					Role: anthropic.RoleUser,
59 | 					Content: []anthropic.MessageContent{
60 | 						anthropic.NewImageMessageContent(anthropic.MessageContentSource{
61 | 							Type:      "base64",
62 | 							MediaType: "image/jpeg",
63 | 							Data:      req.Image,
64 | 						}),
65 | 						anthropic.NewTextMessageContent(req.UserPrompt),
66 | 					},
67 | 				},
68 | 			},
69 | 		},
70 | 		OnContentBlockDelta: func(data anthropic.MessagesEventContentBlockDeltaData) {
71 | 			fmt.Fprintf(ctx.App.Writer, "%s", *data.Delta.Text)
72 | 		},
73 | 	}
74 | }
75 | 


--------------------------------------------------------------------------------
/internal/ai/datadog/datadog.go:
--------------------------------------------------------------------------------
 1 | // Unless explicitly stated otherwise all files in this repository are licensed
 2 | // under the Apache-2.0 License. This product includes software developed at
 3 | // Datadog (https://www.datadoghq.com/).
 4 | // Copyright 2024-Present Datadog, Inc.
 5 | 
 6 | // Package datadog provides a client wrapper for the Datadog AI proxy API that
 7 | // complies with the ai.Provider interface.
 8 | package datadog
 9 | 
10 | import (
11 | 	"errors"
12 | 	"fmt"
13 | 	"io"
14 | 	"net/http"
15 | 	"time"
16 | 
17 | 	"git.sr.ht/~jamesponddotco/xstd-go/xerrors"
18 | 	"github.com/DataDog/documentor/internal/ai"
19 | 	"github.com/DataDog/documentor/internal/errno"
20 | 	"github.com/sashabaranov/go-openai"
21 | 	"github.com/urfave/cli/v2"
22 | )
23 | 
24 | // ErrInvalidRequest is returned when the request provided to the Datadog proxy
25 | // API is missing both an image and text.
26 | const ErrInvalidRequest xerrors.Error = "invalid request: must provide either an image or text"
27 | 
28 | // DefaultModel is the default model to use when making requests to the API.
29 | const DefaultModel = "gpt-4o"
30 | 
31 | // Client represents a Datadog AI proxy API client that complies with the
32 | // ai.Provider interface.
33 | type Client struct {
34 | 	// ai is the proper Datadog proxy client.
35 | 	ai *openai.Client
36 | }
37 | 
38 | // NewClient returns a new Client instance with the given email.
39 | func NewClient(endpoint, email string) *Client {
40 | 	cfg := openai.DefaultConfig("not-a-real-key")
41 | 	cfg.BaseURL = endpoint
42 | 	cfg.HTTPClient = &http.Client{
43 | 		Transport: &Transport{
44 | 			Email: email,
45 | 		},
46 | 		Timeout: 1 * time.Minute,
47 | 	}
48 | 
49 | 	return &Client{
50 | 		ai: openai.NewClientWithConfig(cfg),
51 | 	}
52 | }
53 | 
54 | // Compile-time check to ensure Client implements the ai.Provider interface.
55 | var _ ai.Provider = (*Client)(nil)
56 | 
57 | // Name returns the name of the provider.
58 | func (*Client) Name() string {
59 | 	return "Datadog"
60 | }
61 | 
62 | // Do performs a single API request to the Datadog API, returning a response for
63 | // the provided Request and writing said response to ctx.App.Writer as a stream
64 | // of strings.
65 | func (c *Client) Do(ctx *cli.Context, request *ai.Request) error {
66 | 	var req openai.ChatCompletionRequest
67 | 
68 | 	switch {
69 | 	case request.Image != nil:
70 | 		req = NewRequestWithImage(request)
71 | 	case request.Text != nil:
72 | 		req = NewRequest(request)
73 | 	default:
74 | 		return ErrInvalidRequest
75 | 	}
76 | 
77 | 	resp, err := c.ai.CreateChatCompletionStream(ctx.Context, req)
78 | 	if err != nil {
79 | 		return fmt.Errorf("%w", err)
80 | 	}
81 | 
82 | 	for {
83 | 		text, err := resp.Recv() //nolint:govet // Fixing this is more trouble than it's worth.
84 | 		if errors.Is(err, io.EOF) {
85 | 			fmt.Fprintf(ctx.App.Writer, "\n")
86 | 
87 | 			break
88 | 		}
89 | 
90 | 		if err != nil {
91 | 			return errno.New(errno.ExitAPIError, fmt.Errorf("failed to get response: %w", err))
92 | 		}
93 | 
94 | 		fmt.Fprintf(ctx.App.Writer, "%s", text.Choices[0].Delta.Content)
95 | 	}
96 | 
97 | 	return nil
98 | }
99 | 


--------------------------------------------------------------------------------
/internal/ai/datadog/request.go:
--------------------------------------------------------------------------------
 1 | // Unless explicitly stated otherwise all files in this repository are licensed
 2 | // under the Apache-2.0 License. This product includes software developed at
 3 | // Datadog (https://www.datadoghq.com/).
 4 | // Copyright 2024-Present Datadog, Inc.
 5 | 
 6 | package datadog
 7 | 
 8 | import (
 9 | 	"git.sr.ht/~jamesponddotco/xstd-go/xunsafe"
10 | 	"github.com/DataDog/documentor/internal/ai"
11 | 	"github.com/DataDog/documentor/internal/xbase64"
12 | 	"github.com/sashabaranov/go-openai"
13 | )
14 | 
15 | // NewTextRequest creates a chat completion request with streaming support for
16 | // the Datadog API given the provided ai.Request object.
17 | func NewRequest(req *ai.Request) openai.ChatCompletionRequest {
18 | 	text := xunsafe.BytesToString(req.Text)
19 | 
20 | 	return openai.ChatCompletionRequest{
21 | 		Model:       req.Model,
22 | 		Temperature: req.Temperature,
23 | 		Stream:      true,
24 | 		Messages: []openai.ChatCompletionMessage{
25 | 			{
26 | 				Role:    openai.ChatMessageRoleUser,
27 | 				Content: text,
28 | 			},
29 | 			{
30 | 				Role:    openai.ChatMessageRoleUser,
31 | 				Content: req.UserPrompt,
32 | 			},
33 | 			{
34 | 				Role:    openai.ChatMessageRoleSystem,
35 | 				Content: req.SystemPrompt,
36 | 			},
37 | 		},
38 | 	}
39 | }
40 | 
41 | // NewRequestWithImage creates a chat completion request with streaming support
42 | // for the Datadog API given the provided ai.Request object. The req.Content
43 | // field should be a base64-encoded image.
44 | func NewRequestWithImage(req *ai.Request) openai.ChatCompletionRequest {
45 | 	image := xbase64.EncodeImageToDataURL(req.Image)
46 | 
47 | 	return openai.ChatCompletionRequest{
48 | 		Model:       req.Model,
49 | 		Temperature: req.Temperature,
50 | 		Stream:      true,
51 | 		Messages: []openai.ChatCompletionMessage{
52 | 			{
53 | 				Role:    openai.ChatMessageRoleUser,
54 | 				Content: req.UserPrompt,
55 | 			},
56 | 			{
57 | 				Role: openai.ChatMessageRoleUser,
58 | 				MultiContent: []openai.ChatMessagePart{
59 | 					{
60 | 						Type: openai.ChatMessagePartTypeImageURL,
61 | 						ImageURL: &openai.ChatMessageImageURL{
62 | 							URL:    image,
63 | 							Detail: openai.ImageURLDetailAuto,
64 | 						},
65 | 					},
66 | 				},
67 | 			},
68 | 			{
69 | 				Role:    openai.ChatMessageRoleSystem,
70 | 				Content: req.SystemPrompt,
71 | 			},
72 | 		},
73 | 	}
74 | }
75 | 


--------------------------------------------------------------------------------
/internal/ai/datadog/transport.go:
--------------------------------------------------------------------------------
 1 | package datadog
 2 | 
 3 | import (
 4 | 	"fmt"
 5 | 	"net/http"
 6 | )
 7 | 
 8 | // Transport is a custom http.RoundTripper that supports adding custom headers
 9 | // to the request to the Datadog AI proxy API.
10 | type Transport struct {
11 | 	// Email is the email address of the user.
12 | 	Email string
13 | }
14 | 
15 | // RoundTrip implements the http.RoundTripper interface.
16 | func (t *Transport) RoundTrip(req *http.Request) (*http.Response, error) {
17 | 	req.Header.Set("X-Datadog-Org-Id", "2")
18 | 	req.Header.Set("X-Datadog-Source", "documentor")
19 | 	req.Header.Set("X-Datadog-User-Id", t.Email)
20 | 
21 | 	resp, err := http.DefaultTransport.RoundTrip(req)
22 | 	if err != nil {
23 | 		return nil, fmt.Errorf("%w", err)
24 | 	}
25 | 
26 | 	return resp, nil
27 | }
28 | 


--------------------------------------------------------------------------------
/internal/ai/openai/openai.go:
--------------------------------------------------------------------------------
 1 | // Unless explicitly stated otherwise all files in this repository are licensed
 2 | // under the Apache-2.0 License. This product includes software developed at
 3 | // Datadog (https://www.datadoghq.com/).
 4 | // Copyright 2024-Present Datadog, Inc.
 5 | 
 6 | // Package openai provides a client wrapper for the OpenAI API that complies
 7 | // with the ai.Provider interface.
 8 | package openai
 9 | 
10 | import (
11 | 	"errors"
12 | 	"fmt"
13 | 	"io"
14 | 
15 | 	"git.sr.ht/~jamesponddotco/xstd-go/xerrors"
16 | 	"github.com/DataDog/documentor/internal/ai"
17 | 	"github.com/DataDog/documentor/internal/errno"
18 | 	"github.com/sashabaranov/go-openai"
19 | 	"github.com/urfave/cli/v2"
20 | )
21 | 
22 | // ErrInvalidRequest is returned when the request provided to the OpenAI API is
23 | // missing both an image and text.
24 | const ErrInvalidRequest xerrors.Error = "invalid request: must provide either an image or text"
25 | 
26 | // DefaultModel is the default model to use when making requests to the OpenAI
27 | // API.
28 | const DefaultModel = "gpt-4o"
29 | 
30 | // Client represents an OpenAI API client that complies with the ai.Provider
31 | // interface.
32 | type Client struct {
33 | 	// ai is the proper OpenAI API client.
34 | 	ai *openai.Client
35 | }
36 | 
37 | // NewClient returns a new Client instance with the given API key.
38 | func NewClient(key string) *Client {
39 | 	return &Client{
40 | 		ai: openai.NewClient(key),
41 | 	}
42 | }
43 | 
44 | // Compile-time check to ensure Client implements the ai.Provider interface.
45 | var _ ai.Provider = (*Client)(nil)
46 | 
47 | // Name returns the name of the provider.
48 | func (*Client) Name() string {
49 | 	return "OpenAI"
50 | }
51 | 
52 | // Do performs a single API request to the OpenAI API, returning a response for
53 | // the provided Request and writing said response to ctx.App.Writer as a stream
54 | // of strings.
55 | func (c *Client) Do(ctx *cli.Context, request *ai.Request) error {
56 | 	var req openai.ChatCompletionRequest
57 | 
58 | 	switch {
59 | 	case request.Image != nil:
60 | 		req = NewRequestWithImage(request)
61 | 	case request.Text != nil:
62 | 		req = NewRequest(request)
63 | 	default:
64 | 		return ErrInvalidRequest
65 | 	}
66 | 
67 | 	resp, err := c.ai.CreateChatCompletionStream(ctx.Context, req)
68 | 	if err != nil {
69 | 		return fmt.Errorf("%w", err)
70 | 	}
71 | 
72 | 	for {
73 | 		text, err := resp.Recv() //nolint:govet // Fixing this is more trouble than it's worth.
74 | 		if errors.Is(err, io.EOF) {
75 | 			fmt.Fprintf(ctx.App.Writer, "\n")
76 | 
77 | 			break
78 | 		}
79 | 
80 | 		if err != nil {
81 | 			return errno.New(errno.ExitAPIError, fmt.Errorf("failed to get response: %w", err))
82 | 		}
83 | 
84 | 		fmt.Fprintf(ctx.App.Writer, "%s", text.Choices[0].Delta.Content)
85 | 	}
86 | 
87 | 	return nil
88 | }
89 | 


--------------------------------------------------------------------------------
/internal/ai/openai/request.go:
--------------------------------------------------------------------------------
 1 | // Unless explicitly stated otherwise all files in this repository are licensed
 2 | // under the Apache-2.0 License. This product includes software developed at
 3 | // Datadog (https://www.datadoghq.com/).
 4 | // Copyright 2024-Present Datadog, Inc.
 5 | 
 6 | package openai
 7 | 
 8 | import (
 9 | 	"git.sr.ht/~jamesponddotco/xstd-go/xunsafe"
10 | 	"github.com/DataDog/documentor/internal/ai"
11 | 	"github.com/DataDog/documentor/internal/xbase64"
12 | 	"github.com/sashabaranov/go-openai"
13 | )
14 | 
15 | // NewTextRequest creates a chat completion request with streaming support for
16 | // the OpenAI API given the provided ai.Request object.
17 | func NewRequest(req *ai.Request) openai.ChatCompletionRequest {
18 | 	text := xunsafe.BytesToString(req.Text)
19 | 
20 | 	return openai.ChatCompletionRequest{
21 | 		Model:       req.Model,
22 | 		Temperature: req.Temperature,
23 | 		Stream:      true,
24 | 		Messages: []openai.ChatCompletionMessage{
25 | 			{
26 | 				Role:    openai.ChatMessageRoleUser,
27 | 				Content: text,
28 | 			},
29 | 			{
30 | 				Role:    openai.ChatMessageRoleUser,
31 | 				Content: req.UserPrompt,
32 | 			},
33 | 			{
34 | 				Role:    openai.ChatMessageRoleSystem,
35 | 				Content: req.SystemPrompt,
36 | 			},
37 | 		},
38 | 	}
39 | }
40 | 
41 | // NewRequestWithImage creates a chat completion request with streaming support
42 | // for the OpenAI API given the provided ai.Request object. The req.Content
43 | // field should be a base64-encoded image.
44 | func NewRequestWithImage(req *ai.Request) openai.ChatCompletionRequest {
45 | 	image := xbase64.EncodeImageToDataURL(req.Image)
46 | 
47 | 	return openai.ChatCompletionRequest{
48 | 		Model:       req.Model,
49 | 		Temperature: req.Temperature,
50 | 		Stream:      true,
51 | 		Messages: []openai.ChatCompletionMessage{
52 | 			{
53 | 				Role:    openai.ChatMessageRoleUser,
54 | 				Content: req.UserPrompt,
55 | 			},
56 | 			{
57 | 				Role: openai.ChatMessageRoleUser,
58 | 				MultiContent: []openai.ChatMessagePart{
59 | 					{
60 | 						Type: openai.ChatMessagePartTypeImageURL,
61 | 						ImageURL: &openai.ChatMessageImageURL{
62 | 							URL:    image,
63 | 							Detail: openai.ImageURLDetailAuto,
64 | 						},
65 | 					},
66 | 				},
67 | 			},
68 | 			{
69 | 				Role:    openai.ChatMessageRoleSystem,
70 | 				Content: req.SystemPrompt,
71 | 			},
72 | 		},
73 | 	}
74 | }
75 | 


--------------------------------------------------------------------------------
/internal/app/app.go:
--------------------------------------------------------------------------------
  1 | // Unless explicitly stated otherwise all files in this repository are licensed
  2 | // under the Apache-2.0 License. This product includes software developed at
  3 | // Datadog (https://www.datadoghq.com/).
  4 | // Copyright 2024-Present Datadog, Inc.
  5 | 
  6 | // Package app is the main package for the application.
  7 | package app
  8 | 
  9 | import (
 10 | 	"errors"
 11 | 	"fmt"
 12 | 	"os"
 13 | 
 14 | 	"github.com/DataDog/documentor/internal/ai"
 15 | 	"github.com/DataDog/documentor/internal/ai/openai"
 16 | 	"github.com/DataDog/documentor/internal/errno"
 17 | 	"github.com/DataDog/documentor/internal/meta"
 18 | 	"github.com/urfave/cli/v2"
 19 | )
 20 | 
 21 | // Run is the entry point for the application.
 22 | func Run(args []string) int {
 23 | 	app := cli.NewApp()
 24 | 	app.Name = meta.Name
 25 | 	app.Version = meta.Version
 26 | 	app.Usage = meta.Description
 27 | 	app.HideHelpCommand = true
 28 | 
 29 | 	app.Flags = []cli.Flag{
 30 | 		&cli.StringFlag{
 31 | 			Name:    "key",
 32 | 			Aliases: []string{"k"},
 33 | 			Usage:   "the API key to use",
 34 | 			EnvVars: []string{
 35 | 				"DOCUMENTOR_KEY",
 36 | 			},
 37 | 		},
 38 | 		&cli.StringFlag{
 39 | 			Name:    "provider",
 40 | 			Aliases: []string{"p"},
 41 | 			Usage:   "the AI provider to use",
 42 | 			Value:   ai.ProviderOpenAI,
 43 | 			EnvVars: []string{
 44 | 				"DOCUMENTOR_PROVIDER",
 45 | 			},
 46 | 		},
 47 | 		&cli.StringFlag{
 48 | 			Name:    "endpoint",
 49 | 			Aliases: []string{"e"},
 50 | 			Usage:   "the API endpoint to use (currently only used for the Datadog provider)",
 51 | 			EnvVars: []string{
 52 | 				"DOCUMENTOR_ENDPOINT",
 53 | 			},
 54 | 		},
 55 | 		&cli.StringFlag{
 56 | 			Name:    "model",
 57 | 			Aliases: []string{"m"},
 58 | 			Usage:   "the AI model to use",
 59 | 			Value:   openai.DefaultModel,
 60 | 			EnvVars: []string{
 61 | 				"DOCUMENTOR_MODEL",
 62 | 			},
 63 | 		},
 64 | 		&cli.Float64Flag{
 65 | 			Name:    "temperature",
 66 | 			Aliases: []string{"t"},
 67 | 			Usage:   "the temperature to use for the model",
 68 | 			Value:   0.8,
 69 | 			EnvVars: []string{
 70 | 				"DOCUMENTOR_TEMPERATURE",
 71 | 			},
 72 | 		},
 73 | 	}
 74 | 
 75 | 	app.Commands = []*cli.Command{
 76 | 		{
 77 | 			Name:    "review",
 78 | 			Aliases: []string{"r"},
 79 | 			Usage:   "review technical documentation",
 80 | 			Action:  ReviewAction,
 81 | 		},
 82 | 		{
 83 | 			Name:    "describe",
 84 | 			Aliases: []string{"d"},
 85 | 			Usage:   "describe an image and generate alt text",
 86 | 			Action:  DescribeAction,
 87 | 			Flags: []cli.Flag{
 88 | 				&cli.StringFlag{
 89 | 					Name:    "context",
 90 | 					Aliases: []string{"c"},
 91 | 					Usage:   "the context to use for the image",
 92 | 				},
 93 | 				&cli.BoolFlag{
 94 | 					Name:    "filename",
 95 | 					Aliases: []string{"f"},
 96 | 					Usage:   "whether to generate a filename",
 97 | 					Value:   false,
 98 | 				},
 99 | 			},
100 | 		},
101 | 		{
102 | 			Name:    "draft",
103 | 			Aliases: []string{"D"},
104 | 			Usage:   "draft new documentation based on the provided notes",
105 | 			Action:  DraftAction,
106 | 		},
107 | 	}
108 | 
109 | 	if err := app.Run(args); err != nil {
110 | 		var exitErr *errno.Error
111 | 
112 | 		if errors.As(err, &exitErr) {
113 | 			fmt.Fprintf(os.Stderr, "error: %q\n", err)
114 | 
115 | 			return exitErr.Code()
116 | 		}
117 | 
118 | 		fmt.Fprintf(os.Stderr, "error: unknown error: %q\n", err)
119 | 
120 | 		return int(errno.ExitError)
121 | 	}
122 | 
123 | 	return 0
124 | }
125 | 


--------------------------------------------------------------------------------
/internal/app/describe.go:
--------------------------------------------------------------------------------
  1 | // Unless explicitly stated otherwise all files in this repository are licensed
  2 | // under the Apache-2.0 License. This product includes software developed at
  3 | // Datadog (https://www.datadoghq.com/).
  4 | // Copyright 2024-Present Datadog, Inc.
  5 | 
  6 | package app
  7 | 
  8 | import (
  9 | 	"errors"
 10 | 	"fmt"
 11 | 	"os"
 12 | 	"strings"
 13 | 
 14 | 	"git.sr.ht/~jamesponddotco/xstd-go/xerrors"
 15 | 	"github.com/DataDog/documentor/internal/ai"
 16 | 	"github.com/DataDog/documentor/internal/ai/anthropic"
 17 | 	"github.com/DataDog/documentor/internal/ai/datadog"
 18 | 	"github.com/DataDog/documentor/internal/ai/openai"
 19 | 	"github.com/DataDog/documentor/internal/errno"
 20 | 	"github.com/DataDog/documentor/internal/prompt"
 21 | 	"github.com/DataDog/documentor/internal/validate"
 22 | 	"github.com/urfave/cli/v2"
 23 | )
 24 | 
 25 | const (
 26 | 	// ErrEmptyDescribeInput is the error message when the describe command is
 27 | 	// invoked without any input.
 28 | 	ErrEmptyDescribeInput xerrors.Error = "missing image file to describe"
 29 | 
 30 | 	// ErrTooManyImages is the error message when the describe command is
 31 | 	// invoked with more than one input.
 32 | 	ErrTooManyImages xerrors.Error = "too many image files to describe; please provide only one"
 33 | 
 34 | 	// ErrInvalidImageType is the error message when the describe command is
 35 | 	// invoked with an invalid image file type.
 36 | 	ErrInvalidImageType xerrors.Error = "invalid image file type; please provide a PNG, JPG, JPEG, or GIF file"
 37 | 
 38 | 	// ErrInvalidProvider is the error message when the describe command is
 39 | 	// invoked with an invalid AI provider.
 40 | 	ErrInvalidProvider xerrors.Error = "invalid AI provider; please refer to the documentation for a list of valid providers"
 41 | 
 42 | 	// ErrMissingDatadogEndpoint is the error message when any command is
 43 | 	// invoked with the Datadog provider but without an endpoint.
 44 | 	ErrMissingDatadogEndpoint xerrors.Error = "missing API endpoint; please refer to the internal documentation for the correct endpoint"
 45 | )
 46 | 
 47 | // DescribeAction is the action to perform when the describe command is invoked.
 48 | func DescribeAction(ctx *cli.Context) error {
 49 | 	if ctx.Args().Len() < 1 {
 50 | 		return errno.New(errno.ExitUsage, ErrEmptyDescribeInput)
 51 | 	}
 52 | 
 53 | 	if ctx.Args().Len() > 1 {
 54 | 		return errno.New(errno.ExitUsage, ErrTooManyImages)
 55 | 	}
 56 | 
 57 | 	var (
 58 | 		key         = ctx.String("key")
 59 | 		model       = ctx.String("model")
 60 | 		provider    = ctx.String("provider")
 61 | 		endpoint    = ctx.String("endpoint")
 62 | 		context     = ctx.String("context")
 63 | 		temperature = ctx.Float64("temperature")
 64 | 		filename    = ctx.Bool("filename")
 65 | 		file        = ctx.Args().Get(0)
 66 | 		client      ai.Provider
 67 | 	)
 68 | 
 69 | 	if provider != ai.ProviderDatadog && !validate.Key(key) {
 70 | 		return errno.New(errno.ExitUnauthorized, ErrInvalidAPIKey)
 71 | 	}
 72 | 
 73 | 	if provider == ai.ProviderDatadog && endpoint == "" {
 74 | 		return errno.New(errno.ExitInvalidInput, ErrMissingDatadogEndpoint)
 75 | 	}
 76 | 
 77 | 	if !validate.Filetype(file, []string{"png", "jpg", "jpeg", "gif"}) {
 78 | 		return errno.New(errno.ExitInvalidInput, ErrInvalidImageType)
 79 | 	}
 80 | 
 81 | 	provider = strings.ToLower(provider)
 82 | 	provider = strings.TrimSpace(provider)
 83 | 
 84 | 	switch provider {
 85 | 	case ai.ProviderOpenAI:
 86 | 		client = openai.NewClient(key)
 87 | 	case ai.ProviderAnthropic:
 88 | 		client = anthropic.NewClient(key)
 89 | 
 90 | 		if model == openai.DefaultModel {
 91 | 			model = anthropic.DefaultModel
 92 | 		}
 93 | 	case ai.ProviderDatadog:
 94 | 		client = datadog.NewClient(endpoint, key)
 95 | 
 96 | 		if model == openai.DefaultModel {
 97 | 			model = datadog.DefaultModel
 98 | 		}
 99 | 	default:
100 | 		return errno.New(errno.ExitInvalidInput, ErrInvalidProvider)
101 | 	}
102 | 
103 | 	data, err := os.ReadFile(file)
104 | 	if err != nil {
105 | 		if errors.Is(err, os.ErrNotExist) {
106 | 			return errno.New(errno.ExitNotFound, err)
107 | 		}
108 | 
109 | 		if errors.Is(err, os.ErrPermission) {
110 | 			return errno.New(errno.ExitPermission, err)
111 | 		}
112 | 
113 | 		return errno.New(errno.ExitIO, err)
114 | 	}
115 | 
116 | 	userPrompt := "Please generate an SEO-optimized alt text for the attached image."
117 | 
118 | 	if filename {
119 | 		userPrompt += " Include a SEO-optimized filename as well."
120 | 	}
121 | 
122 | 	req := ai.NewRequestWithImage(data, model, context, userPrompt, prompt.DescribePrompt, float32(temperature))
123 | 
124 | 	err = client.Do(ctx, req)
125 | 	if err != nil {
126 | 		if errors.Is(err, os.ErrDeadlineExceeded) {
127 | 			return errno.New(errno.ExitTimeout, err)
128 | 		}
129 | 
130 | 		return errno.New(errno.ExitAPIError, fmt.Errorf("failed to get response: %w", err))
131 | 	}
132 | 
133 | 	return nil
134 | }
135 | 


--------------------------------------------------------------------------------
/internal/app/draft.go:
--------------------------------------------------------------------------------
  1 | // Unless explicitly stated otherwise all files in this repository are licensed
  2 | // under the Apache-2.0 License. This product includes software developed at
  3 | // Datadog (https://www.datadoghq.com/).
  4 | // Copyright 2024-Present Datadog, Inc.
  5 | 
  6 | package app
  7 | 
  8 | import (
  9 | 	"errors"
 10 | 	"fmt"
 11 | 	"os"
 12 | 	"strings"
 13 | 
 14 | 	"git.sr.ht/~jamesponddotco/xstd-go/xerrors"
 15 | 	"github.com/DataDog/documentor/internal/ai"
 16 | 	"github.com/DataDog/documentor/internal/ai/anthropic"
 17 | 	"github.com/DataDog/documentor/internal/ai/datadog"
 18 | 	"github.com/DataDog/documentor/internal/ai/openai"
 19 | 	"github.com/DataDog/documentor/internal/errno"
 20 | 	"github.com/DataDog/documentor/internal/prompt"
 21 | 	"github.com/DataDog/documentor/internal/validate"
 22 | 	"github.com/urfave/cli/v2"
 23 | )
 24 | 
 25 | const (
 26 | 	// ErrEmptyDraftInput is the error message when the draft command is
 27 | 	// invoked without any input.
 28 | 	ErrEmptyDraftInput xerrors.Error = "missing input for draft; please provide a file with your notes"
 29 | 
 30 | 	// ErrTooManyNotes is the error message when the draft command is
 31 | 	// invoked with more than one input.
 32 | 	ErrTooManyNotes xerrors.Error = "too many notes files; please provide only one"
 33 | 
 34 | 	// ErrInvalidFiletype is the error message when the draft command is
 35 | 	// invoked with a file that is not a text file.
 36 | 	ErrInvalidFiletype xerrors.Error = "invalid filetype; please provide a TXT or MD file"
 37 | )
 38 | 
 39 | // DraftAction is the action to perform when the draft command is invoked.
 40 | func DraftAction(ctx *cli.Context) error {
 41 | 	if ctx.Args().Len() < 1 {
 42 | 		return errno.New(errno.ExitUsage, ErrEmptyDraftInput)
 43 | 	}
 44 | 
 45 | 	if ctx.Args().Len() > 1 {
 46 | 		return errno.New(errno.ExitUsage, ErrTooManyNotes)
 47 | 	}
 48 | 
 49 | 	var (
 50 | 		key         = ctx.String("key")
 51 | 		model       = ctx.String("model")
 52 | 		provider    = ctx.String("provider")
 53 | 		endpoint    = ctx.String("endpoint")
 54 | 		temperature = ctx.Float64("temperature")
 55 | 		file        = ctx.Args().Get(0)
 56 | 		client      ai.Provider
 57 | 	)
 58 | 
 59 | 	if provider != ai.ProviderDatadog && !validate.Key(key) {
 60 | 		return errno.New(errno.ExitUnauthorized, ErrInvalidAPIKey)
 61 | 	}
 62 | 
 63 | 	if provider == ai.ProviderDatadog && endpoint == "" {
 64 | 		return errno.New(errno.ExitInvalidInput, ErrMissingDatadogEndpoint)
 65 | 	}
 66 | 
 67 | 	if !validate.Filetype(file, []string{"txt", "md"}) {
 68 | 		return errno.New(errno.ExitInvalidInput, ErrInvalidFiletype)
 69 | 	}
 70 | 
 71 | 	provider = strings.ToLower(provider)
 72 | 	provider = strings.TrimSpace(provider)
 73 | 
 74 | 	switch provider {
 75 | 	case ai.ProviderOpenAI:
 76 | 		client = openai.NewClient(key)
 77 | 	case ai.ProviderAnthropic:
 78 | 		client = anthropic.NewClient(key)
 79 | 
 80 | 		if model == openai.DefaultModel {
 81 | 			model = anthropic.DefaultModel
 82 | 		}
 83 | 	case ai.ProviderDatadog:
 84 | 		client = datadog.NewClient(endpoint, key)
 85 | 
 86 | 		if model == openai.DefaultModel {
 87 | 			model = datadog.DefaultModel
 88 | 		}
 89 | 	default:
 90 | 		return errno.New(errno.ExitInvalidInput, ErrInvalidProvider)
 91 | 	}
 92 | 
 93 | 	data, err := os.ReadFile(file)
 94 | 	if err != nil {
 95 | 		if errors.Is(err, os.ErrNotExist) {
 96 | 			return errno.New(errno.ExitNotFound, err)
 97 | 		}
 98 | 
 99 | 		if errors.Is(err, os.ErrPermission) {
100 | 			return errno.New(errno.ExitPermission, err)
101 | 		}
102 | 
103 | 		return errno.New(errno.ExitIO, err)
104 | 	}
105 | 
106 | 	var (
107 | 		userPrompt = "Please write a new technical document based on the notes " +
108 | 			"provided. It's very important that I get a good answer as I'm " +
109 | 			"under a LOT of stress at work. I'll tip $500 if you can help me " +
110 | 			"out. Thanks!"
111 | 		req = ai.NewRequest(data, model, userPrompt, prompt.DraftPrompt, float32(temperature))
112 | 	)
113 | 
114 | 	err = client.Do(ctx, req)
115 | 	if err != nil {
116 | 		if errors.Is(err, os.ErrDeadlineExceeded) {
117 | 			return errno.New(errno.ExitTimeout, err)
118 | 		}
119 | 
120 | 		return errno.New(errno.ExitAPIError, fmt.Errorf("failed to get response: %w", err))
121 | 	}
122 | 
123 | 	return nil
124 | }
125 | 


--------------------------------------------------------------------------------
/internal/app/review.go:
--------------------------------------------------------------------------------
  1 | // Unless explicitly stated otherwise all files in this repository are licensed
  2 | // under the Apache-2.0 License. This product includes software developed at
  3 | // Datadog (https://www.datadoghq.com/).
  4 | // Copyright 2024-Present Datadog, Inc.
  5 | 
  6 | package app
  7 | 
  8 | import (
  9 | 	"errors"
 10 | 	"fmt"
 11 | 	"os"
 12 | 	"strings"
 13 | 
 14 | 	"git.sr.ht/~jamesponddotco/xstd-go/xerrors"
 15 | 	"github.com/DataDog/documentor/internal/ai"
 16 | 	"github.com/DataDog/documentor/internal/ai/anthropic"
 17 | 	"github.com/DataDog/documentor/internal/ai/datadog"
 18 | 	"github.com/DataDog/documentor/internal/ai/openai"
 19 | 	"github.com/DataDog/documentor/internal/errno"
 20 | 	"github.com/DataDog/documentor/internal/prompt"
 21 | 	"github.com/DataDog/documentor/internal/validate"
 22 | 	"github.com/urfave/cli/v2"
 23 | )
 24 | 
 25 | const (
 26 | 	// ErrEmptyInput is returned when no file is provided by the user.
 27 | 	ErrEmptyInput xerrors.Error = "missing file to review"
 28 | 
 29 | 	// ErrInvalidAPIKey is returned when the user does not provide an API key
 30 | 	// for the given provider or provides an invalid one.
 31 | 	ErrInvalidAPIKey xerrors.Error = "missing or invalid API key"
 32 | 
 33 | 	// ErrTooMuchInput is returned when the user provides more than one file.
 34 | 	ErrTooMuchInput xerrors.Error = "too many files to review; please provide only one file"
 35 | )
 36 | 
 37 | // ReviewAction is the main action for the application.
 38 | func ReviewAction(ctx *cli.Context) error {
 39 | 	if ctx.Args().Len() < 1 {
 40 | 		return errno.New(errno.ExitUsage, ErrEmptyInput)
 41 | 	}
 42 | 
 43 | 	if ctx.Args().Len() > 1 {
 44 | 		return errno.New(errno.ExitUsage, ErrTooMuchInput)
 45 | 	}
 46 | 
 47 | 	var (
 48 | 		key         = ctx.String("key")
 49 | 		model       = ctx.String("model")
 50 | 		provider    = ctx.String("provider")
 51 | 		endpoint    = ctx.String("endpoint")
 52 | 		temperature = ctx.Float64("temperature")
 53 | 		file        = ctx.Args().Get(0)
 54 | 		client      ai.Provider
 55 | 	)
 56 | 
 57 | 	if provider != ai.ProviderDatadog && !validate.Key(key) {
 58 | 		return errno.New(errno.ExitUnauthorized, ErrInvalidAPIKey)
 59 | 	}
 60 | 
 61 | 	if provider == ai.ProviderDatadog && endpoint == "" {
 62 | 		return errno.New(errno.ExitInvalidInput, ErrMissingDatadogEndpoint)
 63 | 	}
 64 | 
 65 | 	if !validate.Filetype(file, []string{"txt", "md"}) {
 66 | 		return errno.New(errno.ExitInvalidInput, ErrInvalidFiletype)
 67 | 	}
 68 | 
 69 | 	provider = strings.ToLower(provider)
 70 | 	provider = strings.TrimSpace(provider)
 71 | 
 72 | 	switch provider {
 73 | 	case ai.ProviderOpenAI:
 74 | 		client = openai.NewClient(key)
 75 | 	case ai.ProviderAnthropic:
 76 | 		client = anthropic.NewClient(key)
 77 | 
 78 | 		if model == openai.DefaultModel {
 79 | 			model = anthropic.DefaultModel
 80 | 		}
 81 | 	case ai.ProviderDatadog:
 82 | 		client = datadog.NewClient(endpoint, key)
 83 | 
 84 | 		if model == openai.DefaultModel {
 85 | 			model = datadog.DefaultModel
 86 | 		}
 87 | 	default:
 88 | 		return errno.New(errno.ExitInvalidInput, ErrInvalidProvider)
 89 | 	}
 90 | 
 91 | 	data, err := os.ReadFile(file)
 92 | 	if err != nil {
 93 | 		if errors.Is(err, os.ErrNotExist) {
 94 | 			return errno.New(errno.ExitNotFound, err)
 95 | 		}
 96 | 
 97 | 		if errors.Is(err, os.ErrPermission) {
 98 | 			return errno.New(errno.ExitPermission, err)
 99 | 		}
100 | 
101 | 		return errno.New(errno.ExitIO, err)
102 | 	}
103 | 
104 | 	var (
105 | 		userPrompt = "Please review the following content. It's very " +
106 | 			"important that I get a good answer as I'm under a LOT of " +
107 | 			"stress at work. I'll tip $500 if you can help me."
108 | 		req = ai.NewRequest(data, model, userPrompt, prompt.MarkdownPrompt, float32(temperature))
109 | 	)
110 | 
111 | 	err = client.Do(ctx, req)
112 | 	if err != nil {
113 | 		if errors.Is(err, os.ErrDeadlineExceeded) {
114 | 			return errno.New(errno.ExitTimeout, err)
115 | 		}
116 | 
117 | 		return errno.New(errno.ExitAPIError, fmt.Errorf("failed to get response: %w", err))
118 | 	}
119 | 
120 | 	return nil
121 | }
122 | 


--------------------------------------------------------------------------------
/internal/errno/errno.go:
--------------------------------------------------------------------------------
 1 | // Unless explicitly stated otherwise all files in this repository are licensed
 2 | // under the Apache-2.0 License. This product includes software developed at
 3 | // Datadog (https://www.datadoghq.com/).
 4 | // Copyright 2024-Present Datadog, Inc.
 5 | 
 6 | // Package errno provides a way to handle errors with exit codes.
 7 | package errno
 8 | 
 9 | // Exit codes for errors.
10 | const (
11 | 	// ExitOK is the exit code for a successful operation.
12 | 	ExitOK uint8 = iota
13 | 
14 | 	// ExitError is the exit code for a generic error.
15 | 	ExitError
16 | 
17 | 	// ExitUsage is the exit code for an incorrect usage of a command.
18 | 	ExitUsage
19 | 
20 | 	// ExitIO is the exit code for an I/O error.
21 | 	ExitIO
22 | 
23 | 	// ExitNotFound is the exit code for a file not found error.
24 | 	ExitNotFound
25 | 
26 | 	// ExitPermission is the exit code for an I/O permission denied error.
27 | 	ExitPermission
28 | 
29 | 	// ExitAPIError is the exit code for errors related to API requests.
30 | 	ExitAPIError
31 | 
32 | 	// ExitUnauthorized is the exit code for unauthorized requests to the OpenAI
33 | 	// API.
34 | 	ExitUnauthorized
35 | 
36 | 	// ExitTimeout is the exit code for timeout errors.
37 | 	ExitTimeout
38 | 
39 | 	// ExitInvalidInput is the exit code for invalid input errors.
40 | 	ExitInvalidInput
41 | )
42 | 
43 | // Error is an error with an exit code.
44 | type Error struct {
45 | 	// Err is the underlying error that caused this error.
46 | 	Err error
47 | 
48 | 	// No is the machine-readable exit code.
49 | 	No uint8
50 | }
51 | 
52 | // Error implements the error interface for Error.
53 | func (e *Error) Error() string {
54 | 	if e.Err != nil {
55 | 		return e.Err.Error()
56 | 	}
57 | 
58 | 	return "unknown error"
59 | }
60 | 
61 | // Unwrap returns the underlying error.
62 | func (e *Error) Unwrap() error {
63 | 	return e.Err
64 | }
65 | 
66 | // Code returns the exit code of the error as an integer.
67 | func (e *Error) Code() int {
68 | 	return int(e.No)
69 | }
70 | 
71 | // New creates a new Error with the given exit code and error.
72 | func New(code uint8, err error) *Error {
73 | 	return &Error{
74 | 		No:  code,
75 | 		Err: err,
76 | 	}
77 | }
78 | 


--------------------------------------------------------------------------------
/internal/errno/errno_test.go:
--------------------------------------------------------------------------------
  1 | // Unless explicitly stated otherwise all files in this repository are licensed
  2 | // under the Apache-2.0 License. This product includes software developed at
  3 | // Datadog (https://www.datadoghq.com/).
  4 | // Copyright 2024-Present Datadog, Inc.
  5 | 
  6 | package errno_test
  7 | 
  8 | import (
  9 | 	"errors"
 10 | 	"testing"
 11 | 
 12 | 	"git.sr.ht/~jamesponddotco/xstd-go/xerrors"
 13 | 	"github.com/DataDog/documentor/internal/errno"
 14 | )
 15 | 
 16 | const ErrGenericError xerrors.Error = "failure"
 17 | 
 18 | func TestError_Error(t *testing.T) {
 19 | 	t.Parallel()
 20 | 
 21 | 	tests := []struct {
 22 | 		name string
 23 | 		err  error
 24 | 		want string
 25 | 	}{
 26 | 		{
 27 | 			name: "With underlying error",
 28 | 			err:  ErrGenericError,
 29 | 			want: "failure",
 30 | 		},
 31 | 		{
 32 | 			name: "With nil underlying error",
 33 | 			err:  nil,
 34 | 			want: "unknown error",
 35 | 		},
 36 | 	}
 37 | 
 38 | 	for _, tt := range tests {
 39 | 		t.Run(tt.name, func(t *testing.T) {
 40 | 			t.Parallel()
 41 | 
 42 | 			err := errno.Error{
 43 | 				Err: tt.err,
 44 | 			}
 45 | 
 46 | 			if got := err.Error(); got != tt.want {
 47 | 				t.Errorf("Error.Error() = %q, want %q", got, tt.want)
 48 | 			}
 49 | 		})
 50 | 	}
 51 | }
 52 | 
 53 | func TestError_Unwrap(t *testing.T) {
 54 | 	t.Parallel()
 55 | 
 56 | 	tests := []struct {
 57 | 		name string
 58 | 		err  error
 59 | 		want error
 60 | 	}{
 61 | 		{
 62 | 			name: "With underlying error",
 63 | 			err:  ErrGenericError,
 64 | 			want: ErrGenericError,
 65 | 		},
 66 | 		{
 67 | 			name: "With nil underlying error",
 68 | 			err:  nil,
 69 | 			want: nil,
 70 | 		},
 71 | 	}
 72 | 
 73 | 	for _, tt := range tests {
 74 | 		t.Run(tt.name, func(t *testing.T) {
 75 | 			t.Parallel()
 76 | 
 77 | 			err := errno.Error{
 78 | 				Err: tt.err,
 79 | 			}
 80 | 
 81 | 			if got := err.Unwrap(); !errors.Is(got, tt.want) {
 82 | 				t.Errorf("Error.Unwrap() = %v, want %v", got, tt.want)
 83 | 			}
 84 | 		})
 85 | 	}
 86 | }
 87 | 
 88 | func TestError_Code(t *testing.T) {
 89 | 	t.Parallel()
 90 | 
 91 | 	tests := []struct {
 92 | 		name string
 93 | 		no   uint8
 94 | 		want int
 95 | 	}{
 96 | 		{
 97 | 			name: "ExitOK",
 98 | 			no:   errno.ExitOK,
 99 | 			want: 0,
100 | 		},
101 | 		{
102 | 			name: "ExitError",
103 | 			no:   errno.ExitError,
104 | 			want: 1,
105 | 		},
106 | 	}
107 | 
108 | 	for _, tt := range tests {
109 | 		t.Run(tt.name, func(t *testing.T) {
110 | 			t.Parallel()
111 | 
112 | 			err := errno.Error{
113 | 				No: tt.no,
114 | 			}
115 | 
116 | 			if got := err.Code(); got != tt.want {
117 | 				t.Errorf("Error.Code() = %d, want %d", got, tt.want)
118 | 			}
119 | 		})
120 | 	}
121 | }
122 | 
123 | func TestNew(t *testing.T) {
124 | 	t.Parallel()
125 | 
126 | 	tests := []struct {
127 | 		name     string
128 | 		code     uint8
129 | 		err      error
130 | 		wantCode int
131 | 		wantErr  error
132 | 	}{
133 | 		{
134 | 			name:     "With nil error",
135 | 			code:     errno.ExitError,
136 | 			err:      nil,
137 | 			wantCode: 1,
138 | 			wantErr:  nil,
139 | 		},
140 | 		{
141 | 			name:     "With non-nil error",
142 | 			code:     errno.ExitError,
143 | 			err:      ErrGenericError,
144 | 			wantCode: 1,
145 | 			wantErr:  ErrGenericError,
146 | 		},
147 | 	}
148 | 
149 | 	for _, tt := range tests {
150 | 		t.Run(tt.name, func(t *testing.T) {
151 | 			t.Parallel()
152 | 
153 | 			got := errno.New(tt.code, tt.err)
154 | 
155 | 			if got.Code() != tt.wantCode || !errors.Is(got.Unwrap(), tt.wantErr) {
156 | 				t.Errorf("New(%d, %v) = {Code: %d, Err: %v}, want {Code: %d, Err: %v}", tt.code, tt.err, got.Code(), got.Unwrap(), tt.wantCode, tt.wantErr)
157 | 			}
158 | 		})
159 | 	}
160 | }
161 | 


--------------------------------------------------------------------------------
/internal/meta/meta.go:
--------------------------------------------------------------------------------
 1 | // Unless explicitly stated otherwise all files in this repository are licensed
 2 | // under the Apache-2.0 License. This product includes software developed at
 3 | // Datadog (https://www.datadoghq.com/).
 4 | // Copyright 2024-Present Datadog, Inc.
 5 | 
 6 | // Package meta provides build information and other metadata for the
 7 | // application.
 8 | package meta
 9 | 
10 | const (
11 | 	// Name is the name of the application.
12 | 	Name = "documentor"
13 | 
14 | 	// Version is the version of the application.
15 | 	Version = "1.2.0"
16 | 
17 | 	// Description is the description of the application.
18 | 	Description = "improve technical documentation with the power of AI"
19 | )
20 | 


--------------------------------------------------------------------------------
/internal/prompt/data/describe-prompt.txt:
--------------------------------------------------------------------------------
 1 | You are to adopt the expertise of Joost de Valk, a renowned SEO and digital marketing expert. Your task is to analyze the following image and generate a concise, SEO-optimized alt tag. Think step by step, and consider the image's content, context, and relevance to potential keywords. Use your expertise to identify key elements in the image that are important for SEO and describe them in a way that is both informative and accessible. It's very important to the user that you generate a great description, as they're under a lot of stress at work.
 2 | 
 3 | Consider the following guidelines while analyzing the image:
 4 | 
 5 | - Identify the main subject or focus of the image.
 6 | - Note any important details that contribute to the overall context.
 7 | - Consider the potential keywords that users might search for related to the image.
 8 | 
 9 | When writing the alt tag, follow these best practices:
10 | 
11 | - Keep the alt tag concise, ideally between 5 to 15 words.
12 | - Include relevant keywords naturally, without keyword stuffing.
13 | - Describe the image accurately and specifically.
14 | - Focus on the most important elements of the image.
15 | - Use proper grammar and punctuation.
16 | - Use standard English language conventions.
17 | - Avoid starting with phrases like "A picture of" or "An image of."
18 | 
19 | Please generate an alt tag that improves the image's SEO performance. Remember, your goal is to maximize the image's
20 | visibility and relevance in web searches, while maintaining a natural and accurate description. Don't output anything
21 | else, just the value to the alt tag field. Do not use quotes and use a final period, just like the examples below.
22 | 
23 | Examples:
24 | 1. A vibrant sunset over a tranquil lake with silhouettes of pine trees in the foreground.
25 | 2. A bustling city street at night with illuminated skyscrapers.
26 | 3. Close-up of a colorful macaw perched on a tree branch in the rainforest.
27 | 4. Freshly baked croissants on a rustic wooden table, with soft morning light.
28 | 
29 | If the user requests a filename as well, you should generate a SEO-optimized filename. Only output the file IF the user requests it, otherwise ignore it.
30 | 
31 | When generating the filename, follow these best practices:
32 | 
33 | - Use lowercase letters only.
34 | - Replace spaces with hyphens.
35 | - Remove special characters and symbols.
36 | - Keep the filename concise and descriptive.
37 | - Include relevant keywords naturally.
38 | - Ensure the filename is URL-safe.
39 | - Do not include the file extension (e.g., .jpg, .png).
40 | 
41 | Example filenames:
42 | 
43 | - vibrant-sunset-lake-pine-trees
44 | - bustling-city-street-night-skyscrapers
45 | - colorful-macaw-rainforest-branch
46 | - freshly-baked-croissants-morning-light
47 | 
48 | If the user requested a filename, output it after the alt tag. If the user did not request a filename, only output the alt tag.
49 | 
50 | Example output if the user didn't request a filename:
51 | 
52 | A vibrant sunset over a tranquil lake with silhouettes of pine trees in the foreground.
53 | 
54 | Example output if the user requested a filename:
55 | 
56 | A vibrant sunset over a tranquil lake with silhouettes of pine trees in the foreground.
57 | vibrant-sunset-lake-pine-trees
58 | 
59 | A beautiful, serene landscape with a calm lake reflecting the sky and mountains in the background.
60 | beautiful-serene-landscape-calm-lake-sky-mountains
61 | 
62 | A close-up of a colorful macaw perched on a tree branch in the rainforest.
63 | close-up-colorful-macaw-tree-branch-rainforest
64 | 


--------------------------------------------------------------------------------
/internal/prompt/data/draft-prompt.txt:
--------------------------------------------------------------------------------
   1 | You are an expert technical documentation writer currently employed at Datadog. Your task is to transform user-provided notes into clear, concise, and accurate technical documentation that adheres to Datadog's high standards of quality and clarify. Your must strictly adhere to the provided style guide in both the Vale configuration format and Markdown format.
   2 | 
   3 | First, carefully review the style guides.
   4 | 
   5 | Here is the style guide in Vale configuration YAML format:
   6 | 
   7 | ```
   8 | CWS-Descriptions/agent.yml
   9 | extends: substitution
  10 | message: Refer to the 'Datadog %s' instead of the 'Datadog %s'
  11 | level: error
  12 | ignorecase: false
  13 | swap:
  14 |   agent: Agent
  15 | ----
  16 | CWS-Names/namecase.yml
  17 | extends: capitalization
  18 | message: Rule names should use sentence case
  19 | level: error
  20 | match: $sentence
  21 | exceptions:
  22 |   - OverlayFS
  23 |   - DNS
  24 |   - TXT
  25 |   - Kubernetes
  26 | ----
  27 | CWS-Names/namelength.yml
  28 | extends: occurrence
  29 | message: Rule names should not be longer than 10 words
  30 | level: error
  31 | ignorecase: false
  32 | max: 10
  33 | token: (\w+)
  34 | ----
  35 | CWS-Names/namenewvalue.yml
  36 | extends: substitution
  37 | message: New Value rules should use '%s' instead of '%s'
  38 | level: error
  39 | ignorecase: true
  40 | swap:
  41 |   unrecognized: unfamiliar
  42 |   unusual: unfamiliar
  43 |   new: unfamiliar
  44 | ----
  45 | CWS-Names/namestart.yml
  46 | extends: existence
  47 | message: Rule names should not start with '%s'
  48 | level: error
  49 | ignorecase: false
  50 | tokens:
  51 |   - A
  52 |   - An
  53 |   - The
  54 | ----
  55 | CWS-Names/nameweak.yml
  56 | extends: existence
  57 | message: Rule names should avoid weak works like '%s'
  58 | level: error
  59 | ignorecase: true
  60 | link: https://developers.google.com/tech-writing/one/clear-sentences
  61 | tokens:
  62 |   - was
  63 |   - were
  64 |   - is
  65 |   - are
  66 | 
  67 | ----
  68 | Datadog/Trademarks.yml
  69 | extends: existence
  70 | message: Missing ™ on phrase '%s'
  71 | link: https://www.datadoghq.com
  72 | ignorecase: true
  73 | level: error
  74 | nonword: true
  75 | 
  76 | # phrases that don't start with * and don't end with tm or \* should be fixed
  77 | # this covers
  78 | # \*Logging without Limits is a trademark of Datadog, Inc.
  79 | # *Logging without Limits is a trademark of Datadog, Inc.
  80 | # Logging without Limits*
  81 | # Logging without Limits\*
  82 | # Logging without Limits™
  83 | tokens:
  84 |   - '(?<!\*)Logging without Limits(?!\s*(\™|\\\*|\*))'
  85 |   - '(?<!\*)Tracing without Limits(?!\s*(\™|\\\*|\*))'
  86 |   - '(?<!\*)Metrics without Limits(?!\s*(\™|\\\*|\*))'
  87 |   - '(?<!\*)Log Rehydration(?!\s*(\™|\\\*|\*))'
  88 | 
  89 | ----
  90 | Datadog/abbreviations.yml
  91 | extends: substitution
  92 | message: "Use '%s' instead of abbreviations like '%s'."
  93 | link: "https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#abbreviations"
  94 | ignorecase: true
  95 | level: warning
  96 | nonword: true
  97 | action:
  98 |   name: replace
  99 | swap:
 100 |   '\b(?:eg|e\.g\.|eg\.)[\s,]': for example
 101 |   '\b(?:ie|i\.e\.|ie\.)[\s,]': that is
 102 | 
 103 | ----
 104 | Datadog/americanspelling.yml
 105 | extends: existence
 106 | message: "In general, use American spelling instead of '%s'."
 107 | link: 'https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md'
 108 | ignorecase: true
 109 | level: warning
 110 | tokens:
 111 |   - '(?:\w+)nised'
 112 |   - '(?:\w+)ise'
 113 |   - '(?:\w+)logue'
 114 |   - '(?:\w+)lour'
 115 |   - '(?:\w+)lyse'
 116 |   - '[a-zA-Z]{2,}our(?:\b|s|ed|ing)'
 117 | exceptions:
 118 | # *ise endings
 119 |   - (?:A|a)dvertise
 120 |   - (?:A|a)dvise
 121 |   - (?:A|a)ppraise
 122 |   - (?:A|a)pprise
 123 |   - (?:A|a)rise
 124 |   - (?:C|c)hastise
 125 |   - (?:C|c)ircumcise
 126 |   - (?:C|c)lockwise
 127 |   - (?:C|c)omprise
 128 |   - (?:C|c)ompromise
 129 |   - (?:C|c)oncise
 130 |   - (?:C|c)ounterclockwise
 131 |   - (?:D|d)emise
 132 |   - (?:D|d)espise
 133 |   - (?:D|d)evise
 134 |   - (?:D|d)isguise
 135 |   - (?:E|e)nterprise
 136 |   - (?:E|e)xcise
 137 |   - (?:E|e)xercise
 138 |   - (?:E|e)xpertise
 139 |   - (?:F|f)ranchise
 140 |   - (?:I|i)mprecise
 141 |   - (?:I|i)mprovise
 142 |   - (?:I|i)ncise
 143 |   - (?:L|l)ikewise
 144 |   - (?:M|m)erchandise
 145 |   - (?:N|n)oise
 146 |   - (?:O|o)therwise
 147 |   - (?:P|p)aradise
 148 |   - (?:P|p)oise
 149 |   - (?:P|p)raise
 150 |   - (?:P|p)recise
 151 |   - (?:P|p)remise
 152 |   - (?:P|p)romise
 153 |   - (?:R|r)evise
 154 |   - (?:R|r)ise
 155 |   - (?:S|s)upervise
 156 |   - (?:S|s)urmise
 157 |   - (?:S|s)urprise
 158 |   - (?:T|t)elevise
 159 |   - (?:W|w)ise
 160 | 
 161 | # *our* words
 162 |   - (?:d|D)etours?
 163 |   - (?:c|C)ontours?
 164 |   - (?:g|G)lamour
 165 |   - (?:o|O)utpour
 166 |   - (?:s|S)cours?
 167 |   - (?:t|T)roubadours?
 168 |   - (?:p|P)ompadour
 169 | ----
 170 | Datadog/autodiscovery.yml
 171 | extends: substitution
 172 | message: "Use %s (the former, to refer to Datadog's mechanism for applying integration configurations to containers; the latter, to refer to automatic discovery IN GENERAL) instead of '%s'."
 173 | link: 'https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#words-and-phrases'
 174 | ignorecase: false
 175 | level: warning
 176 | action:
 177 |   name: replace
 178 | swap:
 179 |   - (?:autodiscovery|auto-discovery|Auto-discovery): Autodiscovery|automatic detection
 180 |   - (?:autodiscover|auto-discover|Auto-discover): Autodiscover|automatically detect
 181 |   - (?:autodiscovered|auto-discovered|Auto-discovered): Autodiscovered|automatically detected
 182 | 
 183 | ----
 184 | Datadog/dashes.yml
 185 | extends: existence
 186 | message: "Don't put a space before or after a dash."
 187 | link: "https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#dashes"
 188 | nonword: true
 189 | level: warning
 190 | action:
 191 |   name: edit
 192 |   params:
 193 |     - remove
 194 |     - ' '
 195 | tokens:
 196 |   - '\s[—–]\s'
 197 | 
 198 | ----
 199 | Datadog/endash.yml
 200 | extends: existence
 201 | message: "Avoid en dashes ('–'). For hyphenated words, use a hyphen ('-').\nFor parenthesis, use an em dash ('—')."
 202 | link: "https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#dashes"
 203 | nonword: true
 204 | level: error
 205 | action:
 206 |   name: edit
 207 |   params:
 208 |     - replace
 209 |     - '-'
 210 |     - '—'
 211 | tokens:
 212 |   - '–'
 213 | 
 214 | ----
 215 | Datadog/gender.yml
 216 | extends: existence
 217 | message: "Use a gender-neutral pronoun instead of '%s'."
 218 | link: "https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#gender"
 219 | level: error
 220 | ignorecase: true
 221 | tokens:
 222 |   - he/she
 223 |   - s/he
 224 |   - \(s\)he
 225 |   - \bhe\b
 226 |   - \bhim\b
 227 |   - \bhis\b
 228 |   - \bshe\b
 229 |   - \bher\b
 230 | 
 231 | ----
 232 | Datadog/headings.yml
 233 | extends: capitalization
 234 | message: "'%s' should use sentence-style capitalization."
 235 | link: "https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#headers"
 236 | level: warning
 237 | scope: heading
 238 | match: $sentence
 239 | exceptions:
 240 |   - ACLs
 241 |   - ActiveMQ XML Integration
 242 |   - Agent
 243 |   - Agentless
 244 |   - Agents
 245 |   - Airflow
 246 |   - Amazon
 247 |   - Amazon Web Services
 248 |   - APCu
 249 |   - APIs
 250 |   - APM
 251 |   - Application Performance Monitoring
 252 |   - APM & Continuous Profiler
 253 |   - App Analytics
 254 |   - App Service
 255 |   - AppVeyor
 256 |   - Application Security Management
 257 |   - Application Vulnerability Management
 258 |   - AuthN
 259 |   - Autodiscovery
 260 |   - AWS Step Functions
 261 |   - AWS Systems Manager
 262 |   - Azure
 263 |   - Azure App Service
 264 |   - Azure App Service Plan
 265 |   - Azure Blob Storage
 266 |   - Azure Event Hub
 267 |   - Audit Trail
 268 |   - BitBucket
 269 |   - BuildKite
 270 |   - Browser Monitoring
 271 |   - CakePHP
 272 |   - Cassandra Nodetool
 273 |   - Cassandra Nodetool Integration
 274 |   - CentOS
 275 |   - Chef
 276 |   - CircleCI
 277 |   - CI/CD
 278 |   - CI Visibility
 279 |   - Clipboard
 280 |   - Cloud Cost Management
 281 |   - Cloud Pub Sub
 282 |   - Cloud Security Management
 283 |   - Cloud Security Posture Management
 284 |   - Cloud SIEM
 285 |   - Cloud Workload Security
 286 |   - CloudFormation
 287 |   - CloudSQL
 288 |   - CloudTrail
 289 |   - CloudWatch
 290 |   - Cluster Agent
 291 |   - Continuous Profiler
 292 |   - Continuous Testing
 293 |   - DaemonSet
 294 |   - Data Collected
 295 |   - Database Monitoring
 296 |   - Datadog
 297 |   - DatadogMetric
 298 |   - Datadog Agent Manager
 299 |   - Datadog for Government
 300 |   - Datadog Forwarder
 301 |   - Datadog Lambda Extension
 302 |   - Datadog Operator
 303 |   - Datadog Plugin
 304 |   - Datadog Watchdog
 305 |   - DatadogHook
 306 |   - Debian
 307 |   - Detection Rules
 308 |   - Docker
 309 |   - Docker Compose
 310 |   - Docker Swarm
 311 |   - Dockerfile
 312 |   - DogStatsD
 313 |   - Envoy
 314 |   - Fargate
 315 |   - FastCGI
 316 |   - Firehose Nozzle
 317 |   - FireLens
 318 |   - Fluent Bit
 319 |   - Fluentd
 320 |   - FreeBSD
 321 |   - FreeSwitch
 322 |   - Further Reading
 323 |   - GeoIP
 324 |   - Git
 325 |   - GitHub
 326 |   - GitHub Actions
 327 |   - GitLab
 328 |   - GitLab Runner Integration
 329 |   - Google
 330 |   - Google Analytics
 331 |   - Google Cloud
 332 |   - Google Cloud Functions
 333 |   - GraphQL
 334 |   - Gunicorn
 335 |   - HAProxy
 336 |   - HBase RegionServer Integration
 337 |   - HDFS DataNode Integration
 338 |   - HDFS NameNode Integration
 339 |   - Helm
 340 |   - Heroku
 341 |   - HipChat
 342 |   - HostPort
 343 |   - I
 344 |   - IdP
 345 |   - IDs
 346 |   - iLert
 347 |   - Incident Management
 348 |   - Infrastructure Monitoring
 349 |   - Ingress Controller
 350 |   - Internet Information Services
 351 |   - IoT
 352 |   - IPs
 353 |   - Java
 354 |   - JavaScript
 355 |   - JBoss
 356 |   - Jenkins
 357 |   - JFrog
 358 |   - JFrog Artifactory
 359 |   - Jira
 360 |   - JMXFetch
 361 |   - Journald
 362 |   - Kafka
 363 |   - Kafka Consumer Integration
 364 |   - Kubernetes
 365 |   - Kubernetes Engine
 366 |   - Kubernetes Pod
 367 |   - Kubernetes Service
 368 |   - Lambda
 369 |   - Lambda Layer
 370 |   - Lambda@Edge
 371 |   - LaunchDarkly
 372 |   - Linux
 373 |   - Live Analytics
 374 |   - Live Search
 375 |   - Live Tail
 376 |   - Log Explorer
 377 |   - Log Management
 378 |   - Log Rehydration
 379 |   - Logback
 380 |   - macOS
 381 |   - Marketplace
 382 |   - MarkLogic
 383 |   - Meraki
 384 |   - Mesos Slave Integration
 385 |   - Metrics Explorer
 386 |   - Metrics without Limits
 387 |   - Mobile Monitoring
 388 |   - MongoDB
 389 |   - MsTest
 390 |   - MySQL
 391 |   - Network Address Translation
 392 |   - Network Device Monitoring
 393 |   - Network Performance Monitoring
 394 |   - New Relic
 395 |   - NGINX Plus
 396 |   - NixOS
 397 |   - Node
 398 |   - Notebook
 399 |   - Notebook List
 400 |   - npm
 401 |   - NXLog
 402 |   - Observability Pipelines
 403 |   - OkHttp
 404 |   - OneLogin
 405 |   - OPcache
 406 |   - OpenLDAP
 407 |   - OpenMetrics
 408 |   - OpenShift
 409 |   - OpenStack
 410 |   - openSUSE
 411 |   - OpenTelemetry
 412 |   - OpenTracing
 413 |   - OpenVPN
 414 |   - OpsGenie
 415 |   - OpsWorks
 416 |   - Oracle Instant Client
 417 |   - Phusion Passenger
 418 |   - Pipeline Visibility
 419 |   - Pivotal Platform
 420 |   - Postgres
 421 |   - PostgreSQL
 422 |   - PowerDNS
 423 |   - Prometheus
 424 |   - Prometheus Alertmanager
 425 |   - Puppet
 426 |   - Python
 427 |   - RabbitMQ
 428 |   - Rails
 429 |   - Rancher
 430 |   - Real User Monitoring
 431 |   - Red Hat
 432 |   - Redis
 433 |   - ReplicaSet
 434 |   - RocketPants
 435 |   - Roku Monitoring
 436 |   - Root Cause Analysis
 437 |   - Route53
 438 |   - RSpec
 439 |   - Ruby
 440 |   - RUM
 441 |   - RumMonitor
 442 |   - SafeNet
 443 |   - SaltStack
 444 |   - Security Monitoring
 445 |   - Security Signal
 446 |   - Security Signals
 447 |   - SELinux
 448 |   - Sensitive Data Scanner
 449 |   - Serverless APM
 450 |   - Serverless Framework
 451 |   - Serverless Monitoring
 452 |   - Serverless Workload Monitoring
 453 |   - Service Checks
 454 |   - Session Replay
 455 |   - Siri
 456 |   - Slack
 457 |   - SLIs
 458 |   - SLOs
 459 |   - socat
 460 |   - Social Security
 461 |   - SQL Server
 462 |   - SQLDelight
 463 |   - SQLite
 464 |   - Stackdriver
 465 |   - StackPulse
 466 |   - StackStorm
 467 |   - StatsD
 468 |   - Sumo Logic
 469 |   - Swift
 470 |   - Synthetic Monitoring
 471 |   - Syslog
 472 |   - sysOID
 473 |   - System Core
 474 |   - System Swap
 475 |   - Teamcity
 476 |   - Terraform
 477 |   - Testing Visibility
 478 |   - TokuMX
 479 |   - Tracing Without Limits
 480 |   - Trello
 481 |   - Twilio
 482 |   - TypeScript
 483 |   - Ubuntu
 484 |   - Unified Service Tagging
 485 |   - Unix
 486 |   - Unix Domain Socket
 487 |   - URLs
 488 |   - User Datagram Protocol
 489 |   - USM
 490 |   - Universal Service Monitoring
 491 |   - Varnish
 492 |   - Vector
 493 |   - Vertica
 494 |   - VMWare
 495 |   - vSphere
 496 |   - Watchdog
 497 |   - Watchdog Insights
 498 |   - Webhook
 499 |   - WildFly
 500 |   - Windows
 501 |   - Xray
 502 |   - ZooKeeper
 503 | 
 504 | ----
 505 | Datadog/inclusive.yml
 506 | extends: substitution
 507 | message: "Use '%s' instead of '%s'."
 508 | link: "https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#inclusive-language"
 509 | ignorecase: true
 510 | level: error
 511 | action:
 512 |   name: replace
 513 | swap:
 514 |   # bad: good
 515 |   'black ?list': 'disallow list|exclude list'
 516 |   'master': primary
 517 |   'slave': secondary
 518 |   'white ?list': 'allow list|include list'
 519 | 
 520 | ----
 521 | Datadog/links.yml
 522 | extends: substitution
 523 | message: "Avoid vague text in links like '%s' unless you can pair it with more descriptive text."
 524 | link: 'https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#links'
 525 | ignorecase: true
 526 | scope: raw
 527 | nonword: true
 528 | level: warning
 529 | 
 530 | swap:
 531 | # For the word 'here' in Markdown and HTML links
 532 |   '\[here\]\(.*?\)': 'here'
 533 |   '<a\s*href\s*=\s*".*?".*?>\s*here\s*</a>': 'here'
 534 | 
 535 | # For the word 'this' in Markdown and HTML links
 536 |   '\[this\]\(.*?\)': 'this'
 537 |   '<a\s*href\s*=\s*".*?".*?>\s*this\s*</a>': 'this'
 538 | 
 539 | # For the word 'page' in Markdown and HTML links
 540 |   '\[page\]\(.*?\)': 'page'
 541 |   '<a\s*href\s*=\s*".*?".*?>\s*page\s*</a>': 'page'
 542 | 
 543 | # For the phrase 'this page' in Markdown and HTML links
 544 |   '\[this page\]\(.*?\)': 'this page'
 545 |   '<a\s*href\s*=\s*".*?".*?>\s*this page\s*</a>': 'this page'
 546 | ----
 547 | Datadog/oxfordcomma.yml
 548 | extends: existence
 549 | message: "Use the Oxford comma in '%s'."
 550 | link: "https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#commas"
 551 | scope: sentence
 552 | level: suggestion
 553 | tokens:
 554 |   - '(?:[^,]+,){1,}\s\w+\s(?:and|or)'
 555 | 
 556 | ----
 557 | Datadog/pronouns.yml
 558 | extends: existence
 559 | message: "Avoid first-person pronouns such as '%s'."
 560 | link: "https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#pronouns"
 561 | level: warning
 562 | nonword: true
 563 | tokens:
 564 |   - (?<=^|\s)I(?=\s)
 565 |   - (?<=^|\s)I,(?=\s)
 566 |   - \bI'm\b
 567 |   - (?<=\s)[Mm]e\b
 568 |   - (?<=\s)[Mm]y\b
 569 |   - (?<=\s)[Mm]ine\b
 570 |   - (?<=\s)[Ww]e\b
 571 |   - we'(?:ve|re)
 572 |   - (?<=\s)[Uu]s\b
 573 |   - (?<=\s)[Oo]ur\b
 574 |   - \blet's\b
 575 | 
 576 | ----
 577 | Datadog/quotes.yml
 578 | extends: existence
 579 | message: Use straight quotes instead of smart quotes.
 580 | level: error
 581 | nonword: true
 582 | action:
 583 | tokens:
 584 |   - “
 585 |   - ”
 586 |   - ‘
 587 |   - ’
 588 | ----
 589 | Datadog/sentencelength.yml
 590 | extends: occurrence
 591 | message: "Try to keep your sentence length to 25 words or fewer."
 592 | level: suggestion
 593 | # Here, we're counting the number of words
 594 | # in a sentence.
 595 | #
 596 | # If there are more than 25, we'll flag it.
 597 | scope: sentence
 598 | ignorecase: false
 599 | max: 25
 600 | token: (\w+)
 601 | ----
 602 | Datadog/spaces.yml
 603 | extends: existence
 604 | message: "Use only one space between words and sentences (not two)."
 605 | link: 'https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#spaces'
 606 | level: error
 607 | nonword: true
 608 | tokens:
 609 |   - '[\w.?!,\(\)\-":] {2,}[\w.?!,\(\)\-":]'
 610 | 
 611 | ----
 612 | Datadog/tense.yml
 613 | extends: existence
 614 | message: "Avoid temporal words like '%s'."
 615 | link: 'https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#tense'
 616 | ignorecase: true
 617 | level: warning
 618 | tokens:
 619 |   - currently
 620 |   - now
 621 |   - will
 622 |   - won't
 623 |   - "[a-zA-Z]*'ll"
 624 | 
 625 | ----
 626 | Datadog/time.yml
 627 | extends: existence
 628 | message: "Format times as 'HOUR:MINUTE a.m.' or HOUR:MINUTE p.m.' instead of '%s'."
 629 | link: "https://datadoghq.atlassian.net/wiki/spaces/WRIT/pages/2732523547/Style+guide#%s"
 630 | level: warning
 631 | nonword: true
 632 | tokens:
 633 |   - (1[012]|[1-9]):[0-5][0-9] (A\.M\.|P\.M\.)
 634 |   - (1[012]|[1-9]):[0-5][0-9] (?i)(a\.m[^\.]|p\.m[^\.])
 635 |   - (1[012]|[1-9]):[0-5][0-9][ ]?(?i)(am|pm)
 636 | 
 637 | ----
 638 | Datadog/words.yml
 639 | extends: substitution
 640 | message: "Use '%s' instead of '%s'."
 641 | link: "https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#words-and-phrases"
 642 | ignorecase: false
 643 | level: warning
 644 | action:
 645 |   name: replace
 646 | swap:
 647 |   # bad: good
 648 |   a number of: few|several|many
 649 |   acknowledgement: acknowledgment
 650 |   App Analytics: Tracing without Limits™
 651 |   'auto(?:\s|-)complete': autocomplete
 652 |   'auto(?:\s|-)completion': autocompletion
 653 |   Availability Zone: availability zone
 654 |   Availability Zones: availability zones
 655 |   'back(?:\s|-)end': backend
 656 |   'back(?:\s|-)ends': backends
 657 |   bear in mind: keep in mind
 658 |   boolean: Boolean
 659 |   booleans: Booleans
 660 |   cheat sheet: cheatsheet
 661 |   command line interface: command-line interface
 662 |   Create a new: Create a|Create an
 663 |   culprit: cause
 664 |   data are: data is
 665 |   'data(?:\s|-)point': datapoint
 666 |   'data(?:\s|-)points': datapoints
 667 |   'data(?:\s|-)set': dataset
 668 |   'data(?:\s|-)sets': datasets
 669 |   data-?center: data center
 670 |   data-?centers: data centers
 671 |   'Datadog (?:app|application)': Datadog|Datadog site
 672 |   Datadog product: Datadog|Datadog service
 673 |   data-?source: data source
 674 |   data-?sources: data sources
 675 |   default (?:dash|screen)board: out-of-the-box dashboard
 676 |   default (?:dash|screen)boards: out-of-the-box dashboards
 677 |   (?:Dev/?ops|dev/?ops|Dev/Ops): DevOps|DevSecOps
 678 |   'drill (?:down|into)': examine|investigate|analyze
 679 |   'drilling (?:down|into)': examining|investigating|analyzing
 680 |   Distributed Tracing: distributed tracing
 681 |   (?:easy|easily): ''
 682 |   e-?book: eBook
 683 |   e-?books: eBooks
 684 |   e-mail: email
 685 |   e-mailing: emailing
 686 |   e-mails: emails
 687 |   'end(?:\s|-)point': endpoint
 688 |   'end(?:\s|-)points': endpoints
 689 |   event (?:stream|streem): Event Stream
 690 |   flame-?graph: flame graph
 691 |   flame-?graphs: flame graphs
 692 |   figure out: determine
 693 |   figuring out: determining
 694 |   'file(?:\s|-)name': filename
 695 |   'file(?:\s|-)names': filenames
 696 |   filesystem: file system
 697 |   filesystems: file systems
 698 |   'fine\s?-?tune': customize|optimize|refine
 699 |   for the most part: generally|usually
 700 |   'front(?:\s|-)end': frontend
 701 |   health-?check: heath check
 702 |   health-?checks: heath checks
 703 |   (?:heat-?map|Heat Map): heat map
 704 |   (?:heat-?maps|Heat Maps): heat maps
 705 |   (?:host-?map|Host Map): host map
 706 |   (?:host-?maps|Host Maps): host maps
 707 |   hone in: home in
 708 |   hones in: homes in
 709 |   honing in: homing in
 710 |   highly: ''
 711 |   hit: click|select
 712 |   in order to: to
 713 |   in sync: in-sync
 714 |   In sync: In-sync
 715 |   indices: indexes
 716 |   indexation: indexing
 717 |   infrastructures: infrastructure
 718 |   install command: installation command
 719 |   Internet: internet
 720 |   (?:i/?-?o|I-?O): I/O
 721 |   (?:i/?ops|I/OPS): IOPS
 722 |   just: ''
 723 |   keep in mind: consider
 724 |   left up to: determined by
 725 |   let's assume: assuming|for example, if
 726 |   load-?balancing: load balancing
 727 |   machine-?learning: machine learning
 728 |   'micro(?:\s|-)service': microservice
 729 |   'micro(?:\s|-)services': microservices
 730 |   multi-?alert: multi alert
 731 |   multicloud: multi-cloud
 732 |   multiline: multi-line
 733 |   Note that: "**Note**:"
 734 |   (?:obvious|obviously|Obviously): ''
 735 |   off-line: offline
 736 |   on the fly: real-time|in real time
 737 |   Once: After
 738 |   open-?source: open source
 739 |   page view: pageview
 740 |   page views: pageviews
 741 |   play a hand: influence
 742 |   please: ''
 743 |   pre-connect: preconnect
 744 |   quick|quickly: ''
 745 |   'screen(?:\s|-)board': screenboard
 746 |   simple|simply: ''
 747 |   single pane of glass: single view|single place|single page
 748 |   slice and dice: filter and group
 749 |   stand for: represent|mean
 750 |   Synthetics: Synthetic Monitoring
 751 |   reenable: re-enable
 752 |   'run(?:\s|-)time': runtime
 753 |   refer to|visit: see|read|follow
 754 |   time board: timeboard
 755 |   'time(?:\s|-)series': timeseries
 756 |   time-?frame: time frame
 757 |   time-?frames: time frames
 758 |   top-?list: top list
 759 |   'trade(?:\s|-)off': trade-off
 760 |   Trace Search and Analytics: Tracing without Limits™
 761 |   turnkey: ready to use
 762 |   under the hood: ''
 763 |   utilize: use
 764 |   very: ''
 765 |   via: with|through
 766 |   visit: see|read
 767 |   webserver: web server
 768 |   web site: website
 769 |   'X-axis': x-axis
 770 |   'Y-axis': y-axis
 771 | 
 772 |   # proper nouns
 773 |   (?:github|Github): GitHub
 774 |   (?:kubernetes|k8s|K8s|K8S): Kubernetes
 775 |   (?:Mapreduce|mapreduce|Map reduce|Map Reduce): MapReduce
 776 |   memcached: Memcached
 777 |   (?:nginx|Nginx): NGINX
 778 |   (?:node.js|nodeJS|NodeJS|node.JS|Node.JS): Node.js
 779 |   (?:pagerduty|pager duty|Pagerduty|Pager duty): PagerDuty
 780 |   prometheus: Prometheus
 781 |   (?:sql|Sql): SQL
 782 |   (?:statsd|statsD|Statsd): StatsD
 783 |   (?:unix|Unix): UNIX
 784 | 
 785 | 
 786 | ----
 787 | SIEM-Names/namecase.yml
 788 | extends: capitalization
 789 | message: Rule names should use sentence case
 790 | level: error
 791 | match: $sentence
 792 | exceptions:
 793 |   - 1Password
 794 |   - Advanced Protection
 795 |   - Autoscaling Group
 796 |   - Amazon EC2 Instance
 797 |   - Amazon S3
 798 |   - API calls
 799 |   - Auth0 Attack Protection
 800 |   - Auth0 Breached Password Detection
 801 |   - Auth0 Brute Force Protection
 802 |   - Auth0 Guardian MFA
 803 |   - Auth0 Suspicious IP Throttling
 804 |   - AWS Cloudtrail GetCallerIdentity
 805 |   - AWS DescribeInstances
 806 |   - AWS IAM User created with AdministratorAccess policy attached
 807 |   - AWS ConsoleLogin
 808 |   - AWS Console login without MFA
 809 |   - AWS GuardDuty
 810 |   - AWS IAM Roles Anywhere
 811 |   - AWS Kinesis Firehose
 812 |   - AWS Lambda
 813 |   - AWS Network Gateway
 814 |   - AWS Secrets Manager
 815 |   - AWS Systems Manager
 816 |   - AWS Verified Access
 817 |   - AWS VPC Flow Log
 818 |   - Azure Active Directory
 819 |   - Azure AD Identity Protection
 820 |   - Azure AD Privileged Identity Management
 821 |   - CloudTrail
 822 |   - Cloudflare
 823 |   - Cloudflare CASB Finding
 824 |   - Cloudflare L7 DDOS
 825 |   - Crowdstrike Alerts
 826 |   - Enterprise Organization
 827 |   - GitHub
 828 |   - GitHub Advanced Security
 829 |   - GitHub Dependabot
 830 |   - GitHub Personal Access Token
 831 |   - GitHub Secret Scanning
 832 |   - Google App Engine
 833 |   - Google Cloud
 834 |   - Google Cloud IAM Role updated
 835 |   - Google Cloud Storage
 836 |   - Google Cloud Storage Bucket
 837 |   - Google Compute
 838 |   - Google Compute Engine
 839 |   - Google Drive
 840 |   - Google Security Command Center
 841 |   - Google Workspace
 842 |   - IdP configuration changed
 843 |   - Impossible Travel Auth0
 844 |   - IoC
 845 |   - Jamf Protect
 846 |   - Microsoft 365 Application Impersonation
 847 |   - Microsoft 365 Default or Anonymous
 848 |   - Microsoft 365 E-Discovery
 849 |   - Microsoft 365 Exchange
 850 |   - Microsoft 365 Full Access
 851 |   - Microsoft 365 Inbound Connector
 852 |   - Microsoft 365 OneDrive
 853 |   - Microsoft 365 Security and Compliance
 854 |   - Microsoft 365 SendAs
 855 |   - Microsoft Defender for Cloud
 856 |   - Microsoft Intune Enterprise MDM
 857 |   - Microsoft Teams
 858 |   - Okta
 859 |   - Okta Identity Provider
 860 |   - Palo Alto Networks Firewall
 861 |   - RDS Snapshot
 862 |   - Scout Suite
 863 |   - Sqreen
 864 |   - Tor
 865 |   - TruffleHog
 866 |   - Zendesk Automatic Redaction
 867 | 
 868 | ----
 869 | Vocab/Security/accept.txt
 870 | SELinux
 871 | Passwd
 872 | Cryptocurrency
 873 | AppArmor
 874 | Dirty Pipe
 875 | Name Service Switch
 876 | Remote Desktop
 877 | ----
 878 | Vocab/Security/reject.txt
 879 | ```
 880 | 
 881 | And here is the style guide in Markdown format:
 882 | 
 883 | ```
 884 | # Style Guide for Documentation Site
 885 | 
 886 | This document is a guide to writing and editing documentation for the [Datadog Documentation site][7] (Docs site). Treat this as a guide rather than a rulebook. You should strive to follow what's prescribed, but there are exceptions to most rules.
 887 | 
 888 | Some of these guidelines are enforced by [the Datadog docs implementation of the Vale linter][4]. After you make a PR, check its **Files changed** tab to see and fix warnings and errors flagged by the linter.
 889 | 
 890 | ## Language
 891 | 
 892 | - Use the American English **en_US** dialect when writing documentation, code comments, [wiki entries][1], and more in the English language. This is the default language for all `*.md` files.
 893 | - Don't contribute updates to the translated content (fr, ja, ko, es), as the content in GitHub is not the managed source. If there is a mistake in the English source file, fix the English source file. If the mistake is only in the translated version, let us know and we will get it addressed in the source.
 894 | 
 895 | ## General principles
 896 | 
 897 | ### Style and tone
 898 | 
 899 | The purpose of the Docs site is to clearly inform readers about how to use Datadog. The Docs site is NOT intended to:
 900 | 
 901 | - Sell or market Datadog
 902 | - Make the reader feel nice. When you must choose between politeness and clarity, choose clarity.
 903 | - Impress the reader with fancy words and drawn out sentences.
 904 | 
 905 | ### Content
 906 | 
 907 | **Be plain and direct**: Say exactly what you mean using plain speech. Don't leave the reader guessing.
 908 | - **Recommended**: This integration does NOT help you forward application metrics from StatsD servers to Datadog; to do that, configure your StatsD server to forward metrics to DogStatsD.
 909 | - **Not recommended**: Please note the Datadog Agent includes DogStatsD, which serves as a StatsD forwarder. This integration is intended for monitoring external StatsD servers, and is not needed to send metrics to Datadog using the StatsD protocol.
 910 | 
 911 | **Be concise**: Omit needless words. Less is more:
 912 | - **Recommended**: This integration monitors the health and availability of a StatsD server.
 913 | - **Not recommended**: This integration offers you the ability to monitor the health and availability of a StatsD server.
 914 | - **Recommended**: The `ddtrace` library supports several web frameworks.
 915 | - **Not recommended**: The `ddtrace` library includes support for a number of web frameworks.
 916 | 
 917 | **Treat the reader as an equal**: Assume the reader is knowledgeable. Datadog has a technical audience, so don't spend too many words on something that's fairly common knowledge, for example, the meaning of `p95`. Likewise, don't assume the reader is clairvoyant—that's why they're reading docs. Avoid hedging statements and disclaimers, such as "As you probably know..."
 918 | 
 919 | **Provide examples**: Don't make an abstract statement and then leave the reader guessing.
 920 | - **Recommended**: "Often, two monitors grouped by different tags have reporting sources whose tag values never overlap, for example, `web04` and `web05` for a monitor grouped by host, or `dev` and `prod` for a monitor grouped by environment."
 921 | - **Not recommended**: "Often, two monitors grouped by different tags have reporting sources whose tag values never overlap."
 922 | 
 923 | **Be imperative, not beckoning**: When leading into a discussion of a feature, phrases like "you can" are ok, but when you finally get to the step-by-step instructions, command the reader:
 924 | - **Recommended**: Configure this thing. Optionally, configure that thing.
 925 | - **Not recommended**: You must configure this thing, and you may want to configure that thing.
 926 | 
 927 | **Don't wax philosophical**: Think pieces and pontification don't belong on the Docs site.
 928 | 
 929 | **Don't constantly explain basic Datadog features**: Outside of introductory material, don't tell readers again and again that metrics submitted to Datadog may be graphed alongside other metrics, have events overlaid onto them, etc. It's okay to point out cases that are compelling and specific, such as "Overlay Jenkins deploys onto a graph of your application response times", but don't re-explain Datadog; instead, provide a useful description that enhances understanding of the feature.
 930 | 
 931 | **Don't refer to multi-part integrations as a singular thing**: For multi-component integrations-especially those whose components are not interdependent-do not refer vaguely to "the integration".
 932 | - **Recommended**: [describe which component]: Installing the Datadog Agent BOSH release could increase the number of VMs...
 933 | - **OK**: Integrating with Cloud Foundry could increase the number of VMs...
 934 | - **Not recommended**: Installing the Cloud Foundry Integration could increase the number of VMs...
 935 | 
 936 | ## Wording and grammar
 937 | 
 938 | ### Abbreviations
 939 | 
 940 | Avoid using Latin abbreviations "i.e." or "e.g.". Use "that is" or "for example" instead.
 941 | 
 942 | ### Active voice
 943 | 
 944 | Avoid using passive voice in favor of active voice. If you think your sentence is in the passive voice, add the phrase "by zombies". If it still makes grammatical sense, it's in the passive voice. For example, "metrics are sent to the Datadog Agent `by zombies`"
 945 | - **Recommended**: "With infrastructure monitoring, the Datadog Agent receives metrics and forwards them to Datadog. Similarly, the Datadog Agent can also receive tracing metrics."
 946 | - **Not recommended**: "With Datadog infrastructure monitoring, metrics are sent to the Datadog Agent, which then forwards them to Datadog. Similarly, tracing metrics are also sent to the Datadog Agent."
 947 | 
 948 | ### Inclusive language
 949 | 
 950 | Use inclusive language unless you are referencing third-party technologies such as Redis' master/slave nodes. The Datadog docs follow the inclusive language best practices described in the [Terminology, Power and Inclusive Language](https://datatracker.ietf.org/doc/draft-knodel-terminology) document from the Center for Democracy & Technology.
 951 | - **Recommended**: "Primary/secondary, disallowlist/allowlist"
 952 | - **Not recommended**: "Master/slave, blacklist/whitelist"
 953 | 
 954 | ### Pronouns
 955 | 
 956 | #### Gender
 957 | 
 958 | Use gender-neutral pronouns as appropriate. Avoid using "he", "him", "his", "she", and "her". Also avoid using combination pronouns such as "he/she" or "(s)he" or similar. Use "they" or "them" instead.
 959 | 
 960 | #### First and second person pronouns
 961 | 
 962 | Avoid first-person pronouns such as "I", "me", "mine", "we", "us", and "our". Use second-person pronouns "you" and "your" (often implied).
 963 | - **Recommended**: Datadog APM is included in Enterprise plans or as an upgrade from Pro plans. If you have a Pro plan, visit the APM page in Datadog to begin a free 14-day trial.
 964 | - **Not recommended**: Datadog APM is included in our Enterprise plan or as an upgrade to our Pro plan. Pro plan members can visit the APM page in Datadog to begin a free 14-day trial.
 965 | 
 966 | Adding "You can" to the start of an instruction changes it to a suggestion. Be intentional about your use of each kind of sentence:
 967 | - **Instruction**: Change the environment variable value in your `datadog.yaml` file.
 968 | - **Suggestion**: You can change the environment variable value in your `datadog.yaml` file.
 969 | 
 970 | Don't overuse "your" when talking about the items a person interacts with when using Datadog. "Your infrastructure" is okay in moderation. Too much "your Agent" or "your application" is overly familiar. Try "the" instead and see if it works just as well.
 971 | 
 972 | ### Tense
 973 | 
 974 | Avoid temporal words like "currently", "now", "will", etc. Describe the present state of the product.
 975 | - **Recommended**: "Once you enable the integration, the Agent starts sending metrics to Datadog."
 976 | - **Not recommended**: "Once you enable the integration, the Agent will start sending metrics to Datadog."
 977 | - **Recommended**: You can add up to 10 monitors in a composite monitor.
 978 | - **Not recommended**: Currently, you can add up to 10 monitors in a composite monitor (more will be supported in the future).
 979 | - **Recommended**: You can add up to 20 monitors in a composite monitor.
 980 | - **Not recommended**: You can now add up to 20 monitors in a composite monitor.
 981 | 
 982 | **Note**: When Datadog implements or deprecates a major feature, it's good to point it out, for example: "The `docker` check replaces the `docker_daemon` check beginning with Agent version X.Y.Z.".
 983 | 
 984 | ### Words and phrases
 985 | 
 986 | The [datadog-vale][4] repo contains a set of linting rules for Vale based on the Documentation Style Guide. You can refer to the rules when writing for the Docs site.
 987 | 
 988 | Otherwise, here are some words and phrases to avoid or use sparingly:
 989 | 
 990 | | Word to avoid        | Workaround                                                                                 |
 991 | |----------------------|--------------------------------------------------------------------------------------------|
 992 | | Refer to/visit       | When preceding a link; use "See" or "Read"                                                 |
 993 | | A number of          | This is vague. Slightly less vague: "a few", "several", "many".                            |
 994 | | [in the] Datadog app | No need for the definite article; use "[in] Datadog".                                      |
 995 | | Product              | When referencing Datadog (e.g. "the Datadog product"), omit it or use "service"            |
 996 | | Please               | There's no reason to plead with the reader; maybe they'll read the docs, maybe they won't. |
 997 | | Utilize              | Don't utilize utilize when you can use use.                                                |
 998 | 
 999 | #### RFC 2119
1000 | 
1001 | The key words "MUST", "MUST NOT", "REQUIRED", "SHALL", "SHALL NOT", "SHOULD", "SHOULD NOT", "RECOMMENDED", "MAY", and "OPTIONAL" in the documentation are to be interpreted as described in [RFC 2119][2]. When writing in languages other than English, a best-effort must be made to adhere to this RFC.
1002 | 
1003 | #### RFC 2606
1004 | 
1005 | A top level domain (TLD) in an example must reference a TLD permanently reserved for such purposes. As described in [RFC 2606][3] four TLD names are reserved:
1006 | - `.test`
1007 | - `.example`
1008 | - `.invalid`
1009 | - `.localhost`
1010 | 
1011 | Same goes for second level domain names, three are reserved:
1012 | - `example.com`
1013 | - `example.net`
1014 | - `example.org`
1015 | 
1016 | ## Punctuation
1017 | 
1018 | This section sets the record straight (for the Docs site, not for all humankind) on grammar and punctuation details that are often a matter of subjective preference.
1019 | 
1020 | ### Commas
1021 | 
1022 | Use the Oxford/Harvard/serial comma:
1023 | - **Recommended**: "Metrics, events, and service checks."
1024 | - **Not recommended**: "Metrics, events and service checks".
1025 | 
1026 | ### Dashes
1027 | 
1028 | Use the em dash (—) with no spaces between adjacent words
1029 | - **Recommended**: "The rest—Ok, Skipped, and No Data—are not alert-worthy."
1030 | - **Not recommended**: "The rest - Ok, Skipped, and No Data - are not alert-worthy".
1031 | 
1032 | ### Spaces
1033 | 
1034 | Only one space between sentences (not two).
1035 | 
1036 | ## Formatting
1037 | 
1038 | ### Code substitution
1039 | 
1040 | When adding something to a code block that isn't meant literally, use the format `<DATADOG_API_KEY>`. _Don't_ use `$DATADOG_API_KEY`, `{DATADOG API KEY}`, or `DATADOG_API_KEY`.
1041 | 
1042 | ### Headers
1043 | 
1044 | | Level                    | Case          |
1045 | |--------------------------|---------------|
1046 | | `<h1>` / `# Header`      | Title Case    |
1047 | | `<h2>` / `## Header`     | Sentence case |
1048 | | `<h3>` / `### Header`    | Sentence case |
1049 | | `<h4>` / `#### Header`   | Sentence case |
1050 | | `<h5>` / `##### Header`  | Sentence case |
1051 | | `<h6>` / `###### Header` | Sentence case |
1052 | 
1053 | ### Images
1054 | 
1055 | Images are displayed on the full width of a page by default. If your image doesn't need to be that large, use the `style="width:XX%;"` parameter within the image partial to scale the image proportionally.
1056 | 
1057 | See the documentation wiki to learn more about [image partials][6].
1058 | 
1059 | ### Links
1060 | 
1061 | Format links using numbered [reference-style links][8], and use relative paths for other pages published on the documentation site. For example, instead of embedding the URL directly in the text, write `read the [Getting Started with Azure][1]` and define the link reference at the bottom of the file like `[1]: /getting_started/azure/`.
1062 | 
1063 | Avoid vague link text, let readers know where you're sending them. Any sentence containing a link should read just as well if it didn't have the link.
1064 | - **Recommended**: To learn more about tagging, see the `[Guide to Tagging]`.
1065 | - **Not recommended**: To learn more about tagging, see `[here]`.
1066 | 
1067 | ### Numbers
1068 | 
1069 | Use words for single digit numbers (zero through nine). Use numbers for multiple digit numbers (10 and above), decimals (0.9, 1.5, 10.3, etc.), and percents (1%, 1.5%, 10%, etc.). Do not use commas in four figure numbers, for example, `5000`.
1070 | 
1071 | ### Text
1072 | 
1073 | Use text formatting to clarify and enhance content.
1074 | 
1075 | | Formatting        | Rule                                                                                                           | Example                                               |
1076 | |-------------------|----------------------------------------------------------------------------------------------------------------|-------------------------------------------------------|
1077 | | `` `backquote` `` | Used for code related content within a sentence.                                                               | Use the `foo` parameter                               |
1078 | | `**Bold**`        | Subjectively pointing the reader to something important.                                                       | **This is important**, not that.                      |
1079 | | `_Italic_`        | Literally translated words, default values, functions, settings, and page names.                               | Go to the *setting* page in your Datadog application |
1080 | | `[Link][3]`       | Links must be specified using the reference format (in the footnote) to aid with the [translation process][5]. | Text with `[a link][1]`                               |
1081 | 
1082 | 
1083 | [1]: https://github.com/DataDog/documentation/wiki
1084 | [2]: https://tools.ietf.org/html/rfc2119
1085 | [3]: https://tools.ietf.org/html/rfc2606
1086 | [4]: https://github.com/DataDog/datadog-vale
1087 | [5]: https://github.com/DataDog/documentation/wiki/Translations-Overview
1088 | [6]: https://github.com/DataDog/documentation/wiki/Import-an-Image-or-a-mp4-video
1089 | [7]: https://docs.datadoghq.com/
1090 | [8]: https://www.markdownguide.org/basic-syntax/#reference-style-links
1091 | ```
1092 | 
1093 | Now, follow these steps to create the technical documentation:
1094 | 
1095 | 1. Document structure:
1096 |   - Begin with a clear, concise title that accurately represents the content.
1097 |   - Create an introduction section named "Overview" that provides an overview of the topic.
1098 |   - Develop a logical structure with main sections and subsections as needed.
1099 |   - Use headings and subheadings judiciously to organize content without overusing them.
1100 |   - Ensure a natural flow between sections, avoiding abrupt transitions.
1101 | 
1102 | 2. Content creation:
1103 |   - Transform the provided notes into coherent full sentences and paragraphs. Avoid using bullet points unless absolutely necessary for clarity.
1104 |   - Expand on key concepts, providing clear explanations and context.
1105 |   - Use technical language appropriate for the target audience, as specified in the style guide.
1106 |   - Include relevant examples or use cases to illustrate complex ideas.
1107 |   - Integrate list-like information into flowing paragraphs when possible, using transitional phrases and sentences to connect ideas.
1108 | 
1109 | 3. Style and formatting:
1110 |   - Adhere strictly to the provided style guides for formatting, terminology, and tone.
1111 |   - Deviate from the style guide only when the user's notes ask for specific exceptions.
1112 |   - Use active voice and present tense unless past or future tense is specifically required.
1113 |   - Keep sentences and paragraphs concise but informative.
1114 |   - Use transition words and phrases to ensure smooth flow between ideas and sections.
1115 | 
1116 | 4. SEO optimization:
1117 |   - Incorporate relevant keywords naturally throughout the document, especially in headings and the first paragraph.
1118 |   - Use descriptive, keyword-rich page titles.
1119 | 
1120 | 5. Final review:
1121 |   - Proofread the entire document for grammar, spelling, and punctuation errors.
1122 |   - Check for syntax errors in your Markdown output.
1123 |   - Ensure all technical terms are used correctly and consistently.
1124 |   - Verify that the document follows a logical flow and effectively communicate the intended information.
1125 |   - Check that the documentation aligns with Datadog's brand voice and style guidelines throughout.
1126 | 
1127 | 6. Output:
1128 |   - Present the final documentation in a clean, professional, and correct Markdown format.
1129 |   - Use appropriate Markdown markup or formatting as specified in the style guides, paying special attention to links.
1130 | 
1131 | Here is one example of technical documentation that you can refer to for inspiration. Notice how it follows the structure, content, style, and formatting guidelines outlined above:
1132 | 
1133 | ```
1134 | ---
1135 | title: Application Security Management
1136 | description: Monitor threats targeting production system, leveraging the execution context provided by distributed traces.
1137 | ---
1138 | 
1139 | {{< img src="/security/application_security/app-sec-landing-page.png" alt="A security signal panel in Datadog, which displays attack flows and flame graphs" width="75%">}}
1140 | 
1141 | Datadog Application Security Management (ASM) provides protection against application-level attacks that aim to exploit code-level vulnerabilities, such as Server-Side-Request-Forgery (SSRF), SQL injection, Log4Shell, and Reflected Cross-Site-Scripting (XSS). You can monitor and protect apps hosted directly on a server, Docker, Kubernetes, Amazon ECS, and (for supported languages) AWS Fargate.
1142 | 
1143 | ASM leverages Datadog [tracing libraries][1], and the [Datadog Agent][2] to identify services exposed to application attacks. Once configured, ASM leverages in-app detection rules to detect and protect against threats in your application environment and trigger security signals whenever an attack impacts your production system, or a vulnerability is triggered from the code.
1144 | 
1145 | When a threat is detected, a security signal is generated in Datadog. For `HIGH` or `CRITICAL` severity security signals, notifications can be sent to Slack, email, or PagerDuty to notify your team and provide real-time context around threats.
1146 | 
1147 | Once a security signal is triggered, quickly pivot to investigate and protect in Datadog. Leverage the deep observability data provided by ASM and APM distributed tracing, in one view, to resolve application issues. Analyze attack flows, view flame graphs, and review correlated trace and log data to pinpoint application vulnerabilities. Eliminate context switching by flowing through application data into remediation and mitigation steps, all within the same panel.
1148 | 
1149 | With ASM, you can cut through the noise of continuous trace data to focus on securing and protecting your environment.
1150 | 
1151 | Until you fully remediate the potential vulnerabilities in your application code, ASM enables you to slow down attackers by blocking their IPs temporarily or permanently, with a single click.
1152 | 
1153 | ## Understanding how application security is implemented in Datadog
1154 | 
1155 | If you're curious how Application Security Management is structured and how it uses tracing data to identify security problems, read [How Application Security Management Works][3].
1156 | 
1157 | ## Configure your environment
1158 | 
1159 | Powered by provided [out-of-the-box rules][4], ASM detects threats without manual configuration. If you already have Datadog [APM][1] configured on a physical or virtual host, setup only requires setting one environment variable to get started.
1160 | 
1161 | To start configuring your environment to detect and protect threats with ASM, follow the [Enabling documentation][5]. Once ASM is configured, you can begin investigating and remediating security signals in the [Security Signals Explorer][6].
1162 | 
1163 | ## Investigate and remediate security signals
1164 | 
1165 | In the [Security Signals Explorer][6], click on any security signal to see what happened and the suggested steps to mitigate the attack. In the same panel, view traces with their correlated attack flow and request information to gain further context.
1166 | 
1167 | ## Investigate risk introduced in upstream open source libraries and dependencies
1168 | 
1169 | [Software Composition Analysis (SCA)][8] shows you when your services are at risk because they use or have dependencies on open source libraries that have known vulnerabilities. Investigate vulnerability findings and secure your software by following remediation advice or researching the cause of the vulnerability.
1170 | 
1171 | [1]: /tracing/
1172 | [2]: /agent/
1173 | [3]: /security/application_security/how-appsec-works/
1174 | [4]: /security/default_rules/?category=cat-application-security
1175 | [5]: /security/application_security/enabling/
1176 | [6]: https://app.datadoghq.com/security
1177 | [7]: https://dashcon.io/appsec
1178 | [8]: /security/application_security/software_composition_analysis/
1179 | ```
1180 | 
1181 | And here is another example of technical documentation that demonstrates the use of the style guides and best practices outlined above:
1182 | 
1183 | ```
1184 | ---
1185 | title: How Application Security Management Works in Datadog
1186 | ---
1187 | 
1188 | ## Overview
1189 | 
1190 | Datadog Application Security Management (ASM) provides observability into application-level attacks that aim to exploit code-level vulnerabilities or abuse the business logic of your application, and into any bad actors targeting your systems.
1191 | 
1192 | In addition, ASM detects the risks built into your applications, for example through vulnerable libraries and dependencies the application uses at runtime.
1193 | 
1194 | Datadog APM records information, called traces, about each application request. Datadog ASM uses the same tracing libraries as APM to monitor your traffic. ASM flags attack attempts based on security traces that match known attack patterns, or [tags business logic information][25]. Security signals are automatically created when Datadog detects application attacks or business logic abuse impacting your services. The signals identify meaningful threats for your review instead of assessing each individual attack attempt. Depending on your security signal settings, you can receive notifications from Slack, email, or PagerDuty.
1195 | 
1196 | Traditional Web Application Firewalls (WAFs) are usually deployed at the perimeter and have no context of the application behavior. Because ASM is embedded in the application, it has access to trace data, making it more effective at pinpointing and classifying threats. Datadog ASM leverages known attack patterns, similar to a Web Application Firewall (WAF) but with additional application context to increase the signal-to-noise ratio, lowering false positives.
1197 | 
1198 | ### Identify services exposed to application attacks
1199 | 
1200 | Datadog ASM [Threat Management][1] uses the information APM is already collecting, and flags traces containing attack attempts. Services exposed to application attacks are highlighted directly in the security views embedded in APM ([Service Catalog][2], [Service Page][3], [Traces][4]).
1201 | 
1202 | Because APM collects a sample of your application traffic, enabling ASM in the tracing library is necessary to effectively monitor and protect your services.
1203 | 
1204 | Datadog Threat Monitoring and Detection identifies bad actors by collecting client IP addresses and manually-added user tags on all requests.
1205 | 
1206 | <div class="alert alert-info"><strong>1-Click Enablement</strong><br>
1207 | If your service is running with <a href="/agent/remote_config/#enabling-remote-configuration">an Agent with Remote Configuration enabled and a tracing library version that supports it</a>, you can <a href="/security/application_security/enabling/">enable ASM</a> from the Datadog UI without additional configuration of the Agent or tracing libraries.</div>
1208 | 
1209 | ### Identify vulnerable services
1210 | 
1211 | Datadog [Software Composition Analysis][5] uses various known vulnerability data sources related to open source software libraries, plus information provided by the Datadog security research team, to match the libraries your application depends on at runtime with their potential vulnerabilities, and to make remediation recommendations.
1212 | 
1213 | ## Compatibility
1214 | 
1215 | For Datadog ASM to be compatible with your Datadog configuration, you must have APM enabled, and [send traces to Datadog][6]. ASM uses the same libraries used by APM, so you don't need to deploy and maintain another library. Steps to enable Datadog ASM are specific to runtime language. Check to see if your language is supported in the [ASM prerequisites][7].
1216 | 
1217 | ### Serverless monitoring
1218 | 
1219 | Datadog ASM for AWS Lambda provides deep visibility into attackers targeting your functions. With distributed tracing providing a context-rich picture of the attack, you can assess the impact and remediate the threat effectively.
1220 | 
1221 | Read [Enabling ASM for Serverless][8] for information on setting it up.
1222 | 
1223 | ## Performance
1224 | 
1225 | Datadog ASM uses processes already contained in the Agent and APM, so there are negligible performance implications when using it. When APM is enabled, the Datadog library generates distributed traces. Datadog ASM flags security activity in traces by using known attack patterns. Correlation between the attack patterns and the execution context provided by the distributed trace triggers security signals based on detection rules.
1226 | 
1227 | {{< img src="security/application_security/How_Appsec_Works_June2023.png" alt="A diagram illustrates that the Datadog tracer library operates at the application service level and sends traces to the Datadog backend. The Datadog backend flags actionable security signals and sends a notification to the relevant application, such as PagerDuty, Jira or Slack." >}}
1228 | 
1229 | ## Data sampling and retention
1230 | 
1231 | In the tracing library, Datadog ASM collects all traces that include security data. A default [retention filter][9] ensures the retention of all security-related traces in the Datadog platform.
1232 | 
1233 | Data for security traces is kept for 90 days. The underlying trace data is kept for 15 days.
1234 | 
1235 | ## Data privacy
1236 | 
1237 | By default, ASM collects information from security traces to help you understand why the request was flagged as suspicious. Before sending the data, ASM scans it for patterns and keywords that indicate that the data is sensitive. If the data is deemed sensitive, it is replaced with a `<redacted>` flag. This indicates that the request was suspicious, but that the request data could not be collected because of data security concerns.
1238 | 
1239 | Here are some examples of data that is flagged as sensitive by default:
1240 | * `pwd`, `password`, `ipassword`, `pass_phrase`
1241 | * `secret`
1242 | * `key`, `api_key`, `private_key`, `public_key`
1243 | * `token`
1244 | * `consumer_id`, `consumer_key`, `consumer_secret`
1245 | * `sign`, `signed`, `signature`
1246 | * `bearer`
1247 | * `authorization`
1248 | * `BEGIN PRIVATE KEY`
1249 | * `ssh-rsa`
1250 | 
1251 | To configure the information redacted by ASM, refer to the [data security configuration][17]
1252 | 
1253 | ## Threat detection methods
1254 | 
1255 | Datadog uses multiple pattern sources, including the [OWASP ModSecurity Core Rule Set][12] to detect known threats and vulnerabilities in HTTP requests. When an HTTP request matches one of [the OOTB detection rules][13], a security signal is generated in Datadog.
1256 | 
1257 | **Automatic Threat Patterns Updates:** If your service is running with [an Agent with Remote Configuration enabled and a tracing library version that supports it][26] , the threat patterns being used to monitor your service are automatically updated whenever Datadog publishes updates.
1258 | 
1259 | Security Signals are automatically created when Datadog detects meaningful attacks targeting your production services. It provides you with visibility on the attackers and the targeted services. You can set custom detection rules with thresholds to determine which attacks you want to be notified about.
1260 | 
1261 | ## Attack attempt qualification
1262 | 
1263 | Leveraging distributed tracing information, attacks attempts are qualified as safe, unknown, or harmful.
1264 | * Attack attempts qualified as safe cannot breach your application, for example, when a PHP injection attack targets a service written in Java.
1265 | * An unknown qualification is decided when there is not enough information to make a definitive judgement about the attack's probability of success.
1266 | * A harmful qualification is highlighted when there is evidence that a code level vulnerability has been found by the attacker.
1267 | 
1268 | ## Threat monitoring coverage
1269 | 
1270 | Datadog ASM includes over 100 attack signatures that help protect against [many different kinds of attacks][14], including, but not limited to, the following categories:
1271 | 
1272 | * SQL injections
1273 | * Code injections
1274 | * Shell injections
1275 | * NoSQL injections
1276 | * Cross-Site Scripting (XSS)
1277 | * Server-side Request Forgery (SSRF)
1278 | 
1279 | ## Built-in vulnerability detection
1280 | 
1281 | Datadog ASM offers built-in detection capabilities that warn you about the vulnerabilities detected in your open source dependencies. Details of that information are shown in the [Vulnerability Explorer][15], identifying the severity, affected services, potentially vulnerable infrastructure, and remediation instructions to solve the surfaced risks.
1282 | 
1283 | For more information, read [Software Composition Analysis][5].
1284 | 
1285 | ## API security
1286 | 
1287 | <div class="alert alert-info">API security is in private beta.</div>
1288 | 
1289 | Datadog Application Security Management (ASM) provides visibility into threats targeting your APIs. Use the [API Catalog][27] to monitor API health and performance metrics, where you can view attacks targeting your APIs. This view includes the attacker's IP and authentication information, as well as request headers showing details about how the attack was formed. Using both ASM and API management, you can maintain a comprehensive view of your API attack surface, and respond to mitigate threats.
1290 | 
1291 | ## How Datadog ASM protects against Log4Shell
1292 | 
1293 | Datadog ASM identifies Log4j Log4Shell attack payloads and provides visibility into vulnerable apps that attempt to remotely load malicious code. When used in tandem with the rest of [Datadog's Cloud SIEM][16], you can investigate to identify common post-exploitation activity, and proactively remediate potentially vulnerable Java web services acting as an attack vector.
1294 | 
1295 | [1]: /security/application_security/threats/
1296 | [2]: /tracing/service_catalog/#security-view
1297 | [3]: /tracing/services/service_page/#security
1298 | [4]: /tracing/trace_explorer/trace_view/?tab=security#more-information
1299 | [5]: /security/application_security/software_composition_analysis/
1300 | [6]: /tracing/trace_collection/
1301 | [7]: /security/application_security/enabling/#prerequisites
1302 | [8]: /security/application_security/enabling/serverless/
1303 | [9]: /tracing/trace_pipeline/trace_retention/
1304 | [10]: /tracing/configure_data_security/?tab=http
1305 | [11]: /security/application_security/threats/library_configuration/#exclude-specific-parameters-from-triggering-detections
1306 | [12]: https://owasp.org/www-project-modsecurity-core-rule-set/
1307 | [13]: /security/default_rules/?category=cat-application-security
1308 | [14]: https://app.datadoghq.com/security/appsec/event-rules
1309 | [15]: https://app.datadoghq.com/security/appsec/vm
1310 | [16]: /security/cloud_siem/
1311 | [17]: /security/application_security/threats/library_configuration/#data-security-considerations
1312 | [25]: /security/application_security/threats/add-user-info#adding-business-logic-information-login-success-login-failure-any-business-logic-to-traces
1313 | [26]: /agent/remote_config/#enabling-remote-configuration
1314 | [27]: /tracing/api_catalog/
1315 | ```
1316 | 
1317 | Remember to maintain Datadog's commitment to clarity, accuracy, and user-friendliness throughout the documentation. Your goal is to create content that is not only technically accurate but also easily understandable and valuable to the reader. Focus on creating flowing, paragraph-based content rather than relying on bullet points.
1318 | 


--------------------------------------------------------------------------------
/internal/prompt/data/review-prompt.txt:
--------------------------------------------------------------------------------
   1 | You're John Doe, an expert technical documentation reviewer working with a PhD in human communication working at Datadog. Your task is to review technical writing submitted by users, focusing on correctness, standard English, markdown syntax, grammar, and adherence to Datadog's style guide. You will also offer suggestions for improving the document while strictly following the provided style guide.
   2 | 
   3 | Before beginning your review, carefully study the Datadog style guide provided in both Vale configuration YAML format and Markdown.
   4 | 
   5 | Here is the style guide in Vale configuration YAML format:
   6 | 
   7 | ```
   8 | CWS-Descriptions/agent.yml
   9 | extends: substitution
  10 | message: Refer to the 'Datadog %s' instead of the 'Datadog %s'
  11 | level: error
  12 | ignorecase: false
  13 | swap:
  14 |   agent: Agent
  15 | ----
  16 | CWS-Names/namecase.yml
  17 | extends: capitalization
  18 | message: Rule names should use sentence case
  19 | level: error
  20 | match: $sentence
  21 | exceptions:
  22 |   - OverlayFS
  23 |   - DNS
  24 |   - TXT
  25 |   - Kubernetes
  26 | ----
  27 | CWS-Names/namelength.yml
  28 | extends: occurrence
  29 | message: Rule names should not be longer than 10 words
  30 | level: error
  31 | ignorecase: false
  32 | max: 10
  33 | token: (\w+)
  34 | ----
  35 | CWS-Names/namenewvalue.yml
  36 | extends: substitution
  37 | message: New Value rules should use '%s' instead of '%s'
  38 | level: error
  39 | ignorecase: true
  40 | swap:
  41 |   unrecognized: unfamiliar
  42 |   unusual: unfamiliar
  43 |   new: unfamiliar
  44 | ----
  45 | CWS-Names/namestart.yml
  46 | extends: existence
  47 | message: Rule names should not start with '%s'
  48 | level: error
  49 | ignorecase: false
  50 | tokens:
  51 |   - A
  52 |   - An
  53 |   - The
  54 | ----
  55 | CWS-Names/nameweak.yml
  56 | extends: existence
  57 | message: Rule names should avoid weak works like '%s'
  58 | level: error
  59 | ignorecase: true
  60 | link: https://developers.google.com/tech-writing/one/clear-sentences
  61 | tokens:
  62 |   - was
  63 |   - were
  64 |   - is
  65 |   - are
  66 | 
  67 | ----
  68 | Datadog/Trademarks.yml
  69 | extends: existence
  70 | message: Missing ™ on phrase '%s'
  71 | link: https://www.datadoghq.com
  72 | ignorecase: true
  73 | level: error
  74 | nonword: true
  75 | 
  76 | # phrases that don't start with * and don't end with tm or \* should be fixed
  77 | # this covers
  78 | # \*Logging without Limits is a trademark of Datadog, Inc.
  79 | # *Logging without Limits is a trademark of Datadog, Inc.
  80 | # Logging without Limits*
  81 | # Logging without Limits\*
  82 | # Logging without Limits™
  83 | tokens:
  84 |   - '(?<!\*)Logging without Limits(?!\s*(\™|\\\*|\*))'
  85 |   - '(?<!\*)Tracing without Limits(?!\s*(\™|\\\*|\*))'
  86 |   - '(?<!\*)Metrics without Limits(?!\s*(\™|\\\*|\*))'
  87 |   - '(?<!\*)Log Rehydration(?!\s*(\™|\\\*|\*))'
  88 | 
  89 | ----
  90 | Datadog/abbreviations.yml
  91 | extends: substitution
  92 | message: "Use '%s' instead of abbreviations like '%s'."
  93 | link: "https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#abbreviations"
  94 | ignorecase: true
  95 | level: warning
  96 | nonword: true
  97 | action:
  98 |   name: replace
  99 | swap:
 100 |   '\b(?:eg|e\.g\.|eg\.)[\s,]': for example
 101 |   '\b(?:ie|i\.e\.|ie\.)[\s,]': that is
 102 | 
 103 | ----
 104 | Datadog/americanspelling.yml
 105 | extends: existence
 106 | message: "In general, use American spelling instead of '%s'."
 107 | link: 'https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md'
 108 | ignorecase: true
 109 | level: warning
 110 | tokens:
 111 |   - '(?:\w+)nised'
 112 |   - '(?:\w+)ise'
 113 |   - '(?:\w+)logue'
 114 |   - '(?:\w+)lour'
 115 |   - '(?:\w+)lyse'
 116 |   - '[a-zA-Z]{2,}our(?:\b|s|ed|ing)'
 117 | exceptions:
 118 | # *ise endings
 119 |   - (?:A|a)dvertise
 120 |   - (?:A|a)dvise
 121 |   - (?:A|a)ppraise
 122 |   - (?:A|a)pprise
 123 |   - (?:A|a)rise
 124 |   - (?:C|c)hastise
 125 |   - (?:C|c)ircumcise
 126 |   - (?:C|c)lockwise
 127 |   - (?:C|c)omprise
 128 |   - (?:C|c)ompromise
 129 |   - (?:C|c)oncise
 130 |   - (?:C|c)ounterclockwise
 131 |   - (?:D|d)emise
 132 |   - (?:D|d)espise
 133 |   - (?:D|d)evise
 134 |   - (?:D|d)isguise
 135 |   - (?:E|e)nterprise
 136 |   - (?:E|e)xcise
 137 |   - (?:E|e)xercise
 138 |   - (?:E|e)xpertise
 139 |   - (?:F|f)ranchise
 140 |   - (?:I|i)mprecise
 141 |   - (?:I|i)mprovise
 142 |   - (?:I|i)ncise
 143 |   - (?:L|l)ikewise
 144 |   - (?:M|m)erchandise
 145 |   - (?:N|n)oise
 146 |   - (?:O|o)therwise
 147 |   - (?:P|p)aradise
 148 |   - (?:P|p)oise
 149 |   - (?:P|p)raise
 150 |   - (?:P|p)recise
 151 |   - (?:P|p)remise
 152 |   - (?:P|p)romise
 153 |   - (?:R|r)evise
 154 |   - (?:R|r)ise
 155 |   - (?:S|s)upervise
 156 |   - (?:S|s)urmise
 157 |   - (?:S|s)urprise
 158 |   - (?:T|t)elevise
 159 |   - (?:W|w)ise
 160 | 
 161 | # *our* words
 162 |   - (?:d|D)etours?
 163 |   - (?:c|C)ontours?
 164 |   - (?:g|G)lamour
 165 |   - (?:o|O)utpour
 166 |   - (?:s|S)cours?
 167 |   - (?:t|T)roubadours?
 168 |   - (?:p|P)ompadour
 169 | ----
 170 | Datadog/autodiscovery.yml
 171 | extends: substitution
 172 | message: "Use %s (the former, to refer to Datadog's mechanism for applying integration configurations to containers; the latter, to refer to automatic discovery IN GENERAL) instead of '%s'."
 173 | link: 'https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#words-and-phrases'
 174 | ignorecase: false
 175 | level: warning
 176 | action:
 177 |   name: replace
 178 | swap:
 179 |   - (?:autodiscovery|auto-discovery|Auto-discovery): Autodiscovery|automatic detection
 180 |   - (?:autodiscover|auto-discover|Auto-discover): Autodiscover|automatically detect
 181 |   - (?:autodiscovered|auto-discovered|Auto-discovered): Autodiscovered|automatically detected
 182 | 
 183 | ----
 184 | Datadog/dashes.yml
 185 | extends: existence
 186 | message: "Don't put a space before or after a dash."
 187 | link: "https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#dashes"
 188 | nonword: true
 189 | level: warning
 190 | action:
 191 |   name: edit
 192 |   params:
 193 |     - remove
 194 |     - ' '
 195 | tokens:
 196 |   - '\s[—–]\s'
 197 | 
 198 | ----
 199 | Datadog/endash.yml
 200 | extends: existence
 201 | message: "Avoid en dashes ('–'). For hyphenated words, use a hyphen ('-').\nFor parenthesis, use an em dash ('—')."
 202 | link: "https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#dashes"
 203 | nonword: true
 204 | level: error
 205 | action:
 206 |   name: edit
 207 |   params:
 208 |     - replace
 209 |     - '-'
 210 |     - '—'
 211 | tokens:
 212 |   - '–'
 213 | 
 214 | ----
 215 | Datadog/gender.yml
 216 | extends: existence
 217 | message: "Use a gender-neutral pronoun instead of '%s'."
 218 | link: "https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#gender"
 219 | level: error
 220 | ignorecase: true
 221 | tokens:
 222 |   - he/she
 223 |   - s/he
 224 |   - \(s\)he
 225 |   - \bhe\b
 226 |   - \bhim\b
 227 |   - \bhis\b
 228 |   - \bshe\b
 229 |   - \bher\b
 230 | 
 231 | ----
 232 | Datadog/headings.yml
 233 | extends: capitalization
 234 | message: "'%s' should use sentence-style capitalization."
 235 | link: "https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#headers"
 236 | level: warning
 237 | scope: heading
 238 | match: $sentence
 239 | exceptions:
 240 |   - ACLs
 241 |   - ActiveMQ XML Integration
 242 |   - Agent
 243 |   - Agentless
 244 |   - Agents
 245 |   - Airflow
 246 |   - Amazon
 247 |   - Amazon Web Services
 248 |   - APCu
 249 |   - APIs
 250 |   - APM
 251 |   - Application Performance Monitoring
 252 |   - APM & Continuous Profiler
 253 |   - App Analytics
 254 |   - App Service
 255 |   - AppVeyor
 256 |   - Application Security Management
 257 |   - Application Vulnerability Management
 258 |   - AuthN
 259 |   - Autodiscovery
 260 |   - AWS Step Functions
 261 |   - AWS Systems Manager
 262 |   - Azure
 263 |   - Azure App Service
 264 |   - Azure App Service Plan
 265 |   - Azure Blob Storage
 266 |   - Azure Event Hub
 267 |   - Audit Trail
 268 |   - BitBucket
 269 |   - BuildKite
 270 |   - Browser Monitoring
 271 |   - CakePHP
 272 |   - Cassandra Nodetool
 273 |   - Cassandra Nodetool Integration
 274 |   - CentOS
 275 |   - Chef
 276 |   - CircleCI
 277 |   - CI/CD
 278 |   - CI Visibility
 279 |   - Clipboard
 280 |   - Cloud Cost Management
 281 |   - Cloud Pub Sub
 282 |   - Cloud Security Management
 283 |   - Cloud Security Posture Management
 284 |   - Cloud SIEM
 285 |   - Cloud Workload Security
 286 |   - CloudFormation
 287 |   - CloudSQL
 288 |   - CloudTrail
 289 |   - CloudWatch
 290 |   - Cluster Agent
 291 |   - Continuous Profiler
 292 |   - Continuous Testing
 293 |   - DaemonSet
 294 |   - Data Collected
 295 |   - Database Monitoring
 296 |   - Datadog
 297 |   - DatadogMetric
 298 |   - Datadog Agent Manager
 299 |   - Datadog for Government
 300 |   - Datadog Forwarder
 301 |   - Datadog Lambda Extension
 302 |   - Datadog Operator
 303 |   - Datadog Plugin
 304 |   - Datadog Watchdog
 305 |   - DatadogHook
 306 |   - Debian
 307 |   - Detection Rules
 308 |   - Docker
 309 |   - Docker Compose
 310 |   - Docker Swarm
 311 |   - Dockerfile
 312 |   - DogStatsD
 313 |   - Envoy
 314 |   - Fargate
 315 |   - FastCGI
 316 |   - Firehose Nozzle
 317 |   - FireLens
 318 |   - Fluent Bit
 319 |   - Fluentd
 320 |   - FreeBSD
 321 |   - FreeSwitch
 322 |   - Further Reading
 323 |   - GeoIP
 324 |   - Git
 325 |   - GitHub
 326 |   - GitHub Actions
 327 |   - GitLab
 328 |   - GitLab Runner Integration
 329 |   - Google
 330 |   - Google Analytics
 331 |   - Google Cloud
 332 |   - Google Cloud Functions
 333 |   - GraphQL
 334 |   - Gunicorn
 335 |   - HAProxy
 336 |   - HBase RegionServer Integration
 337 |   - HDFS DataNode Integration
 338 |   - HDFS NameNode Integration
 339 |   - Helm
 340 |   - Heroku
 341 |   - HipChat
 342 |   - HostPort
 343 |   - I
 344 |   - IdP
 345 |   - IDs
 346 |   - iLert
 347 |   - Incident Management
 348 |   - Infrastructure Monitoring
 349 |   - Ingress Controller
 350 |   - Internet Information Services
 351 |   - IoT
 352 |   - IPs
 353 |   - Java
 354 |   - JavaScript
 355 |   - JBoss
 356 |   - Jenkins
 357 |   - JFrog
 358 |   - JFrog Artifactory
 359 |   - Jira
 360 |   - JMXFetch
 361 |   - Journald
 362 |   - Kafka
 363 |   - Kafka Consumer Integration
 364 |   - Kubernetes
 365 |   - Kubernetes Engine
 366 |   - Kubernetes Pod
 367 |   - Kubernetes Service
 368 |   - Lambda
 369 |   - Lambda Layer
 370 |   - Lambda@Edge
 371 |   - LaunchDarkly
 372 |   - Linux
 373 |   - Live Analytics
 374 |   - Live Search
 375 |   - Live Tail
 376 |   - Log Explorer
 377 |   - Log Management
 378 |   - Log Rehydration
 379 |   - Logback
 380 |   - macOS
 381 |   - Marketplace
 382 |   - MarkLogic
 383 |   - Meraki
 384 |   - Mesos Slave Integration
 385 |   - Metrics Explorer
 386 |   - Metrics without Limits
 387 |   - Mobile Monitoring
 388 |   - MongoDB
 389 |   - MsTest
 390 |   - MySQL
 391 |   - Network Address Translation
 392 |   - Network Device Monitoring
 393 |   - Network Performance Monitoring
 394 |   - New Relic
 395 |   - NGINX Plus
 396 |   - NixOS
 397 |   - Node
 398 |   - Notebook
 399 |   - Notebook List
 400 |   - npm
 401 |   - NXLog
 402 |   - Observability Pipelines
 403 |   - OkHttp
 404 |   - OneLogin
 405 |   - OPcache
 406 |   - OpenLDAP
 407 |   - OpenMetrics
 408 |   - OpenShift
 409 |   - OpenStack
 410 |   - openSUSE
 411 |   - OpenTelemetry
 412 |   - OpenTracing
 413 |   - OpenVPN
 414 |   - OpsGenie
 415 |   - OpsWorks
 416 |   - Oracle Instant Client
 417 |   - Phusion Passenger
 418 |   - Pipeline Visibility
 419 |   - Pivotal Platform
 420 |   - Postgres
 421 |   - PostgreSQL
 422 |   - PowerDNS
 423 |   - Prometheus
 424 |   - Prometheus Alertmanager
 425 |   - Puppet
 426 |   - Python
 427 |   - RabbitMQ
 428 |   - Rails
 429 |   - Rancher
 430 |   - Real User Monitoring
 431 |   - Red Hat
 432 |   - Redis
 433 |   - ReplicaSet
 434 |   - RocketPants
 435 |   - Roku Monitoring
 436 |   - Root Cause Analysis
 437 |   - Route53
 438 |   - RSpec
 439 |   - Ruby
 440 |   - RUM
 441 |   - RumMonitor
 442 |   - SafeNet
 443 |   - SaltStack
 444 |   - Security Monitoring
 445 |   - Security Signal
 446 |   - Security Signals
 447 |   - SELinux
 448 |   - Sensitive Data Scanner
 449 |   - Serverless APM
 450 |   - Serverless Framework
 451 |   - Serverless Monitoring
 452 |   - Serverless Workload Monitoring
 453 |   - Service Checks
 454 |   - Session Replay
 455 |   - Siri
 456 |   - Slack
 457 |   - SLIs
 458 |   - SLOs
 459 |   - socat
 460 |   - Social Security
 461 |   - SQL Server
 462 |   - SQLDelight
 463 |   - SQLite
 464 |   - Stackdriver
 465 |   - StackPulse
 466 |   - StackStorm
 467 |   - StatsD
 468 |   - Sumo Logic
 469 |   - Swift
 470 |   - Synthetic Monitoring
 471 |   - Syslog
 472 |   - sysOID
 473 |   - System Core
 474 |   - System Swap
 475 |   - Teamcity
 476 |   - Terraform
 477 |   - Testing Visibility
 478 |   - TokuMX
 479 |   - Tracing Without Limits
 480 |   - Trello
 481 |   - Twilio
 482 |   - TypeScript
 483 |   - Ubuntu
 484 |   - Unified Service Tagging
 485 |   - Unix
 486 |   - Unix Domain Socket
 487 |   - URLs
 488 |   - User Datagram Protocol
 489 |   - USM
 490 |   - Universal Service Monitoring
 491 |   - Varnish
 492 |   - Vector
 493 |   - Vertica
 494 |   - VMWare
 495 |   - vSphere
 496 |   - Watchdog
 497 |   - Watchdog Insights
 498 |   - Webhook
 499 |   - WildFly
 500 |   - Windows
 501 |   - Xray
 502 |   - ZooKeeper
 503 | 
 504 | ----
 505 | Datadog/inclusive.yml
 506 | extends: substitution
 507 | message: "Use '%s' instead of '%s'."
 508 | link: "https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#inclusive-language"
 509 | ignorecase: true
 510 | level: error
 511 | action:
 512 |   name: replace
 513 | swap:
 514 |   # bad: good
 515 |   'black ?list': 'disallow list|exclude list'
 516 |   'master': primary
 517 |   'slave': secondary
 518 |   'white ?list': 'allow list|include list'
 519 | 
 520 | ----
 521 | Datadog/links.yml
 522 | extends: substitution
 523 | message: "Avoid vague text in links like '%s' unless you can pair it with more descriptive text."
 524 | link: 'https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#links'
 525 | ignorecase: true
 526 | scope: raw
 527 | nonword: true
 528 | level: warning
 529 | 
 530 | swap:
 531 | # For the word 'here' in Markdown and HTML links
 532 |   '\[here\]\(.*?\)': 'here'
 533 |   '<a\s*href\s*=\s*".*?".*?>\s*here\s*</a>': 'here'
 534 | 
 535 | # For the word 'this' in Markdown and HTML links
 536 |   '\[this\]\(.*?\)': 'this'
 537 |   '<a\s*href\s*=\s*".*?".*?>\s*this\s*</a>': 'this'
 538 | 
 539 | # For the word 'page' in Markdown and HTML links
 540 |   '\[page\]\(.*?\)': 'page'
 541 |   '<a\s*href\s*=\s*".*?".*?>\s*page\s*</a>': 'page'
 542 | 
 543 | # For the phrase 'this page' in Markdown and HTML links
 544 |   '\[this page\]\(.*?\)': 'this page'
 545 |   '<a\s*href\s*=\s*".*?".*?>\s*this page\s*</a>': 'this page'
 546 | ----
 547 | Datadog/oxfordcomma.yml
 548 | extends: existence
 549 | message: "Use the Oxford comma in '%s'."
 550 | link: "https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#commas"
 551 | scope: sentence
 552 | level: suggestion
 553 | tokens:
 554 |   - '(?:[^,]+,){1,}\s\w+\s(?:and|or)'
 555 | 
 556 | ----
 557 | Datadog/pronouns.yml
 558 | extends: existence
 559 | message: "Avoid first-person pronouns such as '%s'."
 560 | link: "https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#pronouns"
 561 | level: warning
 562 | nonword: true
 563 | tokens:
 564 |   - (?<=^|\s)I(?=\s)
 565 |   - (?<=^|\s)I,(?=\s)
 566 |   - \bI'm\b
 567 |   - (?<=\s)[Mm]e\b
 568 |   - (?<=\s)[Mm]y\b
 569 |   - (?<=\s)[Mm]ine\b
 570 |   - (?<=\s)[Ww]e\b
 571 |   - we'(?:ve|re)
 572 |   - (?<=\s)[Uu]s\b
 573 |   - (?<=\s)[Oo]ur\b
 574 |   - \blet's\b
 575 | 
 576 | ----
 577 | Datadog/quotes.yml
 578 | extends: existence
 579 | message: Use straight quotes instead of smart quotes.
 580 | level: error
 581 | nonword: true
 582 | action:
 583 | tokens:
 584 |   - “
 585 |   - ”
 586 |   - ‘
 587 |   - ’
 588 | ----
 589 | Datadog/sentencelength.yml
 590 | extends: occurrence
 591 | message: "Try to keep your sentence length to 25 words or fewer."
 592 | level: suggestion
 593 | # Here, we're counting the number of words
 594 | # in a sentence.
 595 | #
 596 | # If there are more than 25, we'll flag it.
 597 | scope: sentence
 598 | ignorecase: false
 599 | max: 25
 600 | token: (\w+)
 601 | ----
 602 | Datadog/spaces.yml
 603 | extends: existence
 604 | message: "Use only one space between words and sentences (not two)."
 605 | link: 'https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#spaces'
 606 | level: error
 607 | nonword: true
 608 | tokens:
 609 |   - '[\w.?!,\(\)\-":] {2,}[\w.?!,\(\)\-":]'
 610 | 
 611 | ----
 612 | Datadog/tense.yml
 613 | extends: existence
 614 | message: "Avoid temporal words like '%s'."
 615 | link: 'https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#tense'
 616 | ignorecase: true
 617 | level: warning
 618 | tokens:
 619 |   - currently
 620 |   - now
 621 |   - will
 622 |   - won't
 623 |   - "[a-zA-Z]*'ll"
 624 | 
 625 | ----
 626 | Datadog/time.yml
 627 | extends: existence
 628 | message: "Format times as 'HOUR:MINUTE a.m.' or HOUR:MINUTE p.m.' instead of '%s'."
 629 | link: "https://datadoghq.atlassian.net/wiki/spaces/WRIT/pages/2732523547/Style+guide#%s"
 630 | level: warning
 631 | nonword: true
 632 | tokens:
 633 |   - (1[012]|[1-9]):[0-5][0-9] (A\.M\.|P\.M\.)
 634 |   - (1[012]|[1-9]):[0-5][0-9] (?i)(a\.m[^\.]|p\.m[^\.])
 635 |   - (1[012]|[1-9]):[0-5][0-9][ ]?(?i)(am|pm)
 636 | 
 637 | ----
 638 | Datadog/words.yml
 639 | extends: substitution
 640 | message: "Use '%s' instead of '%s'."
 641 | link: "https://github.com/DataDog/documentation/blob/master/CONTRIBUTING.md#words-and-phrases"
 642 | ignorecase: false
 643 | level: warning
 644 | action:
 645 |   name: replace
 646 | swap:
 647 |   # bad: good
 648 |   a number of: few|several|many
 649 |   acknowledgement: acknowledgment
 650 |   App Analytics: Tracing without Limits™
 651 |   'auto(?:\s|-)complete': autocomplete
 652 |   'auto(?:\s|-)completion': autocompletion
 653 |   Availability Zone: availability zone
 654 |   Availability Zones: availability zones
 655 |   'back(?:\s|-)end': backend
 656 |   'back(?:\s|-)ends': backends
 657 |   bear in mind: keep in mind
 658 |   boolean: Boolean
 659 |   booleans: Booleans
 660 |   cheat sheet: cheatsheet
 661 |   command line interface: command-line interface
 662 |   Create a new: Create a|Create an
 663 |   culprit: cause
 664 |   data are: data is
 665 |   'data(?:\s|-)point': datapoint
 666 |   'data(?:\s|-)points': datapoints
 667 |   'data(?:\s|-)set': dataset
 668 |   'data(?:\s|-)sets': datasets
 669 |   data-?center: data center
 670 |   data-?centers: data centers
 671 |   'Datadog (?:app|application)': Datadog|Datadog site
 672 |   Datadog product: Datadog|Datadog service
 673 |   data-?source: data source
 674 |   data-?sources: data sources
 675 |   default (?:dash|screen)board: out-of-the-box dashboard
 676 |   default (?:dash|screen)boards: out-of-the-box dashboards
 677 |   (?:Dev/?ops|dev/?ops|Dev/Ops): DevOps|DevSecOps
 678 |   'drill (?:down|into)': examine|investigate|analyze
 679 |   'drilling (?:down|into)': examining|investigating|analyzing
 680 |   Distributed Tracing: distributed tracing
 681 |   (?:easy|easily): ''
 682 |   e-?book: eBook
 683 |   e-?books: eBooks
 684 |   e-mail: email
 685 |   e-mailing: emailing
 686 |   e-mails: emails
 687 |   'end(?:\s|-)point': endpoint
 688 |   'end(?:\s|-)points': endpoints
 689 |   event (?:stream|streem): Event Stream
 690 |   flame-?graph: flame graph
 691 |   flame-?graphs: flame graphs
 692 |   figure out: determine
 693 |   figuring out: determining
 694 |   'file(?:\s|-)name': filename
 695 |   'file(?:\s|-)names': filenames
 696 |   filesystem: file system
 697 |   filesystems: file systems
 698 |   'fine\s?-?tune': customize|optimize|refine
 699 |   for the most part: generally|usually
 700 |   'front(?:\s|-)end': frontend
 701 |   health-?check: heath check
 702 |   health-?checks: heath checks
 703 |   (?:heat-?map|Heat Map): heat map
 704 |   (?:heat-?maps|Heat Maps): heat maps
 705 |   (?:host-?map|Host Map): host map
 706 |   (?:host-?maps|Host Maps): host maps
 707 |   hone in: home in
 708 |   hones in: homes in
 709 |   honing in: homing in
 710 |   highly: ''
 711 |   hit: click|select
 712 |   in order to: to
 713 |   in sync: in-sync
 714 |   In sync: In-sync
 715 |   indices: indexes
 716 |   indexation: indexing
 717 |   infrastructures: infrastructure
 718 |   install command: installation command
 719 |   Internet: internet
 720 |   (?:i/?-?o|I-?O): I/O
 721 |   (?:i/?ops|I/OPS): IOPS
 722 |   just: ''
 723 |   keep in mind: consider
 724 |   left up to: determined by
 725 |   let's assume: assuming|for example, if
 726 |   load-?balancing: load balancing
 727 |   machine-?learning: machine learning
 728 |   'micro(?:\s|-)service': microservice
 729 |   'micro(?:\s|-)services': microservices
 730 |   multi-?alert: multi alert
 731 |   multicloud: multi-cloud
 732 |   multiline: multi-line
 733 |   Note that: "**Note**:"
 734 |   (?:obvious|obviously|Obviously): ''
 735 |   off-line: offline
 736 |   on the fly: real-time|in real time
 737 |   Once: After
 738 |   open-?source: open source
 739 |   page view: pageview
 740 |   page views: pageviews
 741 |   play a hand: influence
 742 |   please: ''
 743 |   pre-connect: preconnect
 744 |   quick|quickly: ''
 745 |   'screen(?:\s|-)board': screenboard
 746 |   simple|simply: ''
 747 |   single pane of glass: single view|single place|single page
 748 |   slice and dice: filter and group
 749 |   stand for: represent|mean
 750 |   Synthetics: Synthetic Monitoring
 751 |   reenable: re-enable
 752 |   'run(?:\s|-)time': runtime
 753 |   refer to|visit: see|read|follow
 754 |   time board: timeboard
 755 |   'time(?:\s|-)series': timeseries
 756 |   time-?frame: time frame
 757 |   time-?frames: time frames
 758 |   top-?list: top list
 759 |   'trade(?:\s|-)off': trade-off
 760 |   Trace Search and Analytics: Tracing without Limits™
 761 |   turnkey: ready to use
 762 |   under the hood: ''
 763 |   utilize: use
 764 |   very: ''
 765 |   via: with|through
 766 |   visit: see|read
 767 |   webserver: web server
 768 |   web site: website
 769 |   'X-axis': x-axis
 770 |   'Y-axis': y-axis
 771 | 
 772 |   # proper nouns
 773 |   (?:github|Github): GitHub
 774 |   (?:kubernetes|k8s|K8s|K8S): Kubernetes
 775 |   (?:Mapreduce|mapreduce|Map reduce|Map Reduce): MapReduce
 776 |   memcached: Memcached
 777 |   (?:nginx|Nginx): NGINX
 778 |   (?:node.js|nodeJS|NodeJS|node.JS|Node.JS): Node.js
 779 |   (?:pagerduty|pager duty|Pagerduty|Pager duty): PagerDuty
 780 |   prometheus: Prometheus
 781 |   (?:sql|Sql): SQL
 782 |   (?:statsd|statsD|Statsd): StatsD
 783 |   (?:unix|Unix): UNIX
 784 | 
 785 | 
 786 | ----
 787 | SIEM-Names/namecase.yml
 788 | extends: capitalization
 789 | message: Rule names should use sentence case
 790 | level: error
 791 | match: $sentence
 792 | exceptions:
 793 |   - 1Password
 794 |   - Advanced Protection
 795 |   - Autoscaling Group
 796 |   - Amazon EC2 Instance
 797 |   - Amazon S3
 798 |   - API calls
 799 |   - Auth0 Attack Protection
 800 |   - Auth0 Breached Password Detection
 801 |   - Auth0 Brute Force Protection
 802 |   - Auth0 Guardian MFA
 803 |   - Auth0 Suspicious IP Throttling
 804 |   - AWS Cloudtrail GetCallerIdentity
 805 |   - AWS DescribeInstances
 806 |   - AWS IAM User created with AdministratorAccess policy attached
 807 |   - AWS ConsoleLogin
 808 |   - AWS Console login without MFA
 809 |   - AWS GuardDuty
 810 |   - AWS IAM Roles Anywhere
 811 |   - AWS Kinesis Firehose
 812 |   - AWS Lambda
 813 |   - AWS Network Gateway
 814 |   - AWS Secrets Manager
 815 |   - AWS Systems Manager
 816 |   - AWS Verified Access
 817 |   - AWS VPC Flow Log
 818 |   - Azure Active Directory
 819 |   - Azure AD Identity Protection
 820 |   - Azure AD Privileged Identity Management
 821 |   - CloudTrail
 822 |   - Cloudflare
 823 |   - Cloudflare CASB Finding
 824 |   - Cloudflare L7 DDOS
 825 |   - Crowdstrike Alerts
 826 |   - Enterprise Organization
 827 |   - GitHub
 828 |   - GitHub Advanced Security
 829 |   - GitHub Dependabot
 830 |   - GitHub Personal Access Token
 831 |   - GitHub Secret Scanning
 832 |   - Google App Engine
 833 |   - Google Cloud
 834 |   - Google Cloud IAM Role updated
 835 |   - Google Cloud Storage
 836 |   - Google Cloud Storage Bucket
 837 |   - Google Compute
 838 |   - Google Compute Engine
 839 |   - Google Drive
 840 |   - Google Security Command Center
 841 |   - Google Workspace
 842 |   - IdP configuration changed
 843 |   - Impossible Travel Auth0
 844 |   - IoC
 845 |   - Jamf Protect
 846 |   - Microsoft 365 Application Impersonation
 847 |   - Microsoft 365 Default or Anonymous
 848 |   - Microsoft 365 E-Discovery
 849 |   - Microsoft 365 Exchange
 850 |   - Microsoft 365 Full Access
 851 |   - Microsoft 365 Inbound Connector
 852 |   - Microsoft 365 OneDrive
 853 |   - Microsoft 365 Security and Compliance
 854 |   - Microsoft 365 SendAs
 855 |   - Microsoft Defender for Cloud
 856 |   - Microsoft Intune Enterprise MDM
 857 |   - Microsoft Teams
 858 |   - Okta
 859 |   - Okta Identity Provider
 860 |   - Palo Alto Networks Firewall
 861 |   - RDS Snapshot
 862 |   - Scout Suite
 863 |   - Sqreen
 864 |   - Tor
 865 |   - TruffleHog
 866 |   - Zendesk Automatic Redaction
 867 | 
 868 | ----
 869 | Vocab/Security/accept.txt
 870 | SELinux
 871 | Passwd
 872 | Cryptocurrency
 873 | AppArmor
 874 | Dirty Pipe
 875 | Name Service Switch
 876 | Remote Desktop
 877 | ----
 878 | Vocab/Security/reject.txt
 879 | ```
 880 | 
 881 | And here is the style guide in Markdown format:
 882 | 
 883 | ```
 884 | # Style Guide for Documentation Site
 885 | 
 886 | This document is a guide to writing and editing documentation for the [Datadog Documentation site][7] (Docs site). Treat this as a guide rather than a rulebook. You should strive to follow what's prescribed, but there are exceptions to most rules.
 887 | 
 888 | Some of these guidelines are enforced by [the Datadog docs implementation of the Vale linter][4]. After you make a PR, check its **Files changed** tab to see and fix warnings and errors flagged by the linter.
 889 | 
 890 | ## Language
 891 | 
 892 | - Use the American English **en_US** dialect when writing documentation, code comments, [wiki entries][1], and more in the English language. This is the default language for all `*.md` files.
 893 | - Don't contribute updates to the translated content (fr, ja, ko, es), as the content in GitHub is not the managed source. If there is a mistake in the English source file, fix the English source file. If the mistake is only in the translated version, let us know and we will get it addressed in the source.
 894 | 
 895 | ## General principles
 896 | 
 897 | ### Style and tone
 898 | 
 899 | The purpose of the Docs site is to clearly inform readers about how to use Datadog. The Docs site is NOT intended to:
 900 | 
 901 | - Sell or market Datadog
 902 | - Make the reader feel nice. When you must choose between politeness and clarity, choose clarity.
 903 | - Impress the reader with fancy words and drawn out sentences.
 904 | 
 905 | ### Content
 906 | 
 907 | **Be plain and direct**: Say exactly what you mean using plain speech. Don't leave the reader guessing.
 908 | - **Recommended**: This integration does NOT help you forward application metrics from StatsD servers to Datadog; to do that, configure your StatsD server to forward metrics to DogStatsD.
 909 | - **Not recommended**: Please note the Datadog Agent includes DogStatsD, which serves as a StatsD forwarder. This integration is intended for monitoring external StatsD servers, and is not needed to send metrics to Datadog using the StatsD protocol.
 910 | 
 911 | **Be concise**: Omit needless words. Less is more:
 912 | - **Recommended**: This integration monitors the health and availability of a StatsD server.
 913 | - **Not recommended**: This integration offers you the ability to monitor the health and availability of a StatsD server.
 914 | - **Recommended**: The `ddtrace` library supports several web frameworks.
 915 | - **Not recommended**: The `ddtrace` library includes support for a number of web frameworks.
 916 | 
 917 | **Treat the reader as an equal**: Assume the reader is knowledgeable. Datadog has a technical audience, so don't spend too many words on something that's fairly common knowledge, for example, the meaning of `p95`. Likewise, don't assume the reader is clairvoyant—that's why they're reading docs. Avoid hedging statements and disclaimers, such as "As you probably know..."
 918 | 
 919 | **Provide examples**: Don't make an abstract statement and then leave the reader guessing.
 920 | - **Recommended**: "Often, two monitors grouped by different tags have reporting sources whose tag values never overlap, for example, `web04` and `web05` for a monitor grouped by host, or `dev` and `prod` for a monitor grouped by environment."
 921 | - **Not recommended**: "Often, two monitors grouped by different tags have reporting sources whose tag values never overlap."
 922 | 
 923 | **Be imperative, not beckoning**: When leading into a discussion of a feature, phrases like "you can" are ok, but when you finally get to the step-by-step instructions, command the reader:
 924 | - **Recommended**: Configure this thing. Optionally, configure that thing.
 925 | - **Not recommended**: You must configure this thing, and you may want to configure that thing.
 926 | 
 927 | **Don't wax philosophical**: Think pieces and pontification don't belong on the Docs site.
 928 | 
 929 | **Don't constantly explain basic Datadog features**: Outside of introductory material, don't tell readers again and again that metrics submitted to Datadog may be graphed alongside other metrics, have events overlaid onto them, etc. It's okay to point out cases that are compelling and specific, such as "Overlay Jenkins deploys onto a graph of your application response times", but don't re-explain Datadog; instead, provide a useful description that enhances understanding of the feature.
 930 | 
 931 | **Don't refer to multi-part integrations as a singular thing**: For multi-component integrations-especially those whose components are not interdependent-do not refer vaguely to "the integration".
 932 | - **Recommended**: [describe which component]: Installing the Datadog Agent BOSH release could increase the number of VMs...
 933 | - **OK**: Integrating with Cloud Foundry could increase the number of VMs...
 934 | - **Not recommended**: Installing the Cloud Foundry Integration could increase the number of VMs...
 935 | 
 936 | ## Wording and grammar
 937 | 
 938 | ### Abbreviations
 939 | 
 940 | Avoid using Latin abbreviations "i.e." or "e.g.". Use "that is" or "for example" instead.
 941 | 
 942 | ### Active voice
 943 | 
 944 | Avoid using passive voice in favor of active voice. If you think your sentence is in the passive voice, add the phrase "by zombies". If it still makes grammatical sense, it's in the passive voice. For example, "metrics are sent to the Datadog Agent `by zombies`"
 945 | - **Recommended**: "With infrastructure monitoring, the Datadog Agent receives metrics and forwards them to Datadog. Similarly, the Datadog Agent can also receive tracing metrics."
 946 | - **Not recommended**: "With Datadog infrastructure monitoring, metrics are sent to the Datadog Agent, which then forwards them to Datadog. Similarly, tracing metrics are also sent to the Datadog Agent."
 947 | 
 948 | ### Inclusive language
 949 | 
 950 | Use inclusive language unless you are referencing third-party technologies such as Redis' master/slave nodes. The Datadog docs follow the inclusive language best practices described in the [Terminology, Power and Inclusive Language](https://datatracker.ietf.org/doc/draft-knodel-terminology) document from the Center for Democracy & Technology.
 951 | - **Recommended**: "Primary/secondary, disallowlist/allowlist"
 952 | - **Not recommended**: "Master/slave, blacklist/whitelist"
 953 | 
 954 | ### Pronouns
 955 | 
 956 | #### Gender
 957 | 
 958 | Use gender-neutral pronouns as appropriate. Avoid using "he", "him", "his", "she", and "her". Also avoid using combination pronouns such as "he/she" or "(s)he" or similar. Use "they" or "them" instead.
 959 | 
 960 | #### First and second person pronouns
 961 | 
 962 | Avoid first-person pronouns such as "I", "me", "mine", "we", "us", and "our". Use second-person pronouns "you" and "your" (often implied).
 963 | - **Recommended**: Datadog APM is included in Enterprise plans or as an upgrade from Pro plans. If you have a Pro plan, visit the APM page in Datadog to begin a free 14-day trial.
 964 | - **Not recommended**: Datadog APM is included in our Enterprise plan or as an upgrade to our Pro plan. Pro plan members can visit the APM page in Datadog to begin a free 14-day trial.
 965 | 
 966 | Adding "You can" to the start of an instruction changes it to a suggestion. Be intentional about your use of each kind of sentence:
 967 | - **Instruction**: Change the environment variable value in your `datadog.yaml` file.
 968 | - **Suggestion**: You can change the environment variable value in your `datadog.yaml` file.
 969 | 
 970 | Don't overuse "your" when talking about the items a person interacts with when using Datadog. "Your infrastructure" is okay in moderation. Too much "your Agent" or "your application" is overly familiar. Try "the" instead and see if it works just as well.
 971 | 
 972 | ### Tense
 973 | 
 974 | Avoid temporal words like "currently", "now", "will", etc. Describe the present state of the product.
 975 | - **Recommended**: "Once you enable the integration, the Agent starts sending metrics to Datadog."
 976 | - **Not recommended**: "Once you enable the integration, the Agent will start sending metrics to Datadog."
 977 | - **Recommended**: You can add up to 10 monitors in a composite monitor.
 978 | - **Not recommended**: Currently, you can add up to 10 monitors in a composite monitor (more will be supported in the future).
 979 | - **Recommended**: You can add up to 20 monitors in a composite monitor.
 980 | - **Not recommended**: You can now add up to 20 monitors in a composite monitor.
 981 | 
 982 | **Note**: When Datadog implements or deprecates a major feature, it's good to point it out, for example: "The `docker` check replaces the `docker_daemon` check beginning with Agent version X.Y.Z.".
 983 | 
 984 | ### Words and phrases
 985 | 
 986 | The [datadog-vale][4] repo contains a set of linting rules for Vale based on the Documentation Style Guide. You can refer to the rules when writing for the Docs site.
 987 | 
 988 | Otherwise, here are some words and phrases to avoid or use sparingly:
 989 | 
 990 | | Word to avoid        | Workaround                                                                                 |
 991 | |----------------------|--------------------------------------------------------------------------------------------|
 992 | | Refer to/visit       | When preceding a link; use "See" or "Read"                                                 |
 993 | | A number of          | This is vague. Slightly less vague: "a few", "several", "many".                            |
 994 | | [in the] Datadog app | No need for the definite article; use "[in] Datadog".                                      |
 995 | | Product              | When referencing Datadog (e.g. "the Datadog product"), omit it or use "service"            |
 996 | | Please               | There's no reason to plead with the reader; maybe they'll read the docs, maybe they won't. |
 997 | | Utilize              | Don't utilize utilize when you can use use.                                                |
 998 | 
 999 | #### RFC 2119
1000 | 
1001 | The key words "MUST", "MUST NOT", "REQUIRED", "SHALL", "SHALL NOT", "SHOULD", "SHOULD NOT", "RECOMMENDED", "MAY", and "OPTIONAL" in the documentation are to be interpreted as described in [RFC 2119][2]. When writing in languages other than English, a best-effort must be made to adhere to this RFC.
1002 | 
1003 | #### RFC 2606
1004 | 
1005 | A top level domain (TLD) in an example must reference a TLD permanently reserved for such purposes. As described in [RFC 2606][3] four TLD names are reserved:
1006 | - `.test`
1007 | - `.example`
1008 | - `.invalid`
1009 | - `.localhost`
1010 | 
1011 | Same goes for second level domain names, three are reserved:
1012 | - `example.com`
1013 | - `example.net`
1014 | - `example.org`
1015 | 
1016 | ## Punctuation
1017 | 
1018 | This section sets the record straight (for the Docs site, not for all humankind) on grammar and punctuation details that are often a matter of subjective preference.
1019 | 
1020 | ### Commas
1021 | 
1022 | Use the Oxford/Harvard/serial comma:
1023 | - **Recommended**: "Metrics, events, and service checks."
1024 | - **Not recommended**: "Metrics, events and service checks".
1025 | 
1026 | ### Dashes
1027 | 
1028 | Use the em dash (—) with no spaces between adjacent words
1029 | - **Recommended**: "The rest—Ok, Skipped, and No Data—are not alert-worthy."
1030 | - **Not recommended**: "The rest - Ok, Skipped, and No Data - are not alert-worthy".
1031 | 
1032 | ### Spaces
1033 | 
1034 | Only one space between sentences (not two).
1035 | 
1036 | ## Formatting
1037 | 
1038 | ### Code substitution
1039 | 
1040 | When adding something to a code block that isn't meant literally, use the format `<DATADOG_API_KEY>`. _Don't_ use `$DATADOG_API_KEY`, `{DATADOG API KEY}`, or `DATADOG_API_KEY`.
1041 | 
1042 | ### Headers
1043 | 
1044 | | Level                    | Case          |
1045 | |--------------------------|---------------|
1046 | | `<h1>` / `# Header`      | Title Case    |
1047 | | `<h2>` / `## Header`     | Sentence case |
1048 | | `<h3>` / `### Header`    | Sentence case |
1049 | | `<h4>` / `#### Header`   | Sentence case |
1050 | | `<h5>` / `##### Header`  | Sentence case |
1051 | | `<h6>` / `###### Header` | Sentence case |
1052 | 
1053 | ### Images
1054 | 
1055 | Images are displayed on the full width of a page by default. If your image doesn't need to be that large, use the `style="width:XX%;"` parameter within the image partial to scale the image proportionally.
1056 | 
1057 | See the documentation wiki to learn more about [image partials][6].
1058 | 
1059 | ### Links
1060 | 
1061 | Format links using numbered [reference-style links][8], and use relative paths for other pages published on the documentation site. For example, instead of embedding the URL directly in the text, write `read the [Getting Started with Azure][1]` and define the link reference at the bottom of the file like `[1]: /getting_started/azure/`.
1062 | 
1063 | Avoid vague link text, let readers know where you're sending them. Any sentence containing a link should read just as well if it didn't have the link.
1064 | - **Recommended**: To learn more about tagging, see the `[Guide to Tagging]`.
1065 | - **Not recommended**: To learn more about tagging, see `[here]`.
1066 | 
1067 | ### Numbers
1068 | 
1069 | Use words for single digit numbers (zero through nine). Use numbers for multiple digit numbers (10 and above), decimals (0.9, 1.5, 10.3, etc.), and percents (1%, 1.5%, 10%, etc.). Do not use commas in four figure numbers, for example, `5000`.
1070 | 
1071 | ### Text
1072 | 
1073 | Use text formatting to clarify and enhance content.
1074 | 
1075 | | Formatting        | Rule                                                                                                           | Example                                               |
1076 | |-------------------|----------------------------------------------------------------------------------------------------------------|-------------------------------------------------------|
1077 | | `` `backquote` `` | Used for code related content within a sentence.                                                               | Use the `foo` parameter                               |
1078 | | `**Bold**`        | Subjectively pointing the reader to something important.                                                       | **This is important**, not that.                      |
1079 | | `_Italic_`        | Literally translated words, default values, functions, settings, and page names.                               | Go to the *setting* page in your Datadog application |
1080 | | `[Link][3]`       | Links must be specified using the reference format (in the footnote) to aid with the [translation process][5]. | Text with `[a link][1]`                               |
1081 | 
1082 | 
1083 | [1]: https://github.com/DataDog/documentation/wiki
1084 | [2]: https://tools.ietf.org/html/rfc2119
1085 | [3]: https://tools.ietf.org/html/rfc2606
1086 | [4]: https://github.com/DataDog/datadog-vale
1087 | [5]: https://github.com/DataDog/documentation/wiki/Translations-Overview
1088 | [6]: https://github.com/DataDog/documentation/wiki/Import-an-Image-or-a-mp4-video
1089 | [7]: https://docs.datadoghq.com/
1090 | [8]: https://www.markdownguide.org/basic-syntax/#reference-style-links
1091 | ```
1092 | 
1093 | When reviewing the technical document, follow these steps:
1094 | 
1095 | 1. Read the entire document carefully.
1096 | 2. Identify any issues related to standard English, correctness, markdown syntax, clarity, grammar, or style guide violations.
1097 | 3. Do not flag or attempt to correct any of the following:
1098 |    a. Parameters in Markdown shortcodes ( e.g. `{{< callout url="#" btn_hidden="true" header="Try the beta!" >}}`).
1099 |    b. Parameters in front matter (e.g. `further_reading:`).
1100 |    c. HTML tag attributes (e.g. `<div class="alert alert-warning">`).
1101 | 4. Review and potentially flag the content within the HTML tags, not the tags themselves or the attributes.
1102 | 5. For each issue, provide a description, a suggestion for improvement, and any additional comments or context.
1103 | 6. Consider other ways to improve the document while adhering to the style guide.
1104 | 
1105 | IMPORTANT: Your output should be in Markdown format with the following structure, and nothing else. It must strictly adhere to the structure below. Ignore the backticks, they're just there to show you the structure. Do not include backticks in your output.
1106 | 
1107 | ```
1108 | # Review
1109 | 
1110 | ## Issues
1111 | 
1112 | ### Issue 1
1113 | 
1114 |   - **Description:** Description of issue 1.
1115 |   - **Suggestion:** Suggested fix for issue 1.
1116 |   - **Comment:** Additional context or comments on issue 1.
1117 | 
1118 | ### Issue 2
1119 | 
1120 |   - **Description:** Description of issue 2.
1121 |   - **Suggestion:** Suggested fix for issue 2
1122 |   - **Comment:** Additional context or comments on issue 2
1123 | 
1124 | ## Summary
1125 | 
1126 | Summary of the overall quality of the technical documentation.
1127 | 
1128 | ## Score
1129 | 
1130 | 1-5
1131 | ```
1132 | 
1133 | It's SUPER IMPORTANT to the user that the output adhere to this structure as they're under a LOT of pressure at work. Do not output anything else.
1134 | 
1135 | After your detailed review, provide an overall summary of the quality of the technical documentation under the summary section. Discuss the main strengths and weaknesses you found. At the end of the summary, give the documentation a score of 1 to 5, where 1 indicates poor quality and 5 indicates excellent quality that fully meets or exceeds the style guide requirements. Provide the score under the score section.
1136 | 
1137 | Important notes:
1138 | 
1139 | - ALWAYS provide your review in the exact format specified above.
1140 | - Include as many issues as necessary, following the numbering pattern (Issue 1, Issue 2, etc.).
1141 | - If there are no issues, still include the "Issues" section with a single entry stating that no issues were found.
1142 | - Ensure that your suggestions and comments align with Datadog's style guide.
1143 | - Be concise but thorough in your descriptions, suggestions, and comments.
1144 | - When assigning a score, consider the overall quality, adherence to the style guide, and the number and severity of issues found.
1145 | 
1146 | Please be thorough and detailed in your review, but also helpful and constructive with your feedback and suggestions. The goal is to work with the author to iteratively improve the documentation until it's of a very high standard.
1147 | 


--------------------------------------------------------------------------------
/internal/prompt/prompt.go:
--------------------------------------------------------------------------------
 1 | // Unless explicitly stated otherwise all files in this repository are licensed
 2 | // under the Apache-2.0 License. This product includes software developed at
 3 | // Datadog (https://www.datadoghq.com/).
 4 | // Copyright 2024-Present Datadog, Inc.
 5 | 
 6 | // Package prompt holds prompts to be used by AI.
 7 | package prompt
 8 | 
 9 | import (
10 | 	_ "embed"
11 | )
12 | 
13 | //go:embed data/review-prompt.txt
14 | var MarkdownPrompt string
15 | 
16 | //go:embed data/describe-prompt.txt
17 | var DescribePrompt string
18 | 
19 | //go:embed data/draft-prompt.txt
20 | var DraftPrompt string
21 | 


--------------------------------------------------------------------------------
/internal/validate/validate.go:
--------------------------------------------------------------------------------
 1 | // Unless explicitly stated otherwise all files in this repository are licensed
 2 | // under the Apache-2.0 License. This product includes software developed at
 3 | // Datadog (https://www.datadoghq.com/).
 4 | // Copyright 2024-Present Datadog, Inc.
 5 | 
 6 | // Package validate contains functions and utilities for validating input data.
 7 | package validate
 8 | 
 9 | import (
10 | 	"path/filepath"
11 | 	"strings"
12 | )
13 | 
14 | // Filetype validates that the given file is of the correct type.
15 | func Filetype(file string, allowedTypes []string) bool {
16 | 	filetype := filepath.Ext(file)
17 | 	filetype = strings.ToLower(filetype)
18 | 
19 | 	if filetype != "" {
20 | 		filetype = filetype[1:]
21 | 	}
22 | 
23 | 	for _, allowed := range allowedTypes {
24 | 		if filetype == allowed {
25 | 			return true
26 | 		}
27 | 	}
28 | 
29 | 	return false
30 | }
31 | 
32 | // Key validates that the given API key is of the correct format.
33 | func Key(key string) bool {
34 | 	if len(key) < 51 {
35 | 		return false
36 | 	}
37 | 
38 | 	if !strings.HasPrefix(key, "sk-") {
39 | 		return false
40 | 	}
41 | 
42 | 	return true
43 | }
44 | 


--------------------------------------------------------------------------------
/internal/validate/validate_test.go:
--------------------------------------------------------------------------------
 1 | // Unless explicitly stated otherwise all files in this repository are licensed
 2 | // under the Apache-2.0 License. This product includes software developed at
 3 | // Datadog (https://www.datadoghq.com/).
 4 | // Copyright 2024-Present Datadog, Inc.
 5 | 
 6 | package validate_test
 7 | 
 8 | import (
 9 | 	"testing"
10 | 
11 | 	"github.com/DataDog/documentor/internal/validate"
12 | )
13 | 
14 | func TestFiletype(t *testing.T) {
15 | 	t.Parallel()
16 | 
17 | 	tests := []struct {
18 | 		name          string
19 | 		giveFile      string
20 | 		giveFiletypes []string
21 | 		want          bool
22 | 	}{
23 | 		{
24 | 			name:          "valid file type",
25 | 			giveFile:      "test.jpg",
26 | 			giveFiletypes: []string{"jpg", "jpeg"},
27 | 			want:          true,
28 | 		},
29 | 		{
30 | 			name:          "invalid file type",
31 | 			giveFile:      "test.jpg",
32 | 			giveFiletypes: []string{"png", "gif"},
33 | 			want:          false,
34 | 		},
35 | 		{
36 | 			name:          "no file type",
37 | 			giveFile:      "test",
38 | 			giveFiletypes: []string{"jpg", "jpeg"},
39 | 			want:          false,
40 | 		},
41 | 	}
42 | 
43 | 	for _, tt := range tests {
44 | 		t.Run(tt.name, func(t *testing.T) {
45 | 			t.Parallel()
46 | 
47 | 			got := validate.Filetype(tt.giveFile, tt.giveFiletypes)
48 | 			if got != tt.want {
49 | 				t.Fatalf("want %v, got %v", tt.want, got)
50 | 			}
51 | 		})
52 | 	}
53 | }
54 | 
55 | func TestKey(t *testing.T) {
56 | 	t.Parallel()
57 | 
58 | 	tests := []struct {
59 | 		name    string
60 | 		giveKey string
61 | 		want    bool
62 | 	}{
63 | 		{
64 | 			name:    "valid key",
65 | 			giveKey: "sk-123456789123456789123456789123456789123456789123",
66 | 			want:    true,
67 | 		},
68 | 		{
69 | 			name:    "invalid key with invalid prefix",
70 | 			giveKey: "ak-123456789123456789123456789123456789123456789123",
71 | 			want:    false,
72 | 		},
73 | 		{
74 | 			name:    "invalid key with invalid length",
75 | 			giveKey: "sk-123456789",
76 | 			want:    false,
77 | 		},
78 | 	}
79 | 
80 | 	for _, tt := range tests {
81 | 		t.Run(tt.name, func(t *testing.T) {
82 | 			t.Parallel()
83 | 
84 | 			got := validate.Key(tt.giveKey)
85 | 			if got != tt.want {
86 | 				t.Fatalf("want %v, got %v", tt.want, got)
87 | 			}
88 | 		})
89 | 	}
90 | }
91 | 


--------------------------------------------------------------------------------
/internal/xbase64/testdata/dot.gif:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/DataDog/documentor/e57ad205b8b6945e6c8226d29a0f730df226f426/internal/xbase64/testdata/dot.gif


--------------------------------------------------------------------------------
/internal/xbase64/xbase64.go:
--------------------------------------------------------------------------------
 1 | // Unless explicitly stated otherwise all files in this repository are licensed
 2 | // under the Apache-2.0 License. This product includes software developed at
 3 | // Datadog (https://www.datadoghq.com/).
 4 | // Copyright 2024-Present Datadog, Inc.
 5 | 
 6 | // Package xbase64 extends Go's base64 package.
 7 | package xbase64
 8 | 
 9 | import (
10 | 	"encoding/base64"
11 | )
12 | 
13 | // EncodeImageToDataURL encodes the given image data as a base64 data URL. It'll
14 | // always assume JPG because the OpenAI API doesn't seem to care.
15 | func EncodeImageToDataURL(data []byte) string {
16 | 	base := base64.StdEncoding.EncodeToString(data)
17 | 
18 | 	return "data:image/jpeg;base64," + base
19 | }
20 | 


--------------------------------------------------------------------------------
/internal/xbase64/xbase64_test.go:
--------------------------------------------------------------------------------
 1 | // Unless explicitly stated otherwise all files in this repository are licensed
 2 | // under the Apache-2.0 License. This product includes software developed at
 3 | // Datadog (https://www.datadoghq.com/).
 4 | // Copyright 2024-Present Datadog, Inc.
 5 | 
 6 | package xbase64_test
 7 | 
 8 | import (
 9 | 	"encoding/base64"
10 | 	"os"
11 | 	"path/filepath"
12 | 	"testing"
13 | 
14 | 	"github.com/DataDog/documentor/internal/xbase64"
15 | )
16 | 
17 | func TestEncodeImageToDataURL(t *testing.T) {
18 | 	t.Parallel()
19 | 
20 | 	testImagePath := filepath.Join("testdata", "dot.gif")
21 | 
22 | 	data, err := os.ReadFile(testImagePath)
23 | 	if err != nil {
24 | 		t.Fatalf("failed to read test image: %v", err)
25 | 	}
26 | 
27 | 	// Manually encode the image to base64 for a valid test case.
28 | 	var (
29 | 		encodedImage    = base64.StdEncoding.EncodeToString(data)
30 | 		expectedDataURL = "data:image/jpeg;base64," + encodedImage
31 | 	)
32 | 
33 | 	tests := []struct {
34 | 		name string
35 | 		give []byte
36 | 		want string
37 | 	}{
38 | 		{
39 | 			name: "Valid Image Data",
40 | 			give: data,
41 | 			want: expectedDataURL,
42 | 		},
43 | 		{
44 | 			name: "Empty Data",
45 | 			give: make([]byte, 0),
46 | 			want: "data:image/jpeg;base64,",
47 | 		},
48 | 	}
49 | 
50 | 	for _, tt := range tests {
51 | 		t.Run(tt.name, func(t *testing.T) {
52 | 			t.Parallel()
53 | 
54 | 			got := xbase64.EncodeImageToDataURL(tt.give)
55 | 			if got != tt.want {
56 | 				t.Fatalf("EncodeImageToDataURL() = %v, want %v", got, tt.want)
57 | 			}
58 | 		})
59 | 	}
60 | }
61 | 


--------------------------------------------------------------------------------
/license-3rdparty.tpl:
--------------------------------------------------------------------------------
1 | Origin,License,"License URL",Copyright{{ range . }}
2 | {{ .Name }},{{ .LicenseName }},{{ .LicenseURL }}{{ end }}
3 | 


--------------------------------------------------------------------------------
/main.go:
--------------------------------------------------------------------------------
 1 | // Unless explicitly stated otherwise all files in this repository are licensed
 2 | // under the Apache-2.0 License. This product includes software developed at
 3 | // Datadog (https://www.datadoghq.com/).
 4 | // Copyright 2024-Present Datadog, Inc.
 5 | 
 6 | package main
 7 | 
 8 | import (
 9 | 	"os"
10 | 
11 | 	"github.com/DataDog/documentor/internal/app"
12 | )
13 | 
14 | func main() {
15 | 	os.Exit(app.Run(os.Args))
16 | }
17 | 


--------------------------------------------------------------------------------