├── .dockerignore ├── .github ├── dependabot.yml └── workflows │ ├── llama-cpp-rs-check.yml │ ├── publish-upon-release.yml │ ├── update-llama-cpp.yml │ └── update-toml-version.yaml ├── .gitignore ├── .gitmodules ├── Cargo.lock ├── Cargo.toml ├── LICENSE-APACHE ├── LICENSE-MIT ├── README.md ├── examples ├── embeddings │ ├── Cargo.toml │ └── src │ │ └── main.rs ├── mtmd │ ├── Cargo.toml │ ├── README.md │ └── src │ │ └── mtmd.rs ├── reranker │ ├── Cargo.toml │ ├── README.md │ └── src │ │ └── main.rs ├── simple │ ├── Cargo.toml │ └── src │ │ └── main.rs └── usage.rs ├── llama-cpp-2 ├── Cargo.toml ├── README.md └── src │ ├── context.rs │ ├── context │ ├── kv_cache.rs │ ├── params.rs │ └── session.rs │ ├── grammar │ ├── arithmetic.gbnf │ ├── c.gbnf │ ├── chess.gbnf │ ├── japanese.gbnf │ ├── json.gbnf │ ├── json_arr.gbnf │ ├── list.gbnf │ └── tests.rs │ ├── lib.rs │ ├── llama_backend.rs │ ├── llama_batch.rs │ ├── log.rs │ ├── model.rs │ ├── model │ ├── params.rs │ └── params │ │ └── kv_overrides.rs │ ├── mtmd.rs │ ├── sampling.rs │ ├── timing.rs │ ├── token.rs │ ├── token │ ├── data.rs │ ├── data_array.rs │ └── logit_bias.rs │ └── token_type.rs ├── llama-cpp-sys-2 ├── Cargo.lock ├── Cargo.toml ├── README.md ├── build.rs ├── src │ └── lib.rs ├── wrapper.h └── wrapper_mtmd.h └── test-build.Dockerfile /.dockerignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/.dockerignore -------------------------------------------------------------------------------- /.github/dependabot.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/.github/dependabot.yml -------------------------------------------------------------------------------- /.github/workflows/llama-cpp-rs-check.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/.github/workflows/llama-cpp-rs-check.yml -------------------------------------------------------------------------------- /.github/workflows/publish-upon-release.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/.github/workflows/publish-upon-release.yml -------------------------------------------------------------------------------- /.github/workflows/update-llama-cpp.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/.github/workflows/update-llama-cpp.yml -------------------------------------------------------------------------------- /.github/workflows/update-toml-version.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/.github/workflows/update-toml-version.yaml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/.gitignore -------------------------------------------------------------------------------- /.gitmodules: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/.gitmodules -------------------------------------------------------------------------------- /Cargo.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/Cargo.lock -------------------------------------------------------------------------------- /Cargo.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/Cargo.toml -------------------------------------------------------------------------------- /LICENSE-APACHE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/LICENSE-APACHE -------------------------------------------------------------------------------- /LICENSE-MIT: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/LICENSE-MIT -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/README.md -------------------------------------------------------------------------------- /examples/embeddings/Cargo.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/examples/embeddings/Cargo.toml -------------------------------------------------------------------------------- /examples/embeddings/src/main.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/examples/embeddings/src/main.rs -------------------------------------------------------------------------------- /examples/mtmd/Cargo.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/examples/mtmd/Cargo.toml -------------------------------------------------------------------------------- /examples/mtmd/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/examples/mtmd/README.md -------------------------------------------------------------------------------- /examples/mtmd/src/mtmd.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/examples/mtmd/src/mtmd.rs -------------------------------------------------------------------------------- /examples/reranker/Cargo.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/examples/reranker/Cargo.toml -------------------------------------------------------------------------------- /examples/reranker/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/examples/reranker/README.md -------------------------------------------------------------------------------- /examples/reranker/src/main.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/examples/reranker/src/main.rs -------------------------------------------------------------------------------- /examples/simple/Cargo.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/examples/simple/Cargo.toml -------------------------------------------------------------------------------- /examples/simple/src/main.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/examples/simple/src/main.rs -------------------------------------------------------------------------------- /examples/usage.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/examples/usage.rs -------------------------------------------------------------------------------- /llama-cpp-2/Cargo.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/Cargo.toml -------------------------------------------------------------------------------- /llama-cpp-2/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/README.md -------------------------------------------------------------------------------- /llama-cpp-2/src/context.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/context.rs -------------------------------------------------------------------------------- /llama-cpp-2/src/context/kv_cache.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/context/kv_cache.rs -------------------------------------------------------------------------------- /llama-cpp-2/src/context/params.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/context/params.rs -------------------------------------------------------------------------------- /llama-cpp-2/src/context/session.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/context/session.rs -------------------------------------------------------------------------------- /llama-cpp-2/src/grammar/arithmetic.gbnf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/grammar/arithmetic.gbnf -------------------------------------------------------------------------------- /llama-cpp-2/src/grammar/c.gbnf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/grammar/c.gbnf -------------------------------------------------------------------------------- /llama-cpp-2/src/grammar/chess.gbnf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/grammar/chess.gbnf -------------------------------------------------------------------------------- /llama-cpp-2/src/grammar/japanese.gbnf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/grammar/japanese.gbnf -------------------------------------------------------------------------------- /llama-cpp-2/src/grammar/json.gbnf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/grammar/json.gbnf -------------------------------------------------------------------------------- /llama-cpp-2/src/grammar/json_arr.gbnf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/grammar/json_arr.gbnf -------------------------------------------------------------------------------- /llama-cpp-2/src/grammar/list.gbnf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/grammar/list.gbnf -------------------------------------------------------------------------------- /llama-cpp-2/src/grammar/tests.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/grammar/tests.rs -------------------------------------------------------------------------------- /llama-cpp-2/src/lib.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/lib.rs -------------------------------------------------------------------------------- /llama-cpp-2/src/llama_backend.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/llama_backend.rs -------------------------------------------------------------------------------- /llama-cpp-2/src/llama_batch.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/llama_batch.rs -------------------------------------------------------------------------------- /llama-cpp-2/src/log.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/log.rs -------------------------------------------------------------------------------- /llama-cpp-2/src/model.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/model.rs -------------------------------------------------------------------------------- /llama-cpp-2/src/model/params.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/model/params.rs -------------------------------------------------------------------------------- /llama-cpp-2/src/model/params/kv_overrides.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/model/params/kv_overrides.rs -------------------------------------------------------------------------------- /llama-cpp-2/src/mtmd.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/mtmd.rs -------------------------------------------------------------------------------- /llama-cpp-2/src/sampling.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/sampling.rs -------------------------------------------------------------------------------- /llama-cpp-2/src/timing.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/timing.rs -------------------------------------------------------------------------------- /llama-cpp-2/src/token.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/token.rs -------------------------------------------------------------------------------- /llama-cpp-2/src/token/data.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/token/data.rs -------------------------------------------------------------------------------- /llama-cpp-2/src/token/data_array.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/token/data_array.rs -------------------------------------------------------------------------------- /llama-cpp-2/src/token/logit_bias.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/token/logit_bias.rs -------------------------------------------------------------------------------- /llama-cpp-2/src/token_type.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-2/src/token_type.rs -------------------------------------------------------------------------------- /llama-cpp-sys-2/Cargo.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-sys-2/Cargo.lock -------------------------------------------------------------------------------- /llama-cpp-sys-2/Cargo.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-sys-2/Cargo.toml -------------------------------------------------------------------------------- /llama-cpp-sys-2/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-sys-2/README.md -------------------------------------------------------------------------------- /llama-cpp-sys-2/build.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-sys-2/build.rs -------------------------------------------------------------------------------- /llama-cpp-sys-2/src/lib.rs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-sys-2/src/lib.rs -------------------------------------------------------------------------------- /llama-cpp-sys-2/wrapper.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-sys-2/wrapper.h -------------------------------------------------------------------------------- /llama-cpp-sys-2/wrapper_mtmd.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/llama-cpp-sys-2/wrapper_mtmd.h -------------------------------------------------------------------------------- /test-build.Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/utilityai/llama-cpp-rs/HEAD/test-build.Dockerfile --------------------------------------------------------------------------------