├── .clang-tidy ├── .devops ├── cloud-v-pipeline ├── full-cuda.Dockerfile ├── full-rocm.Dockerfile ├── full.Dockerfile ├── llama-cli-cann.Dockerfile ├── llama-cli-cuda.Dockerfile ├── llama-cli-intel.Dockerfile ├── llama-cli-rocm.Dockerfile ├── llama-cli-vulkan.Dockerfile ├── llama-cli.Dockerfile ├── llama-cpp-cuda.srpm.spec ├── llama-cpp.srpm.spec ├── llama-server-cuda.Dockerfile ├── llama-server-intel.Dockerfile ├── llama-server-rocm.Dockerfile ├── llama-server-vulkan.Dockerfile ├── llama-server.Dockerfile ├── nix │ ├── apps.nix │ ├── devshells.nix │ ├── docker.nix │ ├── jetson-support.nix │ ├── nixpkgs-instances.nix │ ├── package-gguf-py.nix │ ├── package.nix │ ├── python-scripts.nix │ ├── scope.nix │ └── sif.nix └── tools.sh ├── .dockerignore ├── .ecrc ├── .editorconfig ├── .flake8 ├── .github ├── ISSUE_TEMPLATE │ ├── 01-bug-low.yml │ ├── 02-bug-medium.yml │ ├── 03-bug-high.yml │ ├── 04-bug-critical.yml │ ├── 05-enhancement.yml │ ├── 06-research.yml │ ├── 07-refactor.yml │ └── config.yml ├── labeler.yml ├── pull_request_template.md └── workflows │ ├── bench.yml.disabled │ ├── build.yml │ ├── close-issue.yml │ ├── docker.yml │ ├── editorconfig.yml │ ├── gguf-publish.yml │ ├── labeler.yml │ ├── nix-ci-aarch64.yml │ ├── nix-ci.yml │ ├── nix-flake-update.yml │ ├── nix-publish-flake.yml │ ├── python-check-requirements.yml │ ├── python-lint.yml │ ├── python-type-check.yml │ └── server.yml ├── .gitignore ├── .gitmodules ├── .pre-commit-config.yaml ├── AUTHORS ├── CMakeLists.txt ├── CMakePresets.json ├── CONTRIBUTING.md ├── LICENSE ├── Makefile ├── Package.swift ├── README.md ├── ci ├── README.md └── run.sh ├── cmake ├── arm64-windows-llvm.cmake ├── arm64-windows-msvc.cmake ├── build-info.cmake ├── git-vars.cmake ├── llama-config.cmake.in └── llama.pc.in ├── common ├── CMakeLists.txt ├── arg.cpp ├── arg.h ├── base64.hpp ├── build-info.cpp.in ├── cmake │ └── build-info-gen-cpp.cmake ├── common.cpp ├── common.h ├── console.cpp ├── console.h ├── json-schema-to-grammar.cpp ├── json-schema-to-grammar.h ├── json.hpp ├── log.cpp ├── log.h ├── ngram-cache.cpp ├── ngram-cache.h ├── sampling.cpp ├── sampling.h ├── stb_image.h ├── train.cpp └── train.h ├── convert_hf_to_gguf.py ├── convert_hf_to_gguf_update.py ├── convert_llama_ggml_to_gguf.py ├── convert_lora_to_gguf.py ├── docs ├── android.md ├── backend │ ├── BLIS.md │ ├── CANN.md │ └── SYCL.md ├── build.md ├── development │ ├── HOWTO-add-model.md │ ├── debugging-tests.md │ ├── llama-star │ │ ├── idea-arch.key │ │ └── idea-arch.pdf │ └── token_generation_performance_tips.md ├── docker.md └── install.md ├── flake.lock ├── flake.nix ├── ggml ├── .gitignore ├── CMakeLists.txt ├── cmake │ └── FindSIMD.cmake ├── include │ ├── ggml-alloc.h │ ├── ggml-backend.h │ ├── ggml-blas.h │ ├── ggml-cann.h │ ├── ggml-cuda.h │ ├── ggml-kompute.h │ ├── ggml-metal.h │ ├── ggml-rpc.h │ ├── ggml-sycl.h │ ├── ggml-vulkan.h │ └── ggml.h └── src │ ├── CMakeLists.txt │ ├── ggml-aarch64.c │ ├── ggml-aarch64.h │ ├── ggml-alloc.c │ ├── ggml-backend-impl.h │ ├── ggml-backend.cpp │ ├── ggml-blas.cpp │ ├── ggml-cann.cpp │ ├── ggml-cann │ ├── .clang-format │ ├── Doxyfile │ ├── acl_tensor.cpp │ ├── acl_tensor.h │ ├── aclnn_ops.cpp │ ├── aclnn_ops.h │ ├── common.h │ └── kernels │ │ ├── CMakeLists.txt │ │ ├── ascendc_kernels.h │ │ ├── dup.cpp │ │ ├── get_row_f16.cpp │ │ ├── get_row_f32.cpp │ │ ├── get_row_q4_0.cpp │ │ ├── get_row_q8_0.cpp │ │ ├── quantize_f16_q8_0.cpp │ │ ├── quantize_f32_q8_0.cpp │ │ └── quantize_float_to_q4_0.cpp │ ├── ggml-common.h │ ├── ggml-cpu-impl.h │ ├── ggml-cuda.cu │ ├── ggml-cuda │ ├── acc.cu │ ├── acc.cuh │ ├── arange.cu │ ├── arange.cuh │ ├── argmax.cu │ ├── argmax.cuh │ ├── argsort.cu │ ├── argsort.cuh │ ├── binbcast.cu │ ├── binbcast.cuh │ ├── clamp.cu │ ├── clamp.cuh │ ├── common.cuh │ ├── concat.cu │ ├── concat.cuh │ ├── conv-transpose-1d.cu │ ├── conv-transpose-1d.cuh │ ├── convert.cu │ ├── convert.cuh │ ├── count-equal.cu │ ├── count-equal.cuh │ ├── cpy.cu │ ├── cpy.cuh │ ├── cross-entropy-loss.cu │ ├── cross-entropy-loss.cuh │ ├── dequantize.cuh │ ├── diagmask.cu │ ├── diagmask.cuh │ ├── dmmv.cu │ ├── dmmv.cuh │ ├── fattn-common.cuh │ ├── fattn-tile-f16.cu │ ├── fattn-tile-f16.cuh │ ├── fattn-tile-f32.cu │ ├── fattn-tile-f32.cuh │ ├── fattn-vec-f16.cuh │ ├── fattn-vec-f32.cuh │ ├── fattn-wmma-f16.cuh │ ├── fattn.cu │ ├── fattn.cuh │ ├── getrows.cu │ ├── getrows.cuh │ ├── im2col.cu │ ├── im2col.cuh │ ├── mma.cuh │ ├── mmq.cu │ ├── mmq.cuh │ ├── mmvq.cu │ ├── mmvq.cuh │ ├── norm.cu │ ├── norm.cuh │ ├── opt-step-adamw.cu │ ├── opt-step-adamw.cuh │ ├── out-prod.cu │ ├── out-prod.cuh │ ├── pad.cu │ ├── pad.cuh │ ├── pool2d.cu │ ├── pool2d.cuh │ ├── quantize.cu │ ├── quantize.cuh │ ├── rope.cu │ ├── rope.cuh │ ├── rwkv-wkv.cu │ ├── rwkv-wkv.cuh │ ├── scale.cu │ ├── scale.cuh │ ├── softmax.cu │ ├── softmax.cuh │ ├── sum.cu │ ├── sum.cuh │ ├── sumrows.cu │ ├── sumrows.cuh │ ├── template-instances │ │ ├── fattn-vec-f16-instance-hs128-f16-f16.cu │ │ ├── fattn-vec-f16-instance-hs128-f16-q4_0.cu │ │ ├── fattn-vec-f16-instance-hs128-f16-q4_1.cu │ │ ├── fattn-vec-f16-instance-hs128-f16-q5_0.cu │ │ ├── fattn-vec-f16-instance-hs128-f16-q5_1.cu │ │ ├── fattn-vec-f16-instance-hs128-f16-q8_0.cu │ │ ├── fattn-vec-f16-instance-hs128-q4_0-f16.cu │ │ ├── fattn-vec-f16-instance-hs128-q4_0-q4_0.cu │ │ ├── fattn-vec-f16-instance-hs128-q4_0-q4_1.cu │ │ ├── fattn-vec-f16-instance-hs128-q4_0-q5_0.cu │ │ ├── fattn-vec-f16-instance-hs128-q4_0-q5_1.cu │ │ ├── fattn-vec-f16-instance-hs128-q4_0-q8_0.cu │ │ ├── fattn-vec-f16-instance-hs128-q4_1-f16.cu │ │ ├── fattn-vec-f16-instance-hs128-q4_1-q4_0.cu │ │ ├── fattn-vec-f16-instance-hs128-q4_1-q4_1.cu │ │ ├── fattn-vec-f16-instance-hs128-q4_1-q5_0.cu │ │ ├── fattn-vec-f16-instance-hs128-q4_1-q5_1.cu │ │ ├── fattn-vec-f16-instance-hs128-q4_1-q8_0.cu │ │ ├── fattn-vec-f16-instance-hs128-q5_0-f16.cu │ │ ├── fattn-vec-f16-instance-hs128-q5_0-q4_0.cu │ │ ├── fattn-vec-f16-instance-hs128-q5_0-q4_1.cu │ │ ├── fattn-vec-f16-instance-hs128-q5_0-q5_0.cu │ │ ├── fattn-vec-f16-instance-hs128-q5_0-q5_1.cu │ │ ├── fattn-vec-f16-instance-hs128-q5_0-q8_0.cu │ │ ├── fattn-vec-f16-instance-hs128-q5_1-f16.cu │ │ ├── fattn-vec-f16-instance-hs128-q5_1-q4_0.cu │ │ ├── fattn-vec-f16-instance-hs128-q5_1-q4_1.cu │ │ ├── fattn-vec-f16-instance-hs128-q5_1-q5_0.cu │ │ ├── fattn-vec-f16-instance-hs128-q5_1-q5_1.cu │ │ ├── fattn-vec-f16-instance-hs128-q5_1-q8_0.cu │ │ ├── fattn-vec-f16-instance-hs128-q8_0-f16.cu │ │ ├── fattn-vec-f16-instance-hs128-q8_0-q4_0.cu │ │ ├── fattn-vec-f16-instance-hs128-q8_0-q4_1.cu │ │ ├── fattn-vec-f16-instance-hs128-q8_0-q5_0.cu │ │ ├── fattn-vec-f16-instance-hs128-q8_0-q5_1.cu │ │ ├── fattn-vec-f16-instance-hs128-q8_0-q8_0.cu │ │ ├── fattn-vec-f16-instance-hs256-f16-f16.cu │ │ ├── fattn-vec-f16-instance-hs64-f16-f16.cu │ │ ├── fattn-vec-f16-instance-hs64-f16-q4_0.cu │ │ ├── fattn-vec-f16-instance-hs64-f16-q4_1.cu │ │ ├── fattn-vec-f16-instance-hs64-f16-q5_0.cu │ │ ├── fattn-vec-f16-instance-hs64-f16-q5_1.cu │ │ ├── fattn-vec-f16-instance-hs64-f16-q8_0.cu │ │ ├── fattn-vec-f32-instance-hs128-f16-f16.cu │ │ ├── fattn-vec-f32-instance-hs128-f16-q4_0.cu │ │ ├── fattn-vec-f32-instance-hs128-f16-q4_1.cu │ │ ├── fattn-vec-f32-instance-hs128-f16-q5_0.cu │ │ ├── fattn-vec-f32-instance-hs128-f16-q5_1.cu │ │ ├── fattn-vec-f32-instance-hs128-f16-q8_0.cu │ │ ├── fattn-vec-f32-instance-hs128-q4_0-f16.cu │ │ ├── fattn-vec-f32-instance-hs128-q4_0-q4_0.cu │ │ ├── fattn-vec-f32-instance-hs128-q4_0-q4_1.cu │ │ ├── fattn-vec-f32-instance-hs128-q4_0-q5_0.cu │ │ ├── fattn-vec-f32-instance-hs128-q4_0-q5_1.cu │ │ ├── fattn-vec-f32-instance-hs128-q4_0-q8_0.cu │ │ ├── fattn-vec-f32-instance-hs128-q4_1-f16.cu │ │ ├── fattn-vec-f32-instance-hs128-q4_1-q4_0.cu │ │ ├── fattn-vec-f32-instance-hs128-q4_1-q4_1.cu │ │ ├── fattn-vec-f32-instance-hs128-q4_1-q5_0.cu │ │ ├── fattn-vec-f32-instance-hs128-q4_1-q5_1.cu │ │ ├── fattn-vec-f32-instance-hs128-q4_1-q8_0.cu │ │ ├── fattn-vec-f32-instance-hs128-q5_0-f16.cu │ │ ├── fattn-vec-f32-instance-hs128-q5_0-q4_0.cu │ │ ├── fattn-vec-f32-instance-hs128-q5_0-q4_1.cu │ │ ├── fattn-vec-f32-instance-hs128-q5_0-q5_0.cu │ │ ├── fattn-vec-f32-instance-hs128-q5_0-q5_1.cu │ │ ├── fattn-vec-f32-instance-hs128-q5_0-q8_0.cu │ │ ├── fattn-vec-f32-instance-hs128-q5_1-f16.cu │ │ ├── fattn-vec-f32-instance-hs128-q5_1-q4_0.cu │ │ ├── fattn-vec-f32-instance-hs128-q5_1-q4_1.cu │ │ ├── fattn-vec-f32-instance-hs128-q5_1-q5_0.cu │ │ ├── fattn-vec-f32-instance-hs128-q5_1-q5_1.cu │ │ ├── fattn-vec-f32-instance-hs128-q5_1-q8_0.cu │ │ ├── fattn-vec-f32-instance-hs128-q8_0-f16.cu │ │ ├── fattn-vec-f32-instance-hs128-q8_0-q4_0.cu │ │ ├── fattn-vec-f32-instance-hs128-q8_0-q4_1.cu │ │ ├── fattn-vec-f32-instance-hs128-q8_0-q5_0.cu │ │ ├── fattn-vec-f32-instance-hs128-q8_0-q5_1.cu │ │ ├── fattn-vec-f32-instance-hs128-q8_0-q8_0.cu │ │ ├── fattn-vec-f32-instance-hs256-f16-f16.cu │ │ ├── fattn-vec-f32-instance-hs64-f16-f16.cu │ │ ├── fattn-vec-f32-instance-hs64-f16-q4_0.cu │ │ ├── fattn-vec-f32-instance-hs64-f16-q4_1.cu │ │ ├── fattn-vec-f32-instance-hs64-f16-q5_0.cu │ │ ├── fattn-vec-f32-instance-hs64-f16-q5_1.cu │ │ ├── fattn-vec-f32-instance-hs64-f16-q8_0.cu │ │ ├── fattn-wmma-f16-instance-kqfloat-cpb16.cu │ │ ├── fattn-wmma-f16-instance-kqfloat-cpb32.cu │ │ ├── fattn-wmma-f16-instance-kqhalf-cpb16.cu │ │ ├── fattn-wmma-f16-instance-kqhalf-cpb32.cu │ │ ├── fattn-wmma-f16-instance-kqhalf-cpb8.cu │ │ ├── generate_cu_files.py │ │ ├── mmq-instance-iq1_s.cu │ │ ├── mmq-instance-iq2_s.cu │ │ ├── mmq-instance-iq2_xs.cu │ │ ├── mmq-instance-iq2_xxs.cu │ │ ├── mmq-instance-iq3_s.cu │ │ ├── mmq-instance-iq3_xxs.cu │ │ ├── mmq-instance-iq4_nl.cu │ │ ├── mmq-instance-iq4_xs.cu │ │ ├── mmq-instance-q2_k.cu │ │ ├── mmq-instance-q3_k.cu │ │ ├── mmq-instance-q4_0.cu │ │ ├── mmq-instance-q4_1.cu │ │ ├── mmq-instance-q4_k.cu │ │ ├── mmq-instance-q5_0.cu │ │ ├── mmq-instance-q5_1.cu │ │ ├── mmq-instance-q5_k.cu │ │ ├── mmq-instance-q6_k.cu │ │ └── mmq-instance-q8_0.cu │ ├── tsembd.cu │ ├── tsembd.cuh │ ├── unary.cu │ ├── unary.cuh │ ├── upscale.cu │ ├── upscale.cuh │ ├── vecdotq.cuh │ └── vendors │ │ ├── cuda.h │ │ ├── hip.h │ │ └── musa.h │ ├── ggml-impl.h │ ├── ggml-kompute.cpp │ ├── ggml-metal.m │ ├── ggml-metal.metal │ ├── ggml-quants.c │ ├── ggml-quants.h │ ├── ggml-rpc.cpp │ ├── ggml-sycl.cpp │ ├── ggml-sycl │ ├── backend.hpp │ ├── common.cpp │ ├── common.hpp │ ├── concat.cpp │ ├── concat.hpp │ ├── conv.cpp │ ├── conv.hpp │ ├── convert.cpp │ ├── convert.hpp │ ├── dequantize.hpp │ ├── dmmv.cpp │ ├── dmmv.hpp │ ├── dpct │ │ └── helper.hpp │ ├── gemm.hpp │ ├── im2col.cpp │ ├── im2col.hpp │ ├── mmq.cpp │ ├── mmq.hpp │ ├── mmvq.cpp │ ├── mmvq.hpp │ ├── norm.cpp │ ├── norm.hpp │ ├── presets.hpp │ ├── rope.cpp │ ├── rope.hpp │ ├── softmax.cpp │ ├── softmax.hpp │ ├── tsembd.cpp │ ├── tsembd.hpp │ └── vecdotq.hpp │ ├── ggml-vulkan.cpp │ ├── ggml.c │ ├── kompute-shaders │ ├── common.comp │ ├── op_add.comp │ ├── op_addrow.comp │ ├── op_cpy_f16_f16.comp │ ├── op_cpy_f16_f32.comp │ ├── op_cpy_f32_f16.comp │ ├── op_cpy_f32_f32.comp │ ├── op_diagmask.comp │ ├── op_gelu.comp │ ├── op_getrows.comp │ ├── op_getrows_f16.comp │ ├── op_getrows_f32.comp │ ├── op_getrows_q4_0.comp │ ├── op_getrows_q4_1.comp │ ├── op_getrows_q6_k.comp │ ├── op_mul.comp │ ├── op_mul_mat_f16.comp │ ├── op_mul_mat_mat_f32.comp │ ├── op_mul_mat_q4_0.comp │ ├── op_mul_mat_q4_1.comp │ ├── op_mul_mat_q6_k.comp │ ├── op_mul_mat_q8_0.comp │ ├── op_mul_mv_q_n.comp │ ├── op_mul_mv_q_n_pre.comp │ ├── op_norm.comp │ ├── op_relu.comp │ ├── op_rmsnorm.comp │ ├── op_rope_f16.comp │ ├── op_rope_f32.comp │ ├── op_scale.comp │ ├── op_scale_8.comp │ ├── op_silu.comp │ ├── op_softmax.comp │ └── rope_common.comp │ ├── llamafile │ ├── sgemm.cpp │ └── sgemm.h │ └── vulkan-shaders │ ├── CMakeLists.txt │ ├── acc.comp │ ├── add.comp │ ├── argsort.comp │ ├── clamp.comp │ ├── concat.comp │ ├── copy.comp │ ├── cos.comp │ ├── dequant_f32.comp │ ├── dequant_funcs.comp │ ├── dequant_head.comp │ ├── dequant_iq4_nl.comp │ ├── dequant_q2_k.comp │ ├── dequant_q3_k.comp │ ├── dequant_q4_0.comp │ ├── dequant_q4_1.comp │ ├── dequant_q4_k.comp │ ├── dequant_q5_0.comp │ ├── dequant_q5_1.comp │ ├── dequant_q5_k.comp │ ├── dequant_q6_k.comp │ ├── dequant_q8_0.comp │ ├── diag_mask_inf.comp │ ├── div.comp │ ├── gelu.comp │ ├── gelu_quick.comp │ ├── generic_binary_head.comp │ ├── generic_head.comp │ ├── generic_unary_head.comp │ ├── get_rows.comp │ ├── get_rows_quant.comp │ ├── group_norm.comp │ ├── im2col.comp │ ├── leaky_relu.comp │ ├── mul.comp │ ├── mul_mat_split_k_reduce.comp │ ├── mul_mat_vec.comp │ ├── mul_mat_vec_base.comp │ ├── mul_mat_vec_nc.comp │ ├── mul_mat_vec_p021.comp │ ├── mul_mat_vec_q2_k.comp │ ├── mul_mat_vec_q3_k.comp │ ├── mul_mat_vec_q4_k.comp │ ├── mul_mat_vec_q5_k.comp │ ├── mul_mat_vec_q6_k.comp │ ├── mul_mm.comp │ ├── norm.comp │ ├── pad.comp │ ├── relu.comp │ ├── repeat.comp │ ├── rms_norm.comp │ ├── rope_head.comp │ ├── rope_neox.comp │ ├── rope_norm.comp │ ├── scale.comp │ ├── silu.comp │ ├── sin.comp │ ├── soft_max.comp │ ├── square.comp │ ├── sum_rows.comp │ ├── tanh.comp │ ├── timestep_embedding.comp │ ├── types.comp │ ├── upscale.comp │ └── vulkan-shaders-gen.cpp ├── gguf-py ├── LICENSE ├── README.md ├── examples │ ├── reader.py │ └── writer.py ├── gguf │ ├── __init__.py │ ├── constants.py │ ├── gguf.py │ ├── gguf_reader.py │ ├── gguf_writer.py │ ├── lazy.py │ ├── metadata.py │ ├── py.typed │ ├── quants.py │ ├── tensor_mapping.py │ ├── utility.py │ └── vocab.py ├── pyproject.toml ├── scripts │ ├── __init__.py │ ├── gguf_convert_endian.py │ ├── gguf_dump.py │ ├── gguf_hash.py │ ├── gguf_new_metadata.py │ └── gguf_set_metadata.py └── tests │ ├── __init__.py │ ├── test_metadata.py │ └── test_quants.py ├── grammars ├── README.md ├── arithmetic.gbnf ├── c.gbnf ├── chess.gbnf ├── japanese.gbnf ├── json.gbnf ├── json_arr.gbnf └── list.gbnf ├── include └── llama.h ├── lac.cpp ├── lang-cli-src ├── config.cpp ├── config.h ├── console_manager.cpp ├── console_manager.h ├── file_manager.cpp ├── file_manager.h ├── model_manager.cpp ├── model_manager.h ├── output_parser.cpp ├── output_parser.h ├── shell_executor.cpp ├── shell_executor.h ├── str_parser.cpp └── str_parser.h ├── media ├── llama-leader.jpeg ├── llama0-banner.png ├── llama0-logo.png ├── llama1-banner.png ├── llama1-logo.png ├── matmul.png └── matmul.svg ├── models ├── .editorconfig ├── ggml-vocab-aquila.gguf ├── ggml-vocab-baichuan.gguf ├── ggml-vocab-bert-bge.gguf ├── ggml-vocab-bert-bge.gguf.inp ├── ggml-vocab-bert-bge.gguf.out ├── ggml-vocab-chameleon.gguf.inp ├── ggml-vocab-chameleon.gguf.out ├── ggml-vocab-command-r.gguf ├── ggml-vocab-command-r.gguf.inp ├── ggml-vocab-command-r.gguf.out ├── ggml-vocab-deepseek-coder.gguf ├── ggml-vocab-deepseek-coder.gguf.inp ├── ggml-vocab-deepseek-coder.gguf.out ├── ggml-vocab-deepseek-llm.gguf ├── ggml-vocab-deepseek-llm.gguf.inp ├── ggml-vocab-deepseek-llm.gguf.out ├── ggml-vocab-falcon.gguf ├── ggml-vocab-falcon.gguf.inp ├── ggml-vocab-falcon.gguf.out ├── ggml-vocab-gpt-2.gguf ├── ggml-vocab-gpt-2.gguf.inp ├── ggml-vocab-gpt-2.gguf.out ├── ggml-vocab-gpt-neox.gguf ├── ggml-vocab-llama-bpe.gguf ├── ggml-vocab-llama-bpe.gguf.inp ├── ggml-vocab-llama-bpe.gguf.out ├── ggml-vocab-llama-spm.gguf ├── ggml-vocab-llama-spm.gguf.inp ├── ggml-vocab-llama-spm.gguf.out ├── ggml-vocab-mpt.gguf ├── ggml-vocab-mpt.gguf.inp ├── ggml-vocab-mpt.gguf.out ├── ggml-vocab-phi-3.gguf ├── ggml-vocab-phi-3.gguf.inp ├── ggml-vocab-phi-3.gguf.out ├── ggml-vocab-qwen2.gguf ├── ggml-vocab-qwen2.gguf.inp ├── ggml-vocab-qwen2.gguf.out ├── ggml-vocab-refact.gguf ├── ggml-vocab-refact.gguf.inp ├── ggml-vocab-refact.gguf.out ├── ggml-vocab-starcoder.gguf ├── ggml-vocab-starcoder.gguf.inp └── ggml-vocab-starcoder.gguf.out ├── mypy.ini ├── output.gif ├── pocs ├── CMakeLists.txt └── vdot │ ├── CMakeLists.txt │ ├── q8dot.cpp │ └── vdot.cpp ├── poetry.lock ├── prompts ├── LLM-questions.txt ├── alpaca.txt ├── assistant.txt ├── chat-with-baichuan.txt ├── chat-with-bob.txt ├── chat-with-qwen.txt ├── chat-with-vicuna-v0.txt ├── chat-with-vicuna-v1.txt ├── chat.txt ├── dan-modified.txt ├── dan.txt ├── mnemonics.txt ├── parallel-questions.txt └── reason-act.txt ├── pyproject.toml ├── pyrightconfig.json ├── requirements.txt ├── requirements ├── requirements-all.txt ├── requirements-compare-llama-bench.txt ├── requirements-convert_hf_to_gguf.txt ├── requirements-convert_hf_to_gguf_update.txt ├── requirements-convert_legacy_llama.txt ├── requirements-convert_llama_ggml_to_gguf.txt ├── requirements-convert_lora_to_gguf.txt ├── requirements-pydantic.txt └── requirements-test-tokenizer-random.txt ├── scripts ├── build-info.sh ├── check-requirements.sh ├── ci-run.sh ├── compare-commits.sh ├── compare-llama-bench.py ├── debug-test.sh ├── gen-authors.sh ├── gen-unicode-data.py ├── get-flags.mk ├── get-hellaswag.sh ├── get-pg.sh ├── get-wikitext-103.sh ├── get-wikitext-2.sh ├── get-winogrande.sh ├── hf.sh ├── install-oneapi.bat ├── pod-llama.sh ├── qnt-all.sh ├── run-all-perf.sh ├── run-all-ppl.sh ├── run-with-preset.py ├── server-llm.sh ├── sync-ggml-am.sh ├── sync-ggml.last ├── sync-ggml.sh ├── verify-checksum-models.py └── xxd.cmake ├── spm-headers ├── ggml-alloc.h ├── ggml-backend.h ├── ggml-metal.h ├── ggml.h └── llama.h ├── src ├── CMakeLists.txt ├── llama-grammar.cpp ├── llama-grammar.h ├── llama-impl.h ├── llama-sampling.cpp ├── llama-sampling.h ├── llama-vocab.cpp ├── llama-vocab.h ├── llama.cpp ├── unicode-data.cpp ├── unicode-data.h ├── unicode.cpp └── unicode.h └── tests ├── .gitignore ├── CMakeLists.txt ├── get-model.cpp ├── get-model.h ├── run-json-schema-to-grammar.mjs ├── test-arg-parser.cpp ├── test-autorelease.cpp ├── test-backend-ops.cpp ├── test-barrier.cpp ├── test-c.c ├── test-chat-template.cpp ├── test-double-float.cpp ├── test-grad0.cpp ├── test-grammar-integration.cpp ├── test-grammar-parser.cpp ├── test-json-schema-to-grammar.cpp ├── test-llama-grammar.cpp ├── test-log.cpp ├── test-lora-conversion-inference.sh ├── test-model-load-cancel.cpp ├── test-opt.cpp ├── test-quantize-fns.cpp ├── test-quantize-perf.cpp ├── test-rope.cpp ├── test-sampling.cpp ├── test-tokenizer-0.cpp ├── test-tokenizer-0.py ├── test-tokenizer-0.sh ├── test-tokenizer-1-bpe.cpp ├── test-tokenizer-1-spm.cpp └── test-tokenizer-random.py /.clang-tidy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.clang-tidy -------------------------------------------------------------------------------- /.devops/cloud-v-pipeline: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/cloud-v-pipeline -------------------------------------------------------------------------------- /.devops/full-cuda.Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/full-cuda.Dockerfile -------------------------------------------------------------------------------- /.devops/full-rocm.Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/full-rocm.Dockerfile -------------------------------------------------------------------------------- /.devops/full.Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/full.Dockerfile -------------------------------------------------------------------------------- /.devops/llama-cli-cann.Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/llama-cli-cann.Dockerfile -------------------------------------------------------------------------------- /.devops/llama-cli-cuda.Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/llama-cli-cuda.Dockerfile -------------------------------------------------------------------------------- /.devops/llama-cli-intel.Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/llama-cli-intel.Dockerfile -------------------------------------------------------------------------------- /.devops/llama-cli-rocm.Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/llama-cli-rocm.Dockerfile -------------------------------------------------------------------------------- /.devops/llama-cli-vulkan.Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/llama-cli-vulkan.Dockerfile -------------------------------------------------------------------------------- /.devops/llama-cli.Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/llama-cli.Dockerfile -------------------------------------------------------------------------------- /.devops/llama-cpp-cuda.srpm.spec: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/llama-cpp-cuda.srpm.spec -------------------------------------------------------------------------------- /.devops/llama-cpp.srpm.spec: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/llama-cpp.srpm.spec -------------------------------------------------------------------------------- /.devops/llama-server-cuda.Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/llama-server-cuda.Dockerfile -------------------------------------------------------------------------------- /.devops/llama-server-intel.Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/llama-server-intel.Dockerfile -------------------------------------------------------------------------------- /.devops/llama-server-rocm.Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/llama-server-rocm.Dockerfile -------------------------------------------------------------------------------- /.devops/llama-server-vulkan.Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/llama-server-vulkan.Dockerfile -------------------------------------------------------------------------------- /.devops/llama-server.Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/llama-server.Dockerfile -------------------------------------------------------------------------------- /.devops/nix/apps.nix: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/nix/apps.nix -------------------------------------------------------------------------------- /.devops/nix/devshells.nix: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/nix/devshells.nix -------------------------------------------------------------------------------- /.devops/nix/docker.nix: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/nix/docker.nix -------------------------------------------------------------------------------- /.devops/nix/jetson-support.nix: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/nix/jetson-support.nix -------------------------------------------------------------------------------- /.devops/nix/nixpkgs-instances.nix: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/nix/nixpkgs-instances.nix -------------------------------------------------------------------------------- /.devops/nix/package-gguf-py.nix: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/nix/package-gguf-py.nix -------------------------------------------------------------------------------- /.devops/nix/package.nix: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/nix/package.nix -------------------------------------------------------------------------------- /.devops/nix/python-scripts.nix: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/nix/python-scripts.nix -------------------------------------------------------------------------------- /.devops/nix/scope.nix: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/nix/scope.nix -------------------------------------------------------------------------------- /.devops/nix/sif.nix: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/nix/sif.nix -------------------------------------------------------------------------------- /.devops/tools.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.devops/tools.sh -------------------------------------------------------------------------------- /.dockerignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.dockerignore -------------------------------------------------------------------------------- /.ecrc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.ecrc -------------------------------------------------------------------------------- /.editorconfig: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.editorconfig -------------------------------------------------------------------------------- /.flake8: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.flake8 -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/01-bug-low.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/ISSUE_TEMPLATE/01-bug-low.yml -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/02-bug-medium.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/ISSUE_TEMPLATE/02-bug-medium.yml -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/03-bug-high.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/ISSUE_TEMPLATE/03-bug-high.yml -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/04-bug-critical.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/ISSUE_TEMPLATE/04-bug-critical.yml -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/05-enhancement.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/ISSUE_TEMPLATE/05-enhancement.yml -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/06-research.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/ISSUE_TEMPLATE/06-research.yml -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/07-refactor.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/ISSUE_TEMPLATE/07-refactor.yml -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/config.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/ISSUE_TEMPLATE/config.yml -------------------------------------------------------------------------------- /.github/labeler.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/labeler.yml -------------------------------------------------------------------------------- /.github/pull_request_template.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/pull_request_template.md -------------------------------------------------------------------------------- /.github/workflows/bench.yml.disabled: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/workflows/bench.yml.disabled -------------------------------------------------------------------------------- /.github/workflows/build.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/workflows/build.yml -------------------------------------------------------------------------------- /.github/workflows/close-issue.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/workflows/close-issue.yml -------------------------------------------------------------------------------- /.github/workflows/docker.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/workflows/docker.yml -------------------------------------------------------------------------------- /.github/workflows/editorconfig.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/workflows/editorconfig.yml -------------------------------------------------------------------------------- /.github/workflows/gguf-publish.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/workflows/gguf-publish.yml -------------------------------------------------------------------------------- /.github/workflows/labeler.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/workflows/labeler.yml -------------------------------------------------------------------------------- /.github/workflows/nix-ci-aarch64.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/workflows/nix-ci-aarch64.yml -------------------------------------------------------------------------------- /.github/workflows/nix-ci.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/workflows/nix-ci.yml -------------------------------------------------------------------------------- /.github/workflows/nix-flake-update.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/workflows/nix-flake-update.yml -------------------------------------------------------------------------------- /.github/workflows/nix-publish-flake.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/workflows/nix-publish-flake.yml -------------------------------------------------------------------------------- /.github/workflows/python-check-requirements.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/workflows/python-check-requirements.yml -------------------------------------------------------------------------------- /.github/workflows/python-lint.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/workflows/python-lint.yml -------------------------------------------------------------------------------- /.github/workflows/python-type-check.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/workflows/python-type-check.yml -------------------------------------------------------------------------------- /.github/workflows/server.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.github/workflows/server.yml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.gitignore -------------------------------------------------------------------------------- /.gitmodules: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.gitmodules -------------------------------------------------------------------------------- /.pre-commit-config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/.pre-commit-config.yaml -------------------------------------------------------------------------------- /AUTHORS: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/AUTHORS -------------------------------------------------------------------------------- /CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/CMakeLists.txt -------------------------------------------------------------------------------- /CMakePresets.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/CMakePresets.json -------------------------------------------------------------------------------- /CONTRIBUTING.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/CONTRIBUTING.md -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/LICENSE -------------------------------------------------------------------------------- /Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/Makefile -------------------------------------------------------------------------------- /Package.swift: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/Package.swift -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/README.md -------------------------------------------------------------------------------- /ci/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ci/README.md -------------------------------------------------------------------------------- /ci/run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ci/run.sh -------------------------------------------------------------------------------- /cmake/arm64-windows-llvm.cmake: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/cmake/arm64-windows-llvm.cmake -------------------------------------------------------------------------------- /cmake/arm64-windows-msvc.cmake: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/cmake/arm64-windows-msvc.cmake -------------------------------------------------------------------------------- /cmake/build-info.cmake: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/cmake/build-info.cmake -------------------------------------------------------------------------------- /cmake/git-vars.cmake: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/cmake/git-vars.cmake -------------------------------------------------------------------------------- /cmake/llama-config.cmake.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/cmake/llama-config.cmake.in -------------------------------------------------------------------------------- /cmake/llama.pc.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/cmake/llama.pc.in -------------------------------------------------------------------------------- /common/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/CMakeLists.txt -------------------------------------------------------------------------------- /common/arg.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/arg.cpp -------------------------------------------------------------------------------- /common/arg.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/arg.h -------------------------------------------------------------------------------- /common/base64.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/base64.hpp -------------------------------------------------------------------------------- /common/build-info.cpp.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/build-info.cpp.in -------------------------------------------------------------------------------- /common/cmake/build-info-gen-cpp.cmake: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/cmake/build-info-gen-cpp.cmake -------------------------------------------------------------------------------- /common/common.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/common.cpp -------------------------------------------------------------------------------- /common/common.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/common.h -------------------------------------------------------------------------------- /common/console.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/console.cpp -------------------------------------------------------------------------------- /common/console.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/console.h -------------------------------------------------------------------------------- /common/json-schema-to-grammar.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/json-schema-to-grammar.cpp -------------------------------------------------------------------------------- /common/json-schema-to-grammar.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/json-schema-to-grammar.h -------------------------------------------------------------------------------- /common/json.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/json.hpp -------------------------------------------------------------------------------- /common/log.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/log.cpp -------------------------------------------------------------------------------- /common/log.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/log.h -------------------------------------------------------------------------------- /common/ngram-cache.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/ngram-cache.cpp -------------------------------------------------------------------------------- /common/ngram-cache.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/ngram-cache.h -------------------------------------------------------------------------------- /common/sampling.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/sampling.cpp -------------------------------------------------------------------------------- /common/sampling.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/sampling.h -------------------------------------------------------------------------------- /common/stb_image.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/stb_image.h -------------------------------------------------------------------------------- /common/train.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/train.cpp -------------------------------------------------------------------------------- /common/train.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/common/train.h -------------------------------------------------------------------------------- /convert_hf_to_gguf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/convert_hf_to_gguf.py -------------------------------------------------------------------------------- /convert_hf_to_gguf_update.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/convert_hf_to_gguf_update.py -------------------------------------------------------------------------------- /convert_llama_ggml_to_gguf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/convert_llama_ggml_to_gguf.py -------------------------------------------------------------------------------- /convert_lora_to_gguf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/convert_lora_to_gguf.py -------------------------------------------------------------------------------- /docs/android.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/docs/android.md -------------------------------------------------------------------------------- /docs/backend/BLIS.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/docs/backend/BLIS.md -------------------------------------------------------------------------------- /docs/backend/CANN.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/docs/backend/CANN.md -------------------------------------------------------------------------------- /docs/backend/SYCL.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/docs/backend/SYCL.md -------------------------------------------------------------------------------- /docs/build.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/docs/build.md -------------------------------------------------------------------------------- /docs/development/HOWTO-add-model.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/docs/development/HOWTO-add-model.md -------------------------------------------------------------------------------- /docs/development/debugging-tests.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/docs/development/debugging-tests.md -------------------------------------------------------------------------------- /docs/development/llama-star/idea-arch.key: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/docs/development/llama-star/idea-arch.key -------------------------------------------------------------------------------- /docs/development/llama-star/idea-arch.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/docs/development/llama-star/idea-arch.pdf -------------------------------------------------------------------------------- /docs/development/token_generation_performance_tips.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/docs/development/token_generation_performance_tips.md -------------------------------------------------------------------------------- /docs/docker.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/docs/docker.md -------------------------------------------------------------------------------- /docs/install.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/docs/install.md -------------------------------------------------------------------------------- /flake.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/flake.lock -------------------------------------------------------------------------------- /flake.nix: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/flake.nix -------------------------------------------------------------------------------- /ggml/.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/.gitignore -------------------------------------------------------------------------------- /ggml/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/CMakeLists.txt -------------------------------------------------------------------------------- /ggml/cmake/FindSIMD.cmake: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/cmake/FindSIMD.cmake -------------------------------------------------------------------------------- /ggml/include/ggml-alloc.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/include/ggml-alloc.h -------------------------------------------------------------------------------- /ggml/include/ggml-backend.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/include/ggml-backend.h -------------------------------------------------------------------------------- /ggml/include/ggml-blas.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/include/ggml-blas.h -------------------------------------------------------------------------------- /ggml/include/ggml-cann.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/include/ggml-cann.h -------------------------------------------------------------------------------- /ggml/include/ggml-cuda.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/include/ggml-cuda.h -------------------------------------------------------------------------------- /ggml/include/ggml-kompute.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/include/ggml-kompute.h -------------------------------------------------------------------------------- /ggml/include/ggml-metal.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/include/ggml-metal.h -------------------------------------------------------------------------------- /ggml/include/ggml-rpc.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/include/ggml-rpc.h -------------------------------------------------------------------------------- /ggml/include/ggml-sycl.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/include/ggml-sycl.h -------------------------------------------------------------------------------- /ggml/include/ggml-vulkan.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/include/ggml-vulkan.h -------------------------------------------------------------------------------- /ggml/include/ggml.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/include/ggml.h -------------------------------------------------------------------------------- /ggml/src/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/CMakeLists.txt -------------------------------------------------------------------------------- /ggml/src/ggml-aarch64.c: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-aarch64.c -------------------------------------------------------------------------------- /ggml/src/ggml-aarch64.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-aarch64.h -------------------------------------------------------------------------------- /ggml/src/ggml-alloc.c: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-alloc.c -------------------------------------------------------------------------------- /ggml/src/ggml-backend-impl.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-backend-impl.h -------------------------------------------------------------------------------- /ggml/src/ggml-backend.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-backend.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-blas.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-blas.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-cann.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cann.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-cann/.clang-format: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cann/.clang-format -------------------------------------------------------------------------------- /ggml/src/ggml-cann/Doxyfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cann/Doxyfile -------------------------------------------------------------------------------- /ggml/src/ggml-cann/acl_tensor.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cann/acl_tensor.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-cann/acl_tensor.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cann/acl_tensor.h -------------------------------------------------------------------------------- /ggml/src/ggml-cann/aclnn_ops.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cann/aclnn_ops.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-cann/aclnn_ops.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cann/aclnn_ops.h -------------------------------------------------------------------------------- /ggml/src/ggml-cann/common.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cann/common.h -------------------------------------------------------------------------------- /ggml/src/ggml-cann/kernels/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cann/kernels/CMakeLists.txt -------------------------------------------------------------------------------- /ggml/src/ggml-cann/kernels/ascendc_kernels.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cann/kernels/ascendc_kernels.h -------------------------------------------------------------------------------- /ggml/src/ggml-cann/kernels/dup.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cann/kernels/dup.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-cann/kernels/get_row_f16.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cann/kernels/get_row_f16.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-cann/kernels/get_row_f32.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cann/kernels/get_row_f32.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-cann/kernels/get_row_q4_0.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cann/kernels/get_row_q4_0.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-cann/kernels/get_row_q8_0.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cann/kernels/get_row_q8_0.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-cann/kernels/quantize_f16_q8_0.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cann/kernels/quantize_f16_q8_0.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-cann/kernels/quantize_f32_q8_0.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cann/kernels/quantize_f32_q8_0.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-cann/kernels/quantize_float_to_q4_0.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cann/kernels/quantize_float_to_q4_0.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-common.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-common.h -------------------------------------------------------------------------------- /ggml/src/ggml-cpu-impl.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cpu-impl.h -------------------------------------------------------------------------------- /ggml/src/ggml-cuda.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/acc.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/acc.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/acc.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/acc.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/arange.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/arange.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/arange.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/arange.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/argmax.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/argmax.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/argmax.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/argmax.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/argsort.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/argsort.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/argsort.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/argsort.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/binbcast.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/binbcast.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/binbcast.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/binbcast.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/clamp.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/clamp.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/clamp.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/clamp.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/common.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/common.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/concat.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/concat.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/concat.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/concat.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/conv-transpose-1d.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/conv-transpose-1d.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/conv-transpose-1d.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/conv-transpose-1d.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/convert.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/convert.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/convert.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/convert.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/count-equal.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/count-equal.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/count-equal.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/count-equal.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/cpy.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/cpy.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/cpy.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/cpy.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/cross-entropy-loss.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/cross-entropy-loss.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/cross-entropy-loss.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/cross-entropy-loss.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/dequantize.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/dequantize.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/diagmask.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/diagmask.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/diagmask.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/diagmask.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/dmmv.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/dmmv.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/dmmv.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/dmmv.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/fattn-common.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/fattn-common.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/fattn-tile-f16.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/fattn-tile-f16.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/fattn-tile-f16.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/fattn-tile-f16.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/fattn-tile-f32.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/fattn-tile-f32.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/fattn-tile-f32.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/fattn-tile-f32.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/fattn-vec-f16.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/fattn-vec-f16.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/fattn-vec-f32.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/fattn-vec-f32.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/fattn-wmma-f16.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/fattn-wmma-f16.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/fattn.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/fattn.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/fattn.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/fattn.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/getrows.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/getrows.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/getrows.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/getrows.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/im2col.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/im2col.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/im2col.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/im2col.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/mma.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/mma.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/mmq.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/mmq.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/mmq.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/mmq.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/mmvq.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/mmvq.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/mmvq.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/mmvq.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/norm.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/norm.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/norm.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/norm.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/opt-step-adamw.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/opt-step-adamw.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/opt-step-adamw.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/opt-step-adamw.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/out-prod.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/out-prod.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/out-prod.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/out-prod.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/pad.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/pad.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/pad.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/pad.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/pool2d.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/pool2d.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/pool2d.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/pool2d.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/quantize.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/quantize.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/quantize.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/quantize.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/rope.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/rope.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/rope.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/rope.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/rwkv-wkv.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/rwkv-wkv.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/rwkv-wkv.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/rwkv-wkv.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/scale.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/scale.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/scale.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/scale.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/softmax.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/softmax.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/softmax.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/softmax.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/sum.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/sum.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/sum.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/sum.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/sumrows.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/sumrows.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/sumrows.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/sumrows.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q4_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q4_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q4_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q4_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q5_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q5_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q5_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q5_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q8_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q8_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-f16.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-f16.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q5_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q5_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q5_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q5_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q8_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q8_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-f16.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-f16.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q4_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q4_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q4_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q4_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q5_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q5_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q5_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q5_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q8_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q8_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-f16.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-f16.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q4_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q4_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q4_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q4_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q5_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q5_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q5_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q5_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q8_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q8_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-f16.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-f16.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q4_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q4_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q4_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q4_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q5_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q5_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q5_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q5_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q8_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q8_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-f16.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-f16.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q4_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q4_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q4_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q4_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q5_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q5_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q5_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q5_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q4_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q4_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q4_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q4_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q5_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q5_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q5_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q5_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q8_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q8_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q4_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q4_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q4_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q4_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q5_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q5_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q5_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q5_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q8_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q8_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-f16.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-f16.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q5_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q5_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q5_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q5_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q8_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q8_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-f16.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-f16.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q4_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q4_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q4_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q4_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q5_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q5_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q5_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q5_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q8_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q8_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-f16.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-f16.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q4_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q4_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q4_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q4_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q5_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q5_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q5_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q5_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q8_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q8_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-f16.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-f16.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q4_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q4_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q4_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q4_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q5_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q5_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q5_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q5_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q8_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q8_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-f16.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-f16.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q4_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q4_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q4_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q4_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q5_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q5_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q5_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q5_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q4_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q4_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q4_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q4_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q5_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q5_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q5_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q5_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q8_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q8_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/generate_cu_files.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/generate_cu_files.py -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/tsembd.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/tsembd.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/tsembd.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/tsembd.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/unary.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/unary.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/unary.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/unary.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/upscale.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/upscale.cu -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/upscale.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/upscale.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/vecdotq.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/vecdotq.cuh -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/vendors/cuda.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/vendors/cuda.h -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/vendors/hip.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/vendors/hip.h -------------------------------------------------------------------------------- /ggml/src/ggml-cuda/vendors/musa.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-cuda/vendors/musa.h -------------------------------------------------------------------------------- /ggml/src/ggml-impl.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-impl.h -------------------------------------------------------------------------------- /ggml/src/ggml-kompute.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-kompute.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-metal.m: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-metal.m -------------------------------------------------------------------------------- /ggml/src/ggml-metal.metal: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-metal.metal -------------------------------------------------------------------------------- /ggml/src/ggml-quants.c: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-quants.c -------------------------------------------------------------------------------- /ggml/src/ggml-quants.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-quants.h -------------------------------------------------------------------------------- /ggml/src/ggml-rpc.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-rpc.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/backend.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/backend.hpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/common.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/common.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/common.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/common.hpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/concat.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/concat.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/concat.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/concat.hpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/conv.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/conv.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/conv.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/conv.hpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/convert.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/convert.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/convert.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/convert.hpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/dequantize.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/dequantize.hpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/dmmv.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/dmmv.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/dmmv.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/dmmv.hpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/dpct/helper.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/dpct/helper.hpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/gemm.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/gemm.hpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/im2col.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/im2col.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/im2col.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/im2col.hpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/mmq.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/mmq.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/mmq.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/mmq.hpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/mmvq.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/mmvq.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/mmvq.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/mmvq.hpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/norm.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/norm.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/norm.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/norm.hpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/presets.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/presets.hpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/rope.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/rope.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/rope.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/rope.hpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/softmax.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/softmax.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/softmax.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/softmax.hpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/tsembd.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/tsembd.cpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/tsembd.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/tsembd.hpp -------------------------------------------------------------------------------- /ggml/src/ggml-sycl/vecdotq.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-sycl/vecdotq.hpp -------------------------------------------------------------------------------- /ggml/src/ggml-vulkan.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml-vulkan.cpp -------------------------------------------------------------------------------- /ggml/src/ggml.c: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/ggml.c -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/common.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/common.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_add.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_add.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_addrow.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_addrow.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_cpy_f16_f16.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_cpy_f16_f16.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_cpy_f16_f32.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_cpy_f16_f32.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_cpy_f32_f16.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_cpy_f32_f16.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_cpy_f32_f32.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_cpy_f32_f32.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_diagmask.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_diagmask.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_gelu.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_gelu.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_getrows.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_getrows.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_getrows_f16.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_getrows_f16.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_getrows_f32.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_getrows_f32.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_getrows_q4_0.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_getrows_q4_0.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_getrows_q4_1.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_getrows_q4_1.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_getrows_q6_k.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_getrows_q6_k.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_mul.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_mul.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_mul_mat_f16.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_mul_mat_f16.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_mul_mat_mat_f32.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_mul_mat_mat_f32.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_mul_mat_q4_0.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_mul_mat_q4_0.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_mul_mat_q4_1.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_mul_mat_q4_1.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_mul_mat_q6_k.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_mul_mat_q6_k.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_mul_mat_q8_0.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_mul_mat_q8_0.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_mul_mv_q_n.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_mul_mv_q_n.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_mul_mv_q_n_pre.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_mul_mv_q_n_pre.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_norm.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_norm.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_relu.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_relu.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_rmsnorm.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_rmsnorm.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_rope_f16.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_rope_f16.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_rope_f32.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_rope_f32.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_scale.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_scale.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_scale_8.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_scale_8.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_silu.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_silu.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/op_softmax.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/op_softmax.comp -------------------------------------------------------------------------------- /ggml/src/kompute-shaders/rope_common.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/kompute-shaders/rope_common.comp -------------------------------------------------------------------------------- /ggml/src/llamafile/sgemm.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/llamafile/sgemm.cpp -------------------------------------------------------------------------------- /ggml/src/llamafile/sgemm.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/llamafile/sgemm.h -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/CMakeLists.txt -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/acc.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/acc.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/add.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/add.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/argsort.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/argsort.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/clamp.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/clamp.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/concat.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/concat.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/copy.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/copy.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/cos.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/cos.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/dequant_f32.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/dequant_f32.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/dequant_funcs.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/dequant_funcs.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/dequant_head.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/dequant_head.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/dequant_iq4_nl.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/dequant_iq4_nl.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/dequant_q2_k.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/dequant_q2_k.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/dequant_q3_k.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/dequant_q3_k.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/dequant_q4_0.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/dequant_q4_0.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/dequant_q4_1.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/dequant_q4_1.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/dequant_q4_k.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/dequant_q4_k.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/dequant_q5_0.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/dequant_q5_0.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/dequant_q5_1.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/dequant_q5_1.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/dequant_q5_k.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/dequant_q5_k.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/dequant_q6_k.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/dequant_q6_k.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/dequant_q8_0.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/dequant_q8_0.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/diag_mask_inf.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/diag_mask_inf.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/div.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/div.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/gelu.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/gelu.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/gelu_quick.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/gelu_quick.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/generic_binary_head.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/generic_binary_head.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/generic_head.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/generic_head.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/generic_unary_head.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/generic_unary_head.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/get_rows.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/get_rows.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/get_rows_quant.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/get_rows_quant.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/group_norm.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/group_norm.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/im2col.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/im2col.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/leaky_relu.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/leaky_relu.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/mul.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/mul.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/mul_mat_split_k_reduce.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/mul_mat_split_k_reduce.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/mul_mat_vec.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/mul_mat_vec.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/mul_mat_vec_base.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/mul_mat_vec_base.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/mul_mat_vec_nc.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/mul_mat_vec_nc.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/mul_mat_vec_p021.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/mul_mat_vec_p021.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/mul_mat_vec_q2_k.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/mul_mat_vec_q2_k.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/mul_mat_vec_q3_k.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/mul_mat_vec_q3_k.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/mul_mat_vec_q4_k.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/mul_mat_vec_q4_k.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/mul_mat_vec_q5_k.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/mul_mat_vec_q5_k.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/mul_mat_vec_q6_k.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/mul_mat_vec_q6_k.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/mul_mm.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/mul_mm.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/norm.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/norm.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/pad.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/pad.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/relu.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/relu.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/repeat.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/repeat.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/rms_norm.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/rms_norm.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/rope_head.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/rope_head.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/rope_neox.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/rope_neox.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/rope_norm.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/rope_norm.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/scale.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/scale.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/silu.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/silu.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/sin.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/sin.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/soft_max.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/soft_max.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/square.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/square.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/sum_rows.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/sum_rows.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/tanh.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/tanh.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/timestep_embedding.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/timestep_embedding.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/types.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/types.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/upscale.comp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/upscale.comp -------------------------------------------------------------------------------- /ggml/src/vulkan-shaders/vulkan-shaders-gen.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/ggml/src/vulkan-shaders/vulkan-shaders-gen.cpp -------------------------------------------------------------------------------- /gguf-py/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/LICENSE -------------------------------------------------------------------------------- /gguf-py/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/README.md -------------------------------------------------------------------------------- /gguf-py/examples/reader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/examples/reader.py -------------------------------------------------------------------------------- /gguf-py/examples/writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/examples/writer.py -------------------------------------------------------------------------------- /gguf-py/gguf/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/gguf/__init__.py -------------------------------------------------------------------------------- /gguf-py/gguf/constants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/gguf/constants.py -------------------------------------------------------------------------------- /gguf-py/gguf/gguf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/gguf/gguf.py -------------------------------------------------------------------------------- /gguf-py/gguf/gguf_reader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/gguf/gguf_reader.py -------------------------------------------------------------------------------- /gguf-py/gguf/gguf_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/gguf/gguf_writer.py -------------------------------------------------------------------------------- /gguf-py/gguf/lazy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/gguf/lazy.py -------------------------------------------------------------------------------- /gguf-py/gguf/metadata.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/gguf/metadata.py -------------------------------------------------------------------------------- /gguf-py/gguf/py.typed: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /gguf-py/gguf/quants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/gguf/quants.py -------------------------------------------------------------------------------- /gguf-py/gguf/tensor_mapping.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/gguf/tensor_mapping.py -------------------------------------------------------------------------------- /gguf-py/gguf/utility.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/gguf/utility.py -------------------------------------------------------------------------------- /gguf-py/gguf/vocab.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/gguf/vocab.py -------------------------------------------------------------------------------- /gguf-py/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/pyproject.toml -------------------------------------------------------------------------------- /gguf-py/scripts/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/scripts/__init__.py -------------------------------------------------------------------------------- /gguf-py/scripts/gguf_convert_endian.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/scripts/gguf_convert_endian.py -------------------------------------------------------------------------------- /gguf-py/scripts/gguf_dump.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/scripts/gguf_dump.py -------------------------------------------------------------------------------- /gguf-py/scripts/gguf_hash.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/scripts/gguf_hash.py -------------------------------------------------------------------------------- /gguf-py/scripts/gguf_new_metadata.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/scripts/gguf_new_metadata.py -------------------------------------------------------------------------------- /gguf-py/scripts/gguf_set_metadata.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/scripts/gguf_set_metadata.py -------------------------------------------------------------------------------- /gguf-py/tests/__init__.py: -------------------------------------------------------------------------------- 1 | from .test_metadata import * 2 | -------------------------------------------------------------------------------- /gguf-py/tests/test_metadata.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/tests/test_metadata.py -------------------------------------------------------------------------------- /gguf-py/tests/test_quants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/gguf-py/tests/test_quants.py -------------------------------------------------------------------------------- /grammars/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/grammars/README.md -------------------------------------------------------------------------------- /grammars/arithmetic.gbnf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/grammars/arithmetic.gbnf -------------------------------------------------------------------------------- /grammars/c.gbnf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/grammars/c.gbnf -------------------------------------------------------------------------------- /grammars/chess.gbnf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/grammars/chess.gbnf -------------------------------------------------------------------------------- /grammars/japanese.gbnf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/grammars/japanese.gbnf -------------------------------------------------------------------------------- /grammars/json.gbnf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/grammars/json.gbnf -------------------------------------------------------------------------------- /grammars/json_arr.gbnf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/grammars/json_arr.gbnf -------------------------------------------------------------------------------- /grammars/list.gbnf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/grammars/list.gbnf -------------------------------------------------------------------------------- /include/llama.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/include/llama.h -------------------------------------------------------------------------------- /lac.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/lac.cpp -------------------------------------------------------------------------------- /lang-cli-src/config.cpp: -------------------------------------------------------------------------------- 1 | #include "config.h" -------------------------------------------------------------------------------- /lang-cli-src/config.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/lang-cli-src/config.h -------------------------------------------------------------------------------- /lang-cli-src/console_manager.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/lang-cli-src/console_manager.cpp -------------------------------------------------------------------------------- /lang-cli-src/console_manager.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/lang-cli-src/console_manager.h -------------------------------------------------------------------------------- /lang-cli-src/file_manager.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/lang-cli-src/file_manager.cpp -------------------------------------------------------------------------------- /lang-cli-src/file_manager.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/lang-cli-src/file_manager.h -------------------------------------------------------------------------------- /lang-cli-src/model_manager.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/lang-cli-src/model_manager.cpp -------------------------------------------------------------------------------- /lang-cli-src/model_manager.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/lang-cli-src/model_manager.h -------------------------------------------------------------------------------- /lang-cli-src/output_parser.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/lang-cli-src/output_parser.cpp -------------------------------------------------------------------------------- /lang-cli-src/output_parser.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/lang-cli-src/output_parser.h -------------------------------------------------------------------------------- /lang-cli-src/shell_executor.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/lang-cli-src/shell_executor.cpp -------------------------------------------------------------------------------- /lang-cli-src/shell_executor.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/lang-cli-src/shell_executor.h -------------------------------------------------------------------------------- /lang-cli-src/str_parser.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/lang-cli-src/str_parser.cpp -------------------------------------------------------------------------------- /lang-cli-src/str_parser.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/lang-cli-src/str_parser.h -------------------------------------------------------------------------------- /media/llama-leader.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/media/llama-leader.jpeg -------------------------------------------------------------------------------- /media/llama0-banner.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/media/llama0-banner.png -------------------------------------------------------------------------------- /media/llama0-logo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/media/llama0-logo.png -------------------------------------------------------------------------------- /media/llama1-banner.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/media/llama1-banner.png -------------------------------------------------------------------------------- /media/llama1-logo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/media/llama1-logo.png -------------------------------------------------------------------------------- /media/matmul.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/media/matmul.png -------------------------------------------------------------------------------- /media/matmul.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/media/matmul.svg -------------------------------------------------------------------------------- /models/.editorconfig: -------------------------------------------------------------------------------- 1 | root = true 2 | -------------------------------------------------------------------------------- /models/ggml-vocab-aquila.gguf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-aquila.gguf -------------------------------------------------------------------------------- /models/ggml-vocab-baichuan.gguf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-baichuan.gguf -------------------------------------------------------------------------------- /models/ggml-vocab-bert-bge.gguf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-bert-bge.gguf -------------------------------------------------------------------------------- /models/ggml-vocab-bert-bge.gguf.inp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-bert-bge.gguf.inp -------------------------------------------------------------------------------- /models/ggml-vocab-bert-bge.gguf.out: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-bert-bge.gguf.out -------------------------------------------------------------------------------- /models/ggml-vocab-chameleon.gguf.inp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-chameleon.gguf.inp -------------------------------------------------------------------------------- /models/ggml-vocab-chameleon.gguf.out: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-chameleon.gguf.out -------------------------------------------------------------------------------- /models/ggml-vocab-command-r.gguf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-command-r.gguf -------------------------------------------------------------------------------- /models/ggml-vocab-command-r.gguf.inp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-command-r.gguf.inp -------------------------------------------------------------------------------- /models/ggml-vocab-command-r.gguf.out: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-command-r.gguf.out -------------------------------------------------------------------------------- /models/ggml-vocab-deepseek-coder.gguf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-deepseek-coder.gguf -------------------------------------------------------------------------------- /models/ggml-vocab-deepseek-coder.gguf.inp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-deepseek-coder.gguf.inp -------------------------------------------------------------------------------- /models/ggml-vocab-deepseek-coder.gguf.out: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-deepseek-coder.gguf.out -------------------------------------------------------------------------------- /models/ggml-vocab-deepseek-llm.gguf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-deepseek-llm.gguf -------------------------------------------------------------------------------- /models/ggml-vocab-deepseek-llm.gguf.inp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-deepseek-llm.gguf.inp -------------------------------------------------------------------------------- /models/ggml-vocab-deepseek-llm.gguf.out: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-deepseek-llm.gguf.out -------------------------------------------------------------------------------- /models/ggml-vocab-falcon.gguf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-falcon.gguf -------------------------------------------------------------------------------- /models/ggml-vocab-falcon.gguf.inp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-falcon.gguf.inp -------------------------------------------------------------------------------- /models/ggml-vocab-falcon.gguf.out: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-falcon.gguf.out -------------------------------------------------------------------------------- /models/ggml-vocab-gpt-2.gguf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-gpt-2.gguf -------------------------------------------------------------------------------- /models/ggml-vocab-gpt-2.gguf.inp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-gpt-2.gguf.inp -------------------------------------------------------------------------------- /models/ggml-vocab-gpt-2.gguf.out: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-gpt-2.gguf.out -------------------------------------------------------------------------------- /models/ggml-vocab-gpt-neox.gguf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-gpt-neox.gguf -------------------------------------------------------------------------------- /models/ggml-vocab-llama-bpe.gguf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-llama-bpe.gguf -------------------------------------------------------------------------------- /models/ggml-vocab-llama-bpe.gguf.inp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-llama-bpe.gguf.inp -------------------------------------------------------------------------------- /models/ggml-vocab-llama-bpe.gguf.out: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-llama-bpe.gguf.out -------------------------------------------------------------------------------- /models/ggml-vocab-llama-spm.gguf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-llama-spm.gguf -------------------------------------------------------------------------------- /models/ggml-vocab-llama-spm.gguf.inp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-llama-spm.gguf.inp -------------------------------------------------------------------------------- /models/ggml-vocab-llama-spm.gguf.out: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-llama-spm.gguf.out -------------------------------------------------------------------------------- /models/ggml-vocab-mpt.gguf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-mpt.gguf -------------------------------------------------------------------------------- /models/ggml-vocab-mpt.gguf.inp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-mpt.gguf.inp -------------------------------------------------------------------------------- /models/ggml-vocab-mpt.gguf.out: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-mpt.gguf.out -------------------------------------------------------------------------------- /models/ggml-vocab-phi-3.gguf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-phi-3.gguf -------------------------------------------------------------------------------- /models/ggml-vocab-phi-3.gguf.inp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-phi-3.gguf.inp -------------------------------------------------------------------------------- /models/ggml-vocab-phi-3.gguf.out: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-phi-3.gguf.out -------------------------------------------------------------------------------- /models/ggml-vocab-qwen2.gguf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-qwen2.gguf -------------------------------------------------------------------------------- /models/ggml-vocab-qwen2.gguf.inp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-qwen2.gguf.inp -------------------------------------------------------------------------------- /models/ggml-vocab-qwen2.gguf.out: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-qwen2.gguf.out -------------------------------------------------------------------------------- /models/ggml-vocab-refact.gguf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-refact.gguf -------------------------------------------------------------------------------- /models/ggml-vocab-refact.gguf.inp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-refact.gguf.inp -------------------------------------------------------------------------------- /models/ggml-vocab-refact.gguf.out: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-refact.gguf.out -------------------------------------------------------------------------------- /models/ggml-vocab-starcoder.gguf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-starcoder.gguf -------------------------------------------------------------------------------- /models/ggml-vocab-starcoder.gguf.inp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-starcoder.gguf.inp -------------------------------------------------------------------------------- /models/ggml-vocab-starcoder.gguf.out: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/models/ggml-vocab-starcoder.gguf.out -------------------------------------------------------------------------------- /mypy.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/mypy.ini -------------------------------------------------------------------------------- /output.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/output.gif -------------------------------------------------------------------------------- /pocs/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/pocs/CMakeLists.txt -------------------------------------------------------------------------------- /pocs/vdot/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/pocs/vdot/CMakeLists.txt -------------------------------------------------------------------------------- /pocs/vdot/q8dot.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/pocs/vdot/q8dot.cpp -------------------------------------------------------------------------------- /pocs/vdot/vdot.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/pocs/vdot/vdot.cpp -------------------------------------------------------------------------------- /poetry.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/poetry.lock -------------------------------------------------------------------------------- /prompts/LLM-questions.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/prompts/LLM-questions.txt -------------------------------------------------------------------------------- /prompts/alpaca.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/prompts/alpaca.txt -------------------------------------------------------------------------------- /prompts/assistant.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/prompts/assistant.txt -------------------------------------------------------------------------------- /prompts/chat-with-baichuan.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/prompts/chat-with-baichuan.txt -------------------------------------------------------------------------------- /prompts/chat-with-bob.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/prompts/chat-with-bob.txt -------------------------------------------------------------------------------- /prompts/chat-with-qwen.txt: -------------------------------------------------------------------------------- 1 | You are a helpful assistant. -------------------------------------------------------------------------------- /prompts/chat-with-vicuna-v0.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/prompts/chat-with-vicuna-v0.txt -------------------------------------------------------------------------------- /prompts/chat-with-vicuna-v1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/prompts/chat-with-vicuna-v1.txt -------------------------------------------------------------------------------- /prompts/chat.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/prompts/chat.txt -------------------------------------------------------------------------------- /prompts/dan-modified.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/prompts/dan-modified.txt -------------------------------------------------------------------------------- /prompts/dan.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/prompts/dan.txt -------------------------------------------------------------------------------- /prompts/mnemonics.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/prompts/mnemonics.txt -------------------------------------------------------------------------------- /prompts/parallel-questions.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/prompts/parallel-questions.txt -------------------------------------------------------------------------------- /prompts/reason-act.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/prompts/reason-act.txt -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/pyproject.toml -------------------------------------------------------------------------------- /pyrightconfig.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/pyrightconfig.json -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/requirements.txt -------------------------------------------------------------------------------- /requirements/requirements-all.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/requirements/requirements-all.txt -------------------------------------------------------------------------------- /requirements/requirements-compare-llama-bench.txt: -------------------------------------------------------------------------------- 1 | tabulate~=0.9.0 2 | GitPython~=3.1.43 3 | -------------------------------------------------------------------------------- /requirements/requirements-convert_hf_to_gguf.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/requirements/requirements-convert_hf_to_gguf.txt -------------------------------------------------------------------------------- /requirements/requirements-convert_hf_to_gguf_update.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/requirements/requirements-convert_hf_to_gguf_update.txt -------------------------------------------------------------------------------- /requirements/requirements-convert_legacy_llama.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/requirements/requirements-convert_legacy_llama.txt -------------------------------------------------------------------------------- /requirements/requirements-convert_llama_ggml_to_gguf.txt: -------------------------------------------------------------------------------- 1 | -r ./requirements-convert_legacy_llama.txt 2 | -------------------------------------------------------------------------------- /requirements/requirements-convert_lora_to_gguf.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/requirements/requirements-convert_lora_to_gguf.txt -------------------------------------------------------------------------------- /requirements/requirements-pydantic.txt: -------------------------------------------------------------------------------- 1 | docstring_parser~=0.15 2 | pydantic~=2.6.3 3 | requests 4 | -------------------------------------------------------------------------------- /requirements/requirements-test-tokenizer-random.txt: -------------------------------------------------------------------------------- 1 | cffi~=1.16.0 2 | -------------------------------------------------------------------------------- /scripts/build-info.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/build-info.sh -------------------------------------------------------------------------------- /scripts/check-requirements.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/check-requirements.sh -------------------------------------------------------------------------------- /scripts/ci-run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/ci-run.sh -------------------------------------------------------------------------------- /scripts/compare-commits.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/compare-commits.sh -------------------------------------------------------------------------------- /scripts/compare-llama-bench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/compare-llama-bench.py -------------------------------------------------------------------------------- /scripts/debug-test.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/debug-test.sh -------------------------------------------------------------------------------- /scripts/gen-authors.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/gen-authors.sh -------------------------------------------------------------------------------- /scripts/gen-unicode-data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/gen-unicode-data.py -------------------------------------------------------------------------------- /scripts/get-flags.mk: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/get-flags.mk -------------------------------------------------------------------------------- /scripts/get-hellaswag.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/get-hellaswag.sh -------------------------------------------------------------------------------- /scripts/get-pg.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/get-pg.sh -------------------------------------------------------------------------------- /scripts/get-wikitext-103.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/get-wikitext-103.sh -------------------------------------------------------------------------------- /scripts/get-wikitext-2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/get-wikitext-2.sh -------------------------------------------------------------------------------- /scripts/get-winogrande.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/get-winogrande.sh -------------------------------------------------------------------------------- /scripts/hf.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/hf.sh -------------------------------------------------------------------------------- /scripts/install-oneapi.bat: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/install-oneapi.bat -------------------------------------------------------------------------------- /scripts/pod-llama.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/pod-llama.sh -------------------------------------------------------------------------------- /scripts/qnt-all.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/qnt-all.sh -------------------------------------------------------------------------------- /scripts/run-all-perf.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/run-all-perf.sh -------------------------------------------------------------------------------- /scripts/run-all-ppl.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/run-all-ppl.sh -------------------------------------------------------------------------------- /scripts/run-with-preset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/run-with-preset.py -------------------------------------------------------------------------------- /scripts/server-llm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/server-llm.sh -------------------------------------------------------------------------------- /scripts/sync-ggml-am.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/sync-ggml-am.sh -------------------------------------------------------------------------------- /scripts/sync-ggml.last: -------------------------------------------------------------------------------- 1 | b77f48b1efa671e094696b99fbf566aac8c87d74 2 | -------------------------------------------------------------------------------- /scripts/sync-ggml.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/sync-ggml.sh -------------------------------------------------------------------------------- /scripts/verify-checksum-models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/verify-checksum-models.py -------------------------------------------------------------------------------- /scripts/xxd.cmake: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/scripts/xxd.cmake -------------------------------------------------------------------------------- /spm-headers/ggml-alloc.h: -------------------------------------------------------------------------------- 1 | ../ggml/include/ggml-alloc.h -------------------------------------------------------------------------------- /spm-headers/ggml-backend.h: -------------------------------------------------------------------------------- 1 | ../ggml/include/ggml-backend.h -------------------------------------------------------------------------------- /spm-headers/ggml-metal.h: -------------------------------------------------------------------------------- 1 | ../ggml/include/ggml-metal.h -------------------------------------------------------------------------------- /spm-headers/ggml.h: -------------------------------------------------------------------------------- 1 | ../ggml/include/ggml.h -------------------------------------------------------------------------------- /spm-headers/llama.h: -------------------------------------------------------------------------------- 1 | ../include/llama.h -------------------------------------------------------------------------------- /src/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/src/CMakeLists.txt -------------------------------------------------------------------------------- /src/llama-grammar.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/src/llama-grammar.cpp -------------------------------------------------------------------------------- /src/llama-grammar.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/src/llama-grammar.h -------------------------------------------------------------------------------- /src/llama-impl.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/src/llama-impl.h -------------------------------------------------------------------------------- /src/llama-sampling.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/src/llama-sampling.cpp -------------------------------------------------------------------------------- /src/llama-sampling.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/src/llama-sampling.h -------------------------------------------------------------------------------- /src/llama-vocab.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/src/llama-vocab.cpp -------------------------------------------------------------------------------- /src/llama-vocab.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/src/llama-vocab.h -------------------------------------------------------------------------------- /src/llama.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/src/llama.cpp -------------------------------------------------------------------------------- /src/unicode-data.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/src/unicode-data.cpp -------------------------------------------------------------------------------- /src/unicode-data.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/src/unicode-data.h -------------------------------------------------------------------------------- /src/unicode.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/src/unicode.cpp -------------------------------------------------------------------------------- /src/unicode.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/src/unicode.h -------------------------------------------------------------------------------- /tests/.gitignore: -------------------------------------------------------------------------------- 1 | * 2 | !*.* 3 | *.o 4 | ggml-common.h 5 | -------------------------------------------------------------------------------- /tests/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/CMakeLists.txt -------------------------------------------------------------------------------- /tests/get-model.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/get-model.cpp -------------------------------------------------------------------------------- /tests/get-model.h: -------------------------------------------------------------------------------- 1 | #pragma once 2 | char * get_model_or_exit(int, char*[]); 3 | -------------------------------------------------------------------------------- /tests/run-json-schema-to-grammar.mjs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/run-json-schema-to-grammar.mjs -------------------------------------------------------------------------------- /tests/test-arg-parser.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-arg-parser.cpp -------------------------------------------------------------------------------- /tests/test-autorelease.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-autorelease.cpp -------------------------------------------------------------------------------- /tests/test-backend-ops.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-backend-ops.cpp -------------------------------------------------------------------------------- /tests/test-barrier.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-barrier.cpp -------------------------------------------------------------------------------- /tests/test-c.c: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-c.c -------------------------------------------------------------------------------- /tests/test-chat-template.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-chat-template.cpp -------------------------------------------------------------------------------- /tests/test-double-float.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-double-float.cpp -------------------------------------------------------------------------------- /tests/test-grad0.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-grad0.cpp -------------------------------------------------------------------------------- /tests/test-grammar-integration.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-grammar-integration.cpp -------------------------------------------------------------------------------- /tests/test-grammar-parser.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-grammar-parser.cpp -------------------------------------------------------------------------------- /tests/test-json-schema-to-grammar.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-json-schema-to-grammar.cpp -------------------------------------------------------------------------------- /tests/test-llama-grammar.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-llama-grammar.cpp -------------------------------------------------------------------------------- /tests/test-log.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-log.cpp -------------------------------------------------------------------------------- /tests/test-lora-conversion-inference.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-lora-conversion-inference.sh -------------------------------------------------------------------------------- /tests/test-model-load-cancel.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-model-load-cancel.cpp -------------------------------------------------------------------------------- /tests/test-opt.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-opt.cpp -------------------------------------------------------------------------------- /tests/test-quantize-fns.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-quantize-fns.cpp -------------------------------------------------------------------------------- /tests/test-quantize-perf.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-quantize-perf.cpp -------------------------------------------------------------------------------- /tests/test-rope.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-rope.cpp -------------------------------------------------------------------------------- /tests/test-sampling.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-sampling.cpp -------------------------------------------------------------------------------- /tests/test-tokenizer-0.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-tokenizer-0.cpp -------------------------------------------------------------------------------- /tests/test-tokenizer-0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-tokenizer-0.py -------------------------------------------------------------------------------- /tests/test-tokenizer-0.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-tokenizer-0.sh -------------------------------------------------------------------------------- /tests/test-tokenizer-1-bpe.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-tokenizer-1-bpe.cpp -------------------------------------------------------------------------------- /tests/test-tokenizer-1-spm.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-tokenizer-1-spm.cpp -------------------------------------------------------------------------------- /tests/test-tokenizer-random.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/guoriyue/LangCommand/HEAD/tests/test-tokenizer-random.py --------------------------------------------------------------------------------