├── .gitmodules
├── models
    ├── .gitignore
    ├── requirements-openvino.txt
    ├── requirements-coreml.txt
    ├── for-tests-ggml-base.bin
    ├── for-tests-ggml-tiny.bin
    ├── for-tests-ggml-base.en.bin
    ├── for-tests-ggml-large.bin
    ├── for-tests-ggml-medium.bin
    ├── for-tests-ggml-small.bin
    ├── for-tests-ggml-tiny.en.bin
    ├── for-tests-ggml-medium.en.bin
    └── for-tests-ggml-small.en.bin
├── bindings
    ├── go
    │   ├── .gitignore
    │   ├── samples
    │   │   └── jfk.wav
    │   ├── pkg
    │   │   └── whisper
    │   │   │   ├── doc.go
    │   │   │   ├── util_test.go
    │   │   │   └── consts.go
    │   ├── doc.go
    │   ├── go.mod
    │   └── examples
    │   │   ├── go-whisper
    │   │       └── color.go
    │   │   └── go-model-download
    │   │       └── context.go
    ├── javascript
    │   ├── .gitignore
    │   ├── package.json
    │   └── package-tmpl.json
    ├── ruby
    │   ├── .gitignore
    │   ├── tests
    │   │   ├── jfk_reader
    │   │   │   ├── extconf.rb
    │   │   │   └── .gitignore
    │   │   ├── test_error.rb
    │   │   └── helper.rb
    │   ├── ext
    │   │   ├── .gitignore
    │   │   ├── metal.mk
    │   │   ├── cpu.mk
    │   │   └── ruby_whisper.h
    │   └── extsources.rb
    ├── java
    │   ├── settings.gradle
    │   ├── gradle
    │   │   └── wrapper
    │   │   │   ├── gradle-wrapper.jar
    │   │   │   └── gradle-wrapper.properties
    │   ├── src
    │   │   ├── main
    │   │   │   └── java
    │   │   │   │   └── io
    │   │   │   │       └── github
    │   │   │   │           └── ggerganov
    │   │   │   │               └── whispercpp
    │   │   │   │                   ├── ggml
    │   │   │   │                       ├── GgmlTensor.java
    │   │   │   │                       └── GgmlType.java
    │   │   │   │                   ├── model
    │   │   │   │                       ├── WhisperState.java
    │   │   │   │                       └── EModel.java
    │   │   │   │                   ├── params
    │   │   │   │                       ├── WhisperFilters.java
    │   │   │   │                       ├── WhisperSamplingStrategy.java
    │   │   │   │                       ├── WhisperHParams.java
    │   │   │   │                       ├── GreedyParams.java
    │   │   │   │                       ├── BeamSearchParams.java
    │   │   │   │                       └── CBool.java
    │   │   │   │                   └── callbacks
    │   │   │   │                       └── WhisperProgressCallback.java
    │   │   └── test
    │   │   │   └── java
    │   │   │       └── io
    │   │   │           └── github
    │   │   │               └── ggerganov
    │   │   │                   └── whispercpp
    │   │   │                       └── WhisperJnaLibraryTest.java
    │   └── gradle.properties
    └── CMakeLists.txt
├── examples
    ├── whisper.android
    │   ├── app
    │   │   ├── .gitignore
    │   │   ├── src
    │   │   │   ├── main
    │   │   │   │   ├── res
    │   │   │   │   │   ├── values
    │   │   │   │   │   │   ├── strings.xml
    │   │   │   │   │   │   └── themes.xml
    │   │   │   │   │   ├── mipmap-anydpi
    │   │   │   │   │   │   └── ic_launcher.xml
    │   │   │   │   │   └── xml
    │   │   │   │   │   │   ├── backup_rules.xml
    │   │   │   │   │   │   └── data_extraction_rules.xml
    │   │   │   │   └── java
    │   │   │   │   │   └── com
    │   │   │   │   │       └── whispercppdemo
    │   │   │   │   │           ├── ui
    │   │   │   │   │               └── theme
    │   │   │   │   │               │   └── Color.kt
    │   │   │   │   │           └── MainActivity.kt
    │   │   │   ├── test
    │   │   │   │   └── java
    │   │   │   │   │   └── com
    │   │   │   │   │       └── whispercppdemo
    │   │   │   │   │           └── ExampleUnitTest.kt
    │   │   │   └── androidTest
    │   │   │   │   └── java
    │   │   │   │       └── com
    │   │   │   │           └── whispercppdemo
    │   │   │   │               └── ExampleInstrumentedTest.kt
    │   │   └── proguard-rules.pro
    │   ├── lib
    │   │   ├── .gitignore
    │   │   └── src
    │   │   │   └── main
    │   │   │       └── AndroidManifest.xml
    │   ├── .idea
    │   │   ├── .name
    │   │   ├── .gitignore
    │   │   ├── compiler.xml
    │   │   ├── vcs.xml
    │   │   ├── misc.xml
    │   │   └── gradle.xml
    │   ├── gradle
    │   │   └── wrapper
    │   │   │   ├── gradle-wrapper.jar
    │   │   │   └── gradle-wrapper.properties
    │   ├── .gitignore
    │   ├── build.gradle
    │   └── settings.gradle
    ├── talk-llama
    │   ├── llama-quant.h
    │   ├── .gitignore
    │   ├── llama-cparams.cpp
    │   ├── llama-memory.cpp
    │   ├── speak.bat
    │   ├── llama-io.cpp
    │   ├── speak.ps1
    │   ├── unicode-data.h
    │   ├── llama-sampling.h
    │   ├── llama-memory.h
    │   └── llama-io.h
    ├── whisper.android.java
    │   ├── app
    │   │   ├── .gitignore
    │   │   ├── src
    │   │   │   ├── main
    │   │   │   │   ├── res
    │   │   │   │   │   ├── values
    │   │   │   │   │   │   ├── strings.xml
    │   │   │   │   │   │   ├── colors.xml
    │   │   │   │   │   │   └── themes.xml
    │   │   │   │   │   ├── mipmap-hdpi
    │   │   │   │   │   │   ├── ic_launcher.png
    │   │   │   │   │   │   └── ic_launcher_round.png
    │   │   │   │   │   ├── mipmap-mdpi
    │   │   │   │   │   │   ├── ic_launcher.png
    │   │   │   │   │   │   └── ic_launcher_round.png
    │   │   │   │   │   ├── mipmap-xhdpi
    │   │   │   │   │   │   ├── ic_launcher.png
    │   │   │   │   │   │   └── ic_launcher_round.png
    │   │   │   │   │   ├── mipmap-xxhdpi
    │   │   │   │   │   │   ├── ic_launcher.png
    │   │   │   │   │   │   └── ic_launcher_round.png
    │   │   │   │   │   ├── mipmap-xxxhdpi
    │   │   │   │   │   │   ├── ic_launcher.png
    │   │   │   │   │   │   └── ic_launcher_round.png
    │   │   │   │   │   ├── mipmap-anydpi-v26
    │   │   │   │   │   │   ├── ic_launcher.xml
    │   │   │   │   │   │   └── ic_launcher_round.xml
    │   │   │   │   │   └── values-night
    │   │   │   │   │   │   └── themes.xml
    │   │   │   │   ├── java
    │   │   │   │   │   └── com
    │   │   │   │   │   │   ├── litongjava
    │   │   │   │   │   │       └── whisper
    │   │   │   │   │   │       │   └── android
    │   │   │   │   │   │       │       └── java
    │   │   │   │   │   │       │           └── app
    │   │   │   │   │   │       │               └── App.java
    │   │   │   │   │   │   └── whispercpp
    │   │   │   │   │   │       └── java
    │   │   │   │   │   │           └── whisper
    │   │   │   │   │   │               └── WhisperCpuConfig.java
    │   │   │   │   └── AndroidManifest.xml
    │   │   │   └── test
    │   │   │   │   └── java
    │   │   │   │       └── com
    │   │   │   │           └── litongjava
    │   │   │   │               └── whisper
    │   │   │   │                   └── android
    │   │   │   │                       └── java
    │   │   │   │                           └── ExampleUnitTest.java
    │   │   └── proguard-rules.pro
    │   ├── settings.gradle
    │   ├── README_files
    │   │   └── 1.jpg
    │   ├── gradle
    │   │   └── wrapper
    │   │   │   ├── gradle-wrapper.jar
    │   │   │   └── gradle-wrapper.properties
    │   ├── .gitignore
    │   └── build.gradle
    ├── addon.node
    │   ├── .gitignore
    │   ├── package.json
    │   └── __test__
    │   │   └── whisper.spec.js
    ├── whisper.swiftui
    │   ├── .gitignore
    │   ├── whisper.swiftui.demo
    │   │   ├── Resources
    │   │   │   ├── models
    │   │   │   │   └── .gitignore
    │   │   │   └── samples
    │   │   │   │   └── .gitignore
    │   │   ├── Supporting files
    │   │   │   ├── Assets.xcassets
    │   │   │   │   ├── Contents.json
    │   │   │   │   └── AccentColor.colorset
    │   │   │   │   │   └── Contents.json
    │   │   │   ├── Preview Content
    │   │   │   │   └── Preview Assets.xcassets
    │   │   │   │   │   └── Contents.json
    │   │   │   └── WhisperCppDemo.entitlements
    │   │   ├── WhisperCppDemoApp.swift
    │   │   ├── Utils
    │   │   │   └── RiffWaveUtils.swift
    │   │   └── Models
    │   │   │   └── Model.swift
    │   └── whisper.swiftui.xcodeproj
    │   │   ├── .gitignore
    │   │   └── project.xcworkspace
    │   │       ├── .gitignore
    │   │       └── xcshareddata
    │   │           └── IDEWorkspaceChecks.plist
    ├── quantize
    │   ├── README.md
    │   └── CMakeLists.txt
    ├── command
    │   ├── commands.txt
    │   └── CMakeLists.txt
    ├── whisper.objc
    │   ├── whisper.objc
    │   │   ├── Assets.xcassets
    │   │   │   ├── Contents.json
    │   │   │   ├── AccentColor.colorset
    │   │   │   │   └── Contents.json
    │   │   │   └── AppIcon.appiconset
    │   │   │   │   └── Contents.json
    │   │   ├── AppDelegate.h
    │   │   ├── SceneDelegate.h
    │   │   ├── main.m
    │   │   └── Info.plist
    │   └── whisper.objc.xcodeproj
    │   │   └── project.xcworkspace
    │   │       ├── contents.xcworkspacedata
    │   │       └── xcshareddata
    │   │           └── IDEWorkspaceChecks.plist
    ├── wchess
    │   ├── wchess.wasm
    │   │   └── chessboardjs-1.0.0
    │   │   │   ├── img
    │   │   │       └── chesspieces
    │   │   │       │   └── wikipedia
    │   │   │       │       ├── bB.png
    │   │   │       │       ├── bK.png
    │   │   │       │       ├── bN.png
    │   │   │       │       ├── bP.png
    │   │   │       │       ├── bQ.png
    │   │   │       │       ├── bR.png
    │   │   │       │       ├── wB.png
    │   │   │       │       ├── wK.png
    │   │   │       │       ├── wN.png
    │   │   │       │       ├── wP.png
    │   │   │       │       ├── wQ.png
    │   │   │       │       └── wR.png
    │   │   │   ├── css
    │   │   │       └── chessboard-1.0.0.min.css
    │   │   │   └── js
    │   │   │       └── chessboard-1.0.0
    │   │   │           └── package.json
    │   ├── wchess.cmd
    │   │   └── CMakeLists.txt
    │   ├── CMakeLists.txt
    │   └── libwchess
    │   │   └── CMakeLists.txt
    ├── deprecation-warning
    │   ├── CMakeLists.txt
    │   └── README.md
    ├── python
    │   └── test_whisper_processor.py
    ├── bench
    │   └── CMakeLists.txt
    ├── cli
    │   └── CMakeLists.txt
    ├── sycl
    │   ├── ls-sycl-device.cpp
    │   ├── CMakeLists.txt
    │   ├── run-whisper.sh
    │   └── build.sh
    ├── lsp
    │   └── CMakeLists.txt
    ├── stream
    │   └── CMakeLists.txt
    ├── server
    │   └── CMakeLists.txt
    ├── common-ggml.h
    ├── stream.wasm
    │   └── README.md
    ├── console.h
    ├── bench.wasm
    │   └── README.md
    └── command.wasm
    │   └── README.md
├── tests
    ├── .gitignore
    ├── test-c.c
    └── en-2-ref.txt
├── samples
    ├── .gitignore
    ├── jfk.mp3
    ├── jfk.wav
    └── README.md
├── scripts
    ├── sync-ggml.last
    ├── sha-all.sh
    ├── apple
    │   └── validate-apps.sh
    ├── convert-all.sh
    ├── gen-authors.sh
    ├── sync-llama.sh
    └── build-info.sh
├── ggml
    ├── .gitignore
    ├── src
    │   ├── ggml-cuda
    │   │   ├── argmax.cuh
    │   │   ├── out-prod.cuh
    │   │   ├── argsort.cuh
    │   │   ├── fattn.cuh
    │   │   ├── gla.cuh
    │   │   ├── fattn-tile-f16.cuh
    │   │   ├── fattn-tile-f32.cuh
    │   │   ├── fattn-wmma-f16.cuh
    │   │   ├── acc.cuh
    │   │   ├── pad.cuh
    │   │   ├── clamp.cuh
    │   │   ├── scale.cuh
    │   │   ├── arange.cuh
    │   │   ├── concat.cuh
    │   │   ├── im2col.cuh
    │   │   ├── pool2d.cuh
    │   │   ├── wkv6.cuhold
    │   │   ├── upscale.cuh
    │   │   ├── count-equal.cuh
    │   │   ├── diagmask.cuh
    │   │   ├── opt-step-adamw.cuh
    │   │   ├── tsembd.cuh
    │   │   ├── conv-transpose-1d.cuh
    │   │   ├── template-instances
    │   │   │   ├── mmq-instance-iq1_s.cu
    │   │   │   ├── mmq-instance-iq2_s.cu
    │   │   │   ├── mmq-instance-iq3_s.cu
    │   │   │   ├── mmq-instance-q2_k.cu
    │   │   │   ├── mmq-instance-q3_k.cu
    │   │   │   ├── mmq-instance-q4_0.cu
    │   │   │   ├── mmq-instance-q4_1.cu
    │   │   │   ├── mmq-instance-q4_k.cu
    │   │   │   ├── mmq-instance-q5_0.cu
    │   │   │   ├── mmq-instance-q5_1.cu
    │   │   │   ├── mmq-instance-q5_k.cu
    │   │   │   ├── mmq-instance-q6_k.cu
    │   │   │   ├── mmq-instance-q8_0.cu
    │   │   │   ├── mmq-instance-iq2_xs.cu
    │   │   │   ├── mmq-instance-iq2_xxs.cu
    │   │   │   ├── mmq-instance-iq3_xxs.cu
    │   │   │   ├── mmq-instance-iq4_nl.cu
    │   │   │   ├── mmq-instance-iq4_xs.cu
    │   │   │   ├── fattn-vec-f16-instance-hs64-f16-f16.cu
    │   │   │   ├── fattn-vec-f32-instance-hs64-f16-f16.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-f16-f16.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-f16-q4_0.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-f16-q4_1.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-f16-q5_0.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-f16-q5_1.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-f16-q8_0.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q4_0-f16.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q4_0-q4_0.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q4_0-q4_1.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q4_0-q5_0.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q4_0-q5_1.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q4_0-q8_0.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q4_1-f16.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q4_1-q4_0.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q4_1-q4_1.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q4_1-q5_0.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q4_1-q5_1.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q4_1-q8_0.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q5_0-f16.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q5_0-q4_0.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q5_0-q4_1.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q5_0-q5_0.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q5_0-q5_1.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q5_0-q8_0.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q5_1-f16.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q5_1-q4_0.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q5_1-q4_1.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q5_1-q5_0.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q5_1-q5_1.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q5_1-q8_0.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q8_0-f16.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q8_0-q4_0.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q8_0-q4_1.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q8_0-q5_0.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q8_0-q5_1.cu
    │   │   │   ├── fattn-vec-f16-instance-hs128-q8_0-q8_0.cu
    │   │   │   ├── fattn-vec-f16-instance-hs256-f16-f16.cu
    │   │   │   ├── fattn-vec-f16-instance-hs64-f16-q4_0.cu
    │   │   │   ├── fattn-vec-f16-instance-hs64-f16-q4_1.cu
    │   │   │   ├── fattn-vec-f16-instance-hs64-f16-q5_0.cu
    │   │   │   ├── fattn-vec-f16-instance-hs64-f16-q5_1.cu
    │   │   │   ├── fattn-vec-f16-instance-hs64-f16-q8_0.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-f16-f16.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-f16-q4_0.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-f16-q4_1.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-f16-q5_0.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-f16-q5_1.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-f16-q8_0.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q4_0-f16.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q4_0-q4_0.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q4_0-q4_1.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q4_0-q5_0.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q4_0-q5_1.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q4_0-q8_0.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q4_1-f16.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q4_1-q4_0.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q4_1-q4_1.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q4_1-q5_0.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q4_1-q5_1.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q4_1-q8_0.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q5_0-f16.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q5_0-q4_0.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q5_0-q4_1.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q5_0-q5_0.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q5_0-q5_1.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q5_0-q8_0.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q5_1-f16.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q5_1-q4_0.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q5_1-q4_1.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q5_1-q5_0.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q5_1-q5_1.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q5_1-q8_0.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q8_0-f16.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q8_0-q4_0.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q8_0-q4_1.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q8_0-q5_0.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q8_0-q5_1.cu
    │   │   │   ├── fattn-vec-f32-instance-hs128-q8_0-q8_0.cu
    │   │   │   ├── fattn-vec-f32-instance-hs256-f16-f16.cu
    │   │   │   ├── fattn-vec-f32-instance-hs64-f16-q4_0.cu
    │   │   │   ├── fattn-vec-f32-instance-hs64-f16-q4_1.cu
    │   │   │   ├── fattn-vec-f32-instance-hs64-f16-q5_0.cu
    │   │   │   ├── fattn-vec-f32-instance-hs64-f16-q5_1.cu
    │   │   │   ├── fattn-vec-f32-instance-hs64-f16-q8_0.cu
    │   │   │   ├── fattn-mma-f16-instance-ncols1_1-ncols2_8.cu
    │   │   │   ├── fattn-mma-f16-instance-ncols1_2-ncols2_4.cu
    │   │   │   ├── fattn-mma-f16-instance-ncols1_2-ncols2_8.cu
    │   │   │   ├── fattn-mma-f16-instance-ncols1_4-ncols2_2.cu
    │   │   │   ├── fattn-mma-f16-instance-ncols1_4-ncols2_4.cu
    │   │   │   ├── fattn-mma-f16-instance-ncols1_4-ncols2_8.cu
    │   │   │   ├── fattn-mma-f16-instance-ncols1_8-ncols2_1.cu
    │   │   │   ├── fattn-mma-f16-instance-ncols1_8-ncols2_2.cu
    │   │   │   ├── fattn-mma-f16-instance-ncols1_8-ncols2_4.cu
    │   │   │   ├── fattn-mma-f16-instance-ncols1_8-ncols2_8.cu
    │   │   │   ├── fattn-mma-f16-instance-ncols1_16-ncols2_1.cu
    │   │   │   ├── fattn-mma-f16-instance-ncols1_16-ncols2_2.cu
    │   │   │   ├── fattn-mma-f16-instance-ncols1_16-ncols2_4.cu
    │   │   │   ├── fattn-mma-f16-instance-ncols1_32-ncols2_1.cu
    │   │   │   ├── fattn-mma-f16-instance-ncols1_32-ncols2_2.cu
    │   │   │   └── fattn-mma-f16-instance-ncols1_64-ncols2_1.cu
    │   │   ├── sum.cuh
    │   │   ├── sumrows.cuh
    │   │   ├── rope.cuh
    │   │   ├── wkv.cuh
    │   │   ├── softmax.cuh
    │   │   ├── cross-entropy-loss.cuh
    │   │   ├── getrows.cuh
    │   │   ├── cpy.cuh
    │   │   ├── convert.cuh
    │   │   ├── norm.cuh
    │   │   ├── mmvq.cuh
    │   │   ├── binbcast.cuh
    │   │   ├── vendors
    │   │   │   └── cuda.h
    │   │   └── mmv.cuh
    │   ├── ggml-vulkan
    │   │   ├── vulkan-shaders
    │   │   │   ├── test_coopmat2_support.comp
    │   │   │   ├── test_coopmat_support.comp
    │   │   │   ├── generic_head.comp
    │   │   │   ├── CMakeLists.txt
    │   │   │   ├── dequant_head.comp
    │   │   │   ├── cos.comp
    │   │   │   ├── sin.comp
    │   │   │   ├── square.comp
    │   │   │   ├── clamp.comp
    │   │   │   ├── dequant_f32.comp
    │   │   │   ├── copy.comp
    │   │   │   ├── relu.comp
    │   │   │   ├── sigmoid.comp
    │   │   │   ├── tanh.comp
    │   │   │   ├── silu.comp
    │   │   │   ├── leaky_relu.comp
    │   │   │   ├── scale.comp
    │   │   │   ├── gelu_quick.comp
    │   │   │   ├── gelu.comp
    │   │   │   ├── silu_back.comp
    │   │   │   ├── div.comp
    │   │   │   ├── mul.comp
    │   │   │   ├── repeat.comp
    │   │   │   └── count_equal.comp
    │   │   └── cmake
    │   │   │   └── host-toolchain.cmake.in
    │   ├── ggml-cpu
    │   │   ├── ggml-cpu-hbm.h
    │   │   ├── ggml-cpu-aarch64.h
    │   │   ├── amx
    │   │   │   ├── amx.h
    │   │   │   └── mmq.h
    │   │   ├── llamafile
    │   │   │   └── sgemm.h
    │   │   └── kleidiai
    │   │   │   └── kleidiai.h
    │   ├── ggml-sycl
    │   │   ├── gla.hpp
    │   │   ├── wkv6.hpp
    │   │   ├── outprod.hpp
    │   │   ├── wkv.hpp
    │   │   ├── cpy.hpp
    │   │   ├── sycl_hw.cpp
    │   │   ├── sycl_hw.hpp
    │   │   ├── concat.hpp
    │   │   ├── conv.hpp
    │   │   ├── softmax.hpp
    │   │   ├── tsembd.hpp
    │   │   ├── rope.hpp
    │   │   ├── getrows.hpp
    │   │   ├── im2col.hpp
    │   │   ├── mmvq.hpp
    │   │   ├── dmmv.hpp
    │   │   ├── convert.hpp
    │   │   └── backend.hpp
    │   ├── ggml-rpc
    │   │   └── CMakeLists.txt
    │   ├── ggml-threading.h
    │   ├── ggml-threading.cpp
    │   ├── ggml-amx
    │   │   └── mmq.h
    │   ├── ggml-kompute
    │   │   └── kompute-shaders
    │   │   │   ├── op_scale.comp
    │   │   │   ├── op_relu.comp
    │   │   │   ├── op_scale_8.comp
    │   │   │   ├── op_silu.comp
    │   │   │   ├── op_getrows.comp
    │   │   │   ├── op_gelu.comp
    │   │   │   ├── op_mul_mv_q_n_pre.comp
    │   │   │   ├── op_addrow.comp
    │   │   │   ├── op_diagmask.comp
    │   │   │   ├── op_getrows_f32.comp
    │   │   │   └── op_getrows_f16.comp
    │   ├── ggml-opencl
    │   │   └── kernels
    │   │   │   └── embed_kernel.py
    │   └── ggml-cann
    │   │   └── kernels
    │   │       └── ascendc_kernels.h
    ├── include
    │   ├── ggml-blas.h
    │   ├── ggml-opencl.h
    │   └── ggml-rpc.h
    └── cmake
    │   └── GitVars.cmake
├── README_sycl.md
├── SDL2
    ├── lib
    │   ├── x64
    │   │   ├── SDL2.dll
    │   │   ├── SDL2.lib
    │   │   ├── SDL2main.lib
    │   │   └── SDL2test.lib
    │   └── x86
    │   │   ├── SDL2.dll
    │   │   ├── SDL2.lib
    │   │   ├── SDL2main.lib
    │   │   └── SDL2test.lib
    ├── docs
    │   ├── README-hg.md
    │   ├── README-platforms.md
    │   ├── README-wince.md
    │   ├── README-git.md
    │   └── README-pandora.md
    ├── include
    │   ├── SDL_revision.h
    │   └── SDL_opengles2_gl2platform.h
    ├── README-SDL.txt
    ├── BUGS.txt
    └── README.txt
├── cmake
    ├── whisper.pc.in
    ├── DefaultTargetOptions.cmake
    └── git-vars.cmake
├── grammars
    └── colors.gbnf
├── .github
    └── workflows
    │   └── bindings-go.yml
├── .devops
    ├── main.Dockerfile
    └── cublas.Dockerfile
└── src
    └── coreml
        └── whisper-encoder.h


/.gitmodules:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/models/.gitignore:
--------------------------------------------------------------------------------
1 | *.bin
2 | 


--------------------------------------------------------------------------------
/bindings/go/.gitignore:
--------------------------------------------------------------------------------
1 | build
2 | models
3 | 


--------------------------------------------------------------------------------
/bindings/javascript/.gitignore:
--------------------------------------------------------------------------------
1 | publish.log
2 | 


--------------------------------------------------------------------------------
/examples/whisper.android/app/.gitignore:
--------------------------------------------------------------------------------
1 | /build


--------------------------------------------------------------------------------
/examples/whisper.android/lib/.gitignore:
--------------------------------------------------------------------------------
1 | /build


--------------------------------------------------------------------------------
/examples/talk-llama/llama-quant.h:
--------------------------------------------------------------------------------
1 | #pragma once
2 | 


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/.gitignore:
--------------------------------------------------------------------------------
1 | /build


--------------------------------------------------------------------------------
/examples/whisper.android/.idea/.name:
--------------------------------------------------------------------------------
1 | WhisperCppDemo


--------------------------------------------------------------------------------
/tests/.gitignore:
--------------------------------------------------------------------------------
1 | *.wav
2 | *.ogg
3 | *.wav.txt
4 | 


--------------------------------------------------------------------------------
/samples/.gitignore:
--------------------------------------------------------------------------------
1 | *
2 | !jfk.wav
3 | !jfk.mp3
4 | 
5 | 


--------------------------------------------------------------------------------
/bindings/ruby/.gitignore:
--------------------------------------------------------------------------------
1 | LICENSE
2 | pkg/
3 | lib/whisper.*
4 | 


--------------------------------------------------------------------------------
/examples/talk-llama/.gitignore:
--------------------------------------------------------------------------------
1 | audio.mp3
2 | to_speak.txt
3 | 


--------------------------------------------------------------------------------
/bindings/java/settings.gradle:
--------------------------------------------------------------------------------
1 | rootProject.name = "whispercpp"
2 | 


--------------------------------------------------------------------------------
/examples/addon.node/.gitignore:
--------------------------------------------------------------------------------
1 | .idea
2 | node_modules
3 | build
4 | 


--------------------------------------------------------------------------------
/examples/talk-llama/llama-cparams.cpp:
--------------------------------------------------------------------------------
1 | #include "llama-cparams.h"
2 | 


--------------------------------------------------------------------------------
/examples/talk-llama/llama-memory.cpp:
--------------------------------------------------------------------------------
1 | #include "llama-memory.h"
2 | 


--------------------------------------------------------------------------------
/examples/whisper.swiftui/.gitignore:
--------------------------------------------------------------------------------
1 | xcuserdata
2 | xcshareddata
3 | 


--------------------------------------------------------------------------------
/scripts/sync-ggml.last:
--------------------------------------------------------------------------------
1 | 7b08f4cd9e32781e769a52cf0dcaeb2c556632c3
2 | 


--------------------------------------------------------------------------------
/tests/test-c.c:
--------------------------------------------------------------------------------
1 | #include "whisper.h"
2 | 
3 | int main(void) {}
4 | 


--------------------------------------------------------------------------------
/examples/whisper.swiftui/whisper.swiftui.demo/Resources/models/.gitignore:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/examples/whisper.swiftui/whisper.swiftui.demo/Resources/samples/.gitignore:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/examples/whisper.swiftui/whisper.swiftui.xcodeproj/.gitignore:
--------------------------------------------------------------------------------
1 | xcuserdata/
2 | 


--------------------------------------------------------------------------------
/models/requirements-openvino.txt:
--------------------------------------------------------------------------------
1 | openvino-dev[pytorch,onnx]
2 | openai-whisper


--------------------------------------------------------------------------------
/ggml/.gitignore:
--------------------------------------------------------------------------------
1 | src/ggml-vulkan-shaders.hpp
2 | src/ggml-vulkan-shaders.cpp
3 | 


--------------------------------------------------------------------------------
/README_sycl.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/README_sycl.md


--------------------------------------------------------------------------------
/samples/jfk.mp3:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/samples/jfk.mp3


--------------------------------------------------------------------------------
/samples/jfk.wav:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/samples/jfk.wav


--------------------------------------------------------------------------------
/models/requirements-coreml.txt:
--------------------------------------------------------------------------------
1 | torch
2 | coremltools
3 | openai-whisper
4 | ane_transformers
5 | 


--------------------------------------------------------------------------------
/SDL2/lib/x64/SDL2.dll:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/SDL2/lib/x64/SDL2.dll


--------------------------------------------------------------------------------
/SDL2/lib/x64/SDL2.lib:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/SDL2/lib/x64/SDL2.lib


--------------------------------------------------------------------------------
/SDL2/lib/x86/SDL2.dll:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/SDL2/lib/x86/SDL2.dll


--------------------------------------------------------------------------------
/SDL2/lib/x86/SDL2.lib:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/SDL2/lib/x86/SDL2.lib


--------------------------------------------------------------------------------
/bindings/ruby/tests/jfk_reader/extconf.rb:
--------------------------------------------------------------------------------
1 | require "mkmf"
2 | 
3 | create_makefile("jfk_reader")
4 | 


--------------------------------------------------------------------------------
/examples/whisper.android/.idea/.gitignore:
--------------------------------------------------------------------------------
1 | # Default ignored files
2 | /shelf/
3 | /workspace.xml
4 | 


--------------------------------------------------------------------------------
/SDL2/lib/x64/SDL2main.lib:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/SDL2/lib/x64/SDL2main.lib


--------------------------------------------------------------------------------
/SDL2/lib/x64/SDL2test.lib:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/SDL2/lib/x64/SDL2test.lib


--------------------------------------------------------------------------------
/SDL2/lib/x86/SDL2main.lib:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/SDL2/lib/x86/SDL2main.lib


--------------------------------------------------------------------------------
/SDL2/lib/x86/SDL2test.lib:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/SDL2/lib/x86/SDL2test.lib


--------------------------------------------------------------------------------
/examples/whisper.android.java/settings.gradle:
--------------------------------------------------------------------------------
1 | include ':app'
2 | rootProject.name = "whisper.android.java"


--------------------------------------------------------------------------------
/bindings/go/samples/jfk.wav:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/bindings/go/samples/jfk.wav


--------------------------------------------------------------------------------
/examples/talk-llama/speak.bat:
--------------------------------------------------------------------------------
1 | @powershell -ExecutionPolicy Bypass -F examples\talk-llama\speak.ps1 %1 %2
2 | 


--------------------------------------------------------------------------------
/examples/whisper.swiftui/whisper.swiftui.xcodeproj/project.xcworkspace/.gitignore:
--------------------------------------------------------------------------------
1 | contents.xcworkspacedata
2 | 


--------------------------------------------------------------------------------
/examples/quantize/README.md:
--------------------------------------------------------------------------------
1 | # quantize
2 | 
3 | Tool for integer quantization of Whisper `ggml` model files
4 | 


--------------------------------------------------------------------------------
/models/for-tests-ggml-base.bin:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/models/for-tests-ggml-base.bin


--------------------------------------------------------------------------------
/models/for-tests-ggml-tiny.bin:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/models/for-tests-ggml-tiny.bin


--------------------------------------------------------------------------------
/models/for-tests-ggml-base.en.bin:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/models/for-tests-ggml-base.en.bin


--------------------------------------------------------------------------------
/models/for-tests-ggml-large.bin:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/models/for-tests-ggml-large.bin


--------------------------------------------------------------------------------
/models/for-tests-ggml-medium.bin:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/models/for-tests-ggml-medium.bin


--------------------------------------------------------------------------------
/models/for-tests-ggml-small.bin:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/models/for-tests-ggml-small.bin


--------------------------------------------------------------------------------
/models/for-tests-ggml-tiny.en.bin:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/models/for-tests-ggml-tiny.en.bin


--------------------------------------------------------------------------------
/SDL2/docs/README-hg.md:
--------------------------------------------------------------------------------
1 | We are no longer hosted in Mercurial. Please see README-git.md for details.
2 | 
3 | Thanks!
4 | 
5 | 


--------------------------------------------------------------------------------
/models/for-tests-ggml-medium.en.bin:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/models/for-tests-ggml-medium.en.bin


--------------------------------------------------------------------------------
/models/for-tests-ggml-small.en.bin:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/models/for-tests-ggml-small.en.bin


--------------------------------------------------------------------------------
/bindings/go/pkg/whisper/doc.go:
--------------------------------------------------------------------------------
1 | /*
2 | This is the higher-level speech-to-text whisper.cpp API for Go
3 | */
4 | package whisper
5 | 


--------------------------------------------------------------------------------
/bindings/ruby/tests/jfk_reader/.gitignore:
--------------------------------------------------------------------------------
1 | Makefile
2 | jfk_reader.o
3 | jfk_reader.so
4 | jfk_reader.bundle
5 | jfk_reader.dll
6 | 


--------------------------------------------------------------------------------
/examples/command/commands.txt:
--------------------------------------------------------------------------------
 1 | enable
 2 | disable
 3 | cat
 4 | dog
 5 | apple
 6 | red
 7 | blue
 8 | green
 9 | lightblue
10 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/argmax.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | void ggml_cuda_argmax(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
4 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/out-prod.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | void ggml_cuda_out_prod(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
4 | 


--------------------------------------------------------------------------------
/examples/whisper.android/app/src/main/res/values/strings.xml:
--------------------------------------------------------------------------------
1 | <resources>
2 |     <string name="app_name">WhisperCppDemo</string>
3 | </resources>


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/argsort.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | void ggml_cuda_op_argsort(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
4 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/fattn.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | void ggml_cuda_flash_attn_ext(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
4 | 


--------------------------------------------------------------------------------
/bindings/java/gradle/wrapper/gradle-wrapper.jar:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/bindings/java/gradle/wrapper/gradle-wrapper.jar


--------------------------------------------------------------------------------
/examples/whisper.android.java/README_files/1.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/whisper.android.java/README_files/1.jpg


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/src/main/res/values/strings.xml:
--------------------------------------------------------------------------------
1 | <resources>
2 |   <string name="app_name">whisper.android.java</string>
3 | </resources>


--------------------------------------------------------------------------------
/examples/whisper.objc/whisper.objc/Assets.xcassets/Contents.json:
--------------------------------------------------------------------------------
1 | {
2 |   "info" : {
3 |     "author" : "xcode",
4 |     "version" : 1
5 |   }
6 | }
7 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/gla.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | void ggml_cuda_op_gated_linear_attn(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
4 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/fattn-tile-f16.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | void ggml_cuda_flash_attn_ext_tile_f16(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
4 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/fattn-tile-f32.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | void ggml_cuda_flash_attn_ext_tile_f32(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
4 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | void ggml_cuda_flash_attn_ext_wmma_f16(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
4 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/test_coopmat2_support.comp:
--------------------------------------------------------------------------------
1 | #version 460
2 | 
3 | #extension GL_NV_cooperative_matrix2 : require
4 | 
5 | void main()
6 | {
7 | }
8 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/test_coopmat_support.comp:
--------------------------------------------------------------------------------
1 | #version 460
2 | 
3 | #extension GL_KHR_cooperative_matrix : require
4 | 
5 | void main()
6 | {
7 | }
8 | 


--------------------------------------------------------------------------------
/bindings/java/src/main/java/io/github/ggerganov/whispercpp/ggml/GgmlTensor.java:
--------------------------------------------------------------------------------
1 | package io.github.ggerganov.whispercpp.ggml;
2 | 
3 | public class GgmlTensor {
4 | }
5 | 


--------------------------------------------------------------------------------
/examples/whisper.android/gradle/wrapper/gradle-wrapper.jar:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/whisper.android/gradle/wrapper/gradle-wrapper.jar


--------------------------------------------------------------------------------
/bindings/go/pkg/whisper/util_test.go:
--------------------------------------------------------------------------------
1 | package whisper_test
2 | 
3 | const (
4 | 	ModelPath  = "../../models/ggml-small.en.bin"
5 | 	SamplePath = "../../samples/jfk.wav"
6 | )
7 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/acc.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | #define CUDA_ACC_BLOCK_SIZE 256
4 | 
5 | void ggml_cuda_op_acc(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/pad.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | #define CUDA_PAD_BLOCK_SIZE 256
4 | 
5 | void ggml_cuda_op_pad(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
6 | 


--------------------------------------------------------------------------------
/bindings/go/doc.go:
--------------------------------------------------------------------------------
1 | /*
2 | github.com/ggerganov/whisper.cpp/bindings/go
3 | provides speech-to-text service bindings for the Go programming language.
4 | */
5 | package whisper
6 | 


--------------------------------------------------------------------------------
/bindings/java/src/main/java/io/github/ggerganov/whispercpp/model/WhisperState.java:
--------------------------------------------------------------------------------
1 | package io.github.ggerganov.whispercpp.model;
2 | 
3 | public class WhisperState {
4 | }
5 | 


--------------------------------------------------------------------------------
/examples/whisper.android.java/gradle/wrapper/gradle-wrapper.jar:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/whisper.android.java/gradle/wrapper/gradle-wrapper.jar


--------------------------------------------------------------------------------
/examples/whisper.swiftui/whisper.swiftui.demo/Supporting files/Assets.xcassets/Contents.json:
--------------------------------------------------------------------------------
1 | {
2 |   "info" : {
3 |     "author" : "xcode",
4 |     "version" : 1
5 |   }
6 | }
7 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/clamp.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | #define CUDA_CLAMP_BLOCK_SIZE 256
4 | 
5 | void ggml_cuda_op_clamp(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/scale.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | #define CUDA_SCALE_BLOCK_SIZE 256
4 | 
5 | void ggml_cuda_op_scale(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
6 | 


--------------------------------------------------------------------------------
/scripts/sha-all.sh:
--------------------------------------------------------------------------------
1 | #!/bin/bash
2 | 
3 | # Compute the SHA1 of all model files in ./models/ggml-*.bin
4 | 
5 | for f in ./models/ggml-*.bin; do
6 |     shasum -a 1 "$f"  # option first: parsing stays correct when POSIXLY_CORRECT disables argument permutation
7 | done
8 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/arange.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | #define CUDA_ARANGE_BLOCK_SIZE 256
4 | 
5 | void ggml_cuda_op_arange(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/concat.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | #define CUDA_CONCAT_BLOCK_SIZE 256
4 | 
5 | void ggml_cuda_op_concat(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/im2col.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | #define CUDA_IM2COL_BLOCK_SIZE 256
4 | 
5 | void ggml_cuda_op_im2col(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/pool2d.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | #define CUDA_POOL2D_BLOCK_SIZE 256
4 | 
5 | void ggml_cuda_op_pool2d(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/wkv6.cuhold:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | #define CUDA_WKV_BLOCK_SIZE 64
4 | 
5 | void ggml_cuda_op_rwkv_wkv6(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
6 | 


--------------------------------------------------------------------------------
/examples/whisper.android/lib/src/main/AndroidManifest.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="utf-8"?>
2 | <manifest xmlns:android="http://schemas.android.com/apk/res/android">
3 | 
4 | </manifest>


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/upscale.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | #define CUDA_UPSCALE_BLOCK_SIZE 256
4 | 
5 | void ggml_cuda_op_upscale(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/count-equal.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | #define CUDA_COUNT_EQUAL_CHUNK_SIZE 128
4 | 
5 | void ggml_cuda_count_equal(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
6 | 


--------------------------------------------------------------------------------
/scripts/apple/validate-apps.sh:
--------------------------------------------------------------------------------
1 | #!/bin/bash
2 | ./scripts/apple/validate-ios.sh
3 | ./scripts/apple/validate-macos.sh
4 | ./scripts/apple/validate-visionos.sh
5 | ./scripts/apple/validate-tvos.sh
6 | 


--------------------------------------------------------------------------------
/examples/whisper.swiftui/whisper.swiftui.demo/Supporting files/Preview Content/Preview Assets.xcassets/Contents.json:
--------------------------------------------------------------------------------
1 | {
2 |   "info" : {
3 |     "author" : "xcode",
4 |     "version" : 1
5 |   }
6 | }
7 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/diagmask.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | #define CUDA_DIAG_MASK_INF_BLOCK_SIZE 32
4 | 
5 | void ggml_cuda_op_diag_mask_inf(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
6 | 


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/src/main/res/mipmap-hdpi/ic_launcher.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/whisper.android.java/app/src/main/res/mipmap-hdpi/ic_launcher.png


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/src/main/res/mipmap-mdpi/ic_launcher.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/whisper.android.java/app/src/main/res/mipmap-mdpi/ic_launcher.png


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/src/main/res/mipmap-xhdpi/ic_launcher.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/whisper.android.java/app/src/main/res/mipmap-xhdpi/ic_launcher.png


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/opt-step-adamw.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | #define CUDA_OPT_STEP_ADAMW_BLOCK_SIZE 256
4 | 
5 | void ggml_cuda_opt_step_adamw(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
6 | 


--------------------------------------------------------------------------------
/bindings/ruby/ext/.gitignore:
--------------------------------------------------------------------------------
 1 | Makefile
 2 | whisper.so
 3 | whisper.bundle
 4 | whisper.dll
 5 | scripts/get-flags.mk
 6 | *.o
 7 | /*/**/*.c
 8 | /*/**/*.cpp
 9 | /*/**/*.h
10 | /*/**/*.m
11 | /*/**/*.metal
12 | 


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/src/main/res/mipmap-xxhdpi/ic_launcher.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/whisper.android.java/app/src/main/res/mipmap-xxhdpi/ic_launcher.png


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/src/main/res/mipmap-xxxhdpi/ic_launcher.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/whisper.android.java/app/src/main/res/mipmap-xxxhdpi/ic_launcher.png


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/tsembd.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | #define CUDA_TIMESTEP_EMBEDDING_BLOCK_SIZE 256
4 | 
5 | void ggml_cuda_op_timestep_embedding(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
6 | 


--------------------------------------------------------------------------------
/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/bB.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/bB.png


--------------------------------------------------------------------------------
/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/bK.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/bK.png


--------------------------------------------------------------------------------
/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/bN.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/bN.png


--------------------------------------------------------------------------------
/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/bP.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/bP.png


--------------------------------------------------------------------------------
/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/bQ.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/bQ.png


--------------------------------------------------------------------------------
/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/bR.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/bR.png


--------------------------------------------------------------------------------
/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/wB.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/wB.png


--------------------------------------------------------------------------------
/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/wK.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/wK.png


--------------------------------------------------------------------------------
/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/wN.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/wN.png


--------------------------------------------------------------------------------
/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/wP.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/wP.png


--------------------------------------------------------------------------------
/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/wQ.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/wQ.png


--------------------------------------------------------------------------------
/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/wR.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/wchess/wchess.wasm/chessboardjs-1.0.0/img/chesspieces/wikipedia/wR.png


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/src/main/res/mipmap-hdpi/ic_launcher_round.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/whisper.android.java/app/src/main/res/mipmap-hdpi/ic_launcher_round.png


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/src/main/res/mipmap-mdpi/ic_launcher_round.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/whisper.android.java/app/src/main/res/mipmap-mdpi/ic_launcher_round.png


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/conv-transpose-1d.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | #define CUDA_CONV_TRANPOSE_1D_BLOCK_SIZE 256
4 | 
5 | void ggml_cuda_op_conv_transpose_1d(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../mmq.cuh"
4 | 
5 | DECL_MMQ_CASE(GGML_TYPE_IQ1_S);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../mmq.cuh"
4 | 
5 | DECL_MMQ_CASE(GGML_TYPE_IQ2_S);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../mmq.cuh"
4 | 
5 | DECL_MMQ_CASE(GGML_TYPE_IQ3_S);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../mmq.cuh"
4 | 
5 | DECL_MMQ_CASE(GGML_TYPE_Q2_K);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../mmq.cuh"
4 | 
5 | DECL_MMQ_CASE(GGML_TYPE_Q3_K);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../mmq.cuh"
4 | 
5 | DECL_MMQ_CASE(GGML_TYPE_Q4_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../mmq.cuh"
4 | 
5 | DECL_MMQ_CASE(GGML_TYPE_Q4_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../mmq.cuh"
4 | 
5 | DECL_MMQ_CASE(GGML_TYPE_Q4_K);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../mmq.cuh"
4 | 
5 | DECL_MMQ_CASE(GGML_TYPE_Q5_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../mmq.cuh"
4 | 
5 | DECL_MMQ_CASE(GGML_TYPE_Q5_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../mmq.cuh"
4 | 
5 | DECL_MMQ_CASE(GGML_TYPE_Q5_K);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../mmq.cuh"
4 | 
5 | DECL_MMQ_CASE(GGML_TYPE_Q6_K);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../mmq.cuh"
4 | 
5 | DECL_MMQ_CASE(GGML_TYPE_Q8_0);
6 | 


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/src/main/res/mipmap-xhdpi/ic_launcher_round.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/whisper.android.java/app/src/main/res/mipmap-xhdpi/ic_launcher_round.png


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/src/main/res/mipmap-xxhdpi/ic_launcher_round.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/whisper.android.java/app/src/main/res/mipmap-xxhdpi/ic_launcher_round.png


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/src/main/res/mipmap-xxxhdpi/ic_launcher_round.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Mozer/talk-llama-fast/HEAD/examples/whisper.android.java/app/src/main/res/mipmap-xxxhdpi/ic_launcher_round.png


--------------------------------------------------------------------------------
/ggml/src/ggml-cpu/ggml-cpu-hbm.h:
--------------------------------------------------------------------------------
1 | #pragma once
2 | 
3 | #include "ggml-backend.h"
4 | #include "ggml.h"
5 | 
6 | // GGML CPU internal header
7 | 
8 | ggml_backend_buffer_type_t ggml_backend_cpu_hbm_buffer_type(void);
9 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../mmq.cuh"
4 | 
5 | DECL_MMQ_CASE(GGML_TYPE_IQ2_XS);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../mmq.cuh"
4 | 
5 | DECL_MMQ_CASE(GGML_TYPE_IQ2_XXS);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../mmq.cuh"
4 | 
5 | DECL_MMQ_CASE(GGML_TYPE_IQ3_XXS);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../mmq.cuh"
4 | 
5 | DECL_MMQ_CASE(GGML_TYPE_IQ4_NL);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../mmq.cuh"
4 | 
5 | DECL_MMQ_CASE(GGML_TYPE_IQ4_XS);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cpu/ggml-cpu-aarch64.h:
--------------------------------------------------------------------------------
1 | #pragma once
2 | 
3 | #include "ggml-cpu-traits.h"
4 | #include "ggml.h"
5 | 
6 | // GGML internal header
7 | 
8 | ggml_backend_buffer_type_t ggml_backend_cpu_aarch64_buffer_type(void);
9 | 


--------------------------------------------------------------------------------
/examples/quantize/CMakeLists.txt:
--------------------------------------------------------------------------------
1 | set(TARGET quantize)
2 | add_executable(${TARGET} quantize.cpp)
3 | 
4 | include(DefaultTargetOptions)
5 | 
6 | target_link_libraries(${TARGET} PRIVATE common whisper ${CMAKE_THREAD_LIBS_INIT})
7 | 


--------------------------------------------------------------------------------
/examples/whisper.android/.idea/compiler.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="UTF-8"?>
2 | <project version="4">
3 |   <component name="CompilerConfiguration">
4 |     <bytecodeTargetLevel target="17" />
5 |   </component>
6 | </project>


--------------------------------------------------------------------------------
/examples/whisper.android/app/src/main/res/values/themes.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="utf-8"?>
2 | <resources>
3 | 
4 |     <style name="Theme.WhisperCppDemo" parent="android:Theme.Material.Light.NoActionBar" />
5 | </resources>


--------------------------------------------------------------------------------
/SDL2/docs/README-platforms.md:
--------------------------------------------------------------------------------
1 | Platforms
2 | =========
3 | 
4 | We now maintain the list of supported platforms, along with instructions on
5 | how to build and install SDL for those platforms, on our wiki:
6 | 
7 |     https://wiki.libsdl.org/Installation
8 | 
9 | 


--------------------------------------------------------------------------------
/bindings/ruby/ext/metal.mk:
--------------------------------------------------------------------------------
1 | ggml/src/ggml-metal/ggml-metal.o: \
2 | 	ggml/src/ggml-metal/ggml-metal.m \
3 | 	ggml/src/ggml-metal/ggml-metal-impl.h \
4 | 	ggml/include/ggml-metal.h \
5 | 	ggml/include/ggml.h
6 | 	$(CC) $(CFLAGS) -c $< -o $@
7 | 


--------------------------------------------------------------------------------
/examples/whisper.android/.idea/vcs.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="UTF-8"?>
2 | <project version="4">
3 |   <component name="VcsDirectoryMappings">
4 |     <mapping directory="$PROJECT_DIR$/../.." vcs="Git" />
5 |   </component>
6 | </project>


--------------------------------------------------------------------------------
/examples/deprecation-warning/CMakeLists.txt:
--------------------------------------------------------------------------------
1 | add_executable(main ./deprecation-warning.cpp)
2 | add_executable(bench ./deprecation-warning.cpp)
3 | add_executable(stream ./deprecation-warning.cpp)
4 | add_executable(command ./deprecation-warning.cpp)
5 | 


--------------------------------------------------------------------------------
/examples/whisper.objc/whisper.objc.xcodeproj/project.xcworkspace/contents.xcworkspacedata:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="UTF-8"?>
2 | <Workspace
3 |    version = "1.0">
4 |    <FileRef
5 |       location = "self:">
6 |    </FileRef>
7 | </Workspace>
8 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-sycl/gla.hpp:
--------------------------------------------------------------------------------
1 | #ifndef GGML_SYCL_GLA_HPP
2 | #define GGML_SYCL_GLA_HPP
3 | 
4 | #include "common.hpp"
5 | 
6 | void ggml_sycl_op_gated_linear_attn(ggml_backend_sycl_context & ctx, ggml_tensor * dst);
7 | 
8 | #endif  // GGML_SYCL_GLA_HPP
9 | 


--------------------------------------------------------------------------------
/examples/python/test_whisper_processor.py:
--------------------------------------------------------------------------------
1 | import whisper_processor
2 | 
3 | try:  # manual smoke check: call process_audio once and print whatever it returns
4 |     result = whisper_processor.process_audio("./audio/wake_word_detected16k.wav", "base.en")  # path is relative to the current working directory
5 |     print(result)
6 | except Exception as e:  # any failure is printed instead of propagating, so the script itself does not raise
7 |     print(f"Error: {e}")


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/sum.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | void sum_f32_cuda(ggml_cuda_pool & pool, const float * x, float * dst, const int64_t ne, cudaStream_t stream);
4 | 
5 | void ggml_cuda_op_sum(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cpu/amx/amx.h:
--------------------------------------------------------------------------------
1 | #include "ggml-backend.h"
2 | #include "ggml-cpu-impl.h"
3 | 
4 | // GGML internal header
5 | 
6 | #if defined(__AMX_INT8__) && defined(__AVX512VNNI__)
7 | ggml_backend_buffer_type_t ggml_backend_amx_buffer_type(void);
8 | #endif
9 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/sumrows.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | void sum_rows_f32_cuda(const float * x, float * dst, const int ncols, const int nrows, cudaStream_t stream);
4 | 
5 | void ggml_cuda_op_sum_rows(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-sycl/wkv6.hpp:
--------------------------------------------------------------------------------
 1 | #ifndef GGML_SYCL_WKV6_HPP
 2 | #define GGML_SYCL_WKV6_HPP
 3 | 
 4 | #include "common.hpp"
 5 | 
 6 | void ggml_sycl_op_rwkv_wkv6(ggml_backend_sycl_context & ctx, ggml_tensor * dst);
 7 | 
 8 | 
 9 | #endif // GGML_SYCL_WKV6_HPP
10 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/generic_head.comp:
--------------------------------------------------------------------------------
 1 | #extension GL_EXT_shader_16bit_storage : require
 2 | 
 3 | layout (push_constant) uniform parameter  // push-constant block; members are accessed through the instance name `p`
 4 | {
 5 |     uint KX;  // NOTE(review): meaning not visible in this header - presumably a size/count; confirm in the shaders that read p.KX
 6 |     uint KY;  // NOTE(review): as for KX - confirm against the shaders that read p.KY
 7 |     float param1;  // generic float parameter; interpretation is left to the shader using this block (TODO confirm)
 8 |     float param2;  // second generic float parameter (TODO confirm per shader)
 9 | } p;
10 | 


--------------------------------------------------------------------------------
/examples/bench/CMakeLists.txt:
--------------------------------------------------------------------------------
1 | set(TARGET whisper-bench)
2 | add_executable(${TARGET} bench.cpp)
3 | 
4 | include(DefaultTargetOptions)
5 | 
6 | target_link_libraries(${TARGET} PRIVATE whisper ${CMAKE_THREAD_LIBS_INIT})
7 | 
8 | install(TARGETS ${TARGET} RUNTIME)
9 | 


--------------------------------------------------------------------------------
/examples/whisper.objc/whisper.objc/Assets.xcassets/AccentColor.colorset/Contents.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "colors" : [
 3 |     {
 4 |       "idiom" : "universal"
 5 |     }
 6 |   ],
 7 |   "info" : {
 8 |     "author" : "xcode",
 9 |     "version" : 1
10 |   }
11 | }
12 | 


--------------------------------------------------------------------------------
/examples/whisper.swiftui/whisper.swiftui.demo/WhisperCppDemoApp.swift:
--------------------------------------------------------------------------------
 1 | import SwiftUI
 2 | 
 3 | @main  // designates this type as the program's entry point
 4 | struct WhisperCppDemoApp: App {  // application type conforming to SwiftUI's App protocol
 5 |     var body: some Scene {  // the app's scene content
 6 |         WindowGroup {  // one window group whose root view is ContentView
 7 |             ContentView()
 8 |         }
 9 |     }
10 | }
11 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/rope.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | #define CUDA_ROPE_BLOCK_SIZE 256
4 | 
5 | void ggml_cuda_op_rope(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
6 | 
7 | void ggml_cuda_op_rope_back(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
8 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(64, GGML_TYPE_F16, GGML_TYPE_F16);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(64, GGML_TYPE_F16, GGML_TYPE_F16);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/wkv.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | #define CUDA_WKV_BLOCK_SIZE 64
4 | 
5 | void ggml_cuda_op_rwkv_wkv6(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
6 | 
7 | void ggml_cuda_op_rwkv_wkv7(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
8 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_F16, GGML_TYPE_F16);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q4_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_F16, GGML_TYPE_Q4_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q4_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_F16, GGML_TYPE_Q4_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q5_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_F16, GGML_TYPE_Q5_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q5_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_F16, GGML_TYPE_Q5_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q8_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_F16, GGML_TYPE_Q8_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-f16.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_F16);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q4_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q5_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q5_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q5_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q5_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q8_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q8_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-f16.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_F16);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q4_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_Q4_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q4_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_Q4_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q5_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_Q5_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q5_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_Q5_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q8_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_Q8_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-f16.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_F16);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q4_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_Q4_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q4_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_Q4_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q5_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_Q5_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q5_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_Q5_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q8_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_Q8_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-f16.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_F16);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q4_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_Q4_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q4_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_Q4_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q5_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_Q5_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q5_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_Q5_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q8_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_Q8_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-f16.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_F16);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q4_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q4_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q4_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q4_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q5_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q5_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q5_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q5_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(256, GGML_TYPE_F16, GGML_TYPE_F16);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q4_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(64, GGML_TYPE_F16, GGML_TYPE_Q4_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q4_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(64, GGML_TYPE_F16, GGML_TYPE_Q4_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q5_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(64, GGML_TYPE_F16, GGML_TYPE_Q5_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q5_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(64, GGML_TYPE_F16, GGML_TYPE_Q5_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q8_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f16.cuh"
4 | 
5 | DECL_FATTN_VEC_F16_CASE(64, GGML_TYPE_F16, GGML_TYPE_Q8_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_F16, GGML_TYPE_F16);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q4_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_F16, GGML_TYPE_Q4_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q4_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_F16, GGML_TYPE_Q4_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q5_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_F16, GGML_TYPE_Q5_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q5_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_F16, GGML_TYPE_Q5_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q8_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_F16, GGML_TYPE_Q8_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-f16.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_F16);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q4_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q5_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q5_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q5_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q5_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q8_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_0, GGML_TYPE_Q8_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-f16.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_F16);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q4_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_Q4_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q4_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_Q4_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q5_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_Q5_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q5_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_Q5_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q8_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q4_1, GGML_TYPE_Q8_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-f16.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_F16);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q4_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_Q4_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q4_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_Q4_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q5_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_Q5_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q5_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_Q5_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q8_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_0, GGML_TYPE_Q8_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-f16.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_F16);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q4_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_Q4_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q4_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_Q4_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q5_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_Q5_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q5_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_Q5_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q8_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q5_1, GGML_TYPE_Q8_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-f16.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_F16);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q4_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q4_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q4_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q4_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q5_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q5_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q5_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q5_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(128, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(256, GGML_TYPE_F16, GGML_TYPE_F16);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q4_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(64, GGML_TYPE_F16, GGML_TYPE_Q4_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q4_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(64, GGML_TYPE_F16, GGML_TYPE_Q4_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q5_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(64, GGML_TYPE_F16, GGML_TYPE_Q5_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q5_1.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(64, GGML_TYPE_F16, GGML_TYPE_Q5_1);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q8_0.cu:
--------------------------------------------------------------------------------
1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
2 | 
3 | #include "../fattn-vec-f32.cuh"
4 | 
5 | DECL_FATTN_VEC_F32_CASE(64, GGML_TYPE_F16, GGML_TYPE_Q8_0);
6 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-sycl/outprod.hpp:
--------------------------------------------------------------------------------
 1 | #ifndef GGML_SYCL_OUTPROD_HPP
 2 | #define GGML_SYCL_OUTPROD_HPP
 3 | 
 4 | #include "common.hpp"
 5 | 
 6 | void ggml_sycl_op_out_prod(ggml_backend_sycl_context& ctx, ggml_tensor* dst);
 7 | 
 8 | 
 9 | #endif // GGML_SYCL_OUTPROD_HPP
10 | 
11 | 


--------------------------------------------------------------------------------
/SDL2/docs/README-wince.md:
--------------------------------------------------------------------------------
 1 | WinCE
 2 | =====
 3 | 
 4 | Windows CE is no longer supported by SDL.
 5 | 
 6 | We have left the CE support in SDL 1.2 for those that must have it, and we
 7 | have support for Windows Phone 8 and WinRT in SDL2, as of SDL 2.0.3.
 8 | 
 9 | --ryan.
10 | 
11 | 


--------------------------------------------------------------------------------
/examples/cli/CMakeLists.txt:
--------------------------------------------------------------------------------
1 | set(TARGET whisper-cli)
2 | add_executable(${TARGET} cli.cpp)
3 | 
4 | include(DefaultTargetOptions)
5 | 
6 | target_link_libraries(${TARGET} PRIVATE common whisper ${FFMPEG_LIBRARIES} ${CMAKE_THREAD_LIBS_INIT})
7 | 
8 | install(TARGETS ${TARGET} RUNTIME)
9 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/softmax.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | #define CUDA_SOFT_MAX_BLOCK_SIZE 1024
4 | 
5 | void ggml_cuda_op_soft_max(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
6 | 
7 | void ggml_cuda_op_soft_max_back(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
8 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-rpc/CMakeLists.txt:
--------------------------------------------------------------------------------
 1 | message(STATUS "Using RPC backend")
 2 | 
 3 | ggml_add_backend_library(ggml-rpc
 4 |                          ggml-rpc.cpp
 5 |                         )
 6 | 
 7 | if (WIN32)
 8 |     target_link_libraries(ggml-rpc PRIVATE ws2_32)
 9 | endif()
10 | 


--------------------------------------------------------------------------------
/examples/whisper.swiftui/whisper.swiftui.demo/Supporting files/Assets.xcassets/AccentColor.colorset/Contents.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "colors" : [
 3 |     {
 4 |       "idiom" : "universal"
 5 |     }
 6 |   ],
 7 |   "info" : {
 8 |     "author" : "xcode",
 9 |     "version" : 1
10 |   }
11 | }
12 | 


--------------------------------------------------------------------------------
/SDL2/include/SDL_revision.h:
--------------------------------------------------------------------------------
1 | /* Generated by updaterev.sh, do not edit */
2 | #ifdef SDL_VENDOR_INFO
3 | #define SDL_REVISION "SDL-release-2.28.5-0-g15ead9a40 (" SDL_VENDOR_INFO ")"
4 | #else
5 | #define SDL_REVISION "SDL-release-2.28.5-0-g15ead9a40"
6 | #endif
7 | #define SDL_REVISION_NUMBER 0
8 | 


--------------------------------------------------------------------------------
/examples/wchess/wchess.cmd/CMakeLists.txt:
--------------------------------------------------------------------------------
1 | if (WHISPER_SDL2)
2 |     set(TARGET wchess)
3 |     add_executable(${TARGET} wchess.cmd.cpp)
4 | 
5 |     include(DefaultTargetOptions)
6 | 
7 |     target_link_libraries(${TARGET} PRIVATE wchess-core common-sdl ${CMAKE_THREAD_LIBS_INIT})
8 | endif ()
9 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-threading.h:
--------------------------------------------------------------------------------
 1 | #pragma once
 2 | 
 3 | #include "ggml.h"
 4 | 
 5 | #ifdef __cplusplus
 6 | extern "C" {
 7 | #endif
 8 | 
 9 | GGML_API void ggml_critical_section_start(void);
10 | GGML_API void ggml_critical_section_end(void);
11 | 
12 | #ifdef __cplusplus
13 | }
14 | #endif
15 | 


--------------------------------------------------------------------------------
/bindings/java/gradle/wrapper/gradle-wrapper.properties:
--------------------------------------------------------------------------------
1 | distributionBase=GRADLE_USER_HOME
2 | distributionPath=wrapper/dists
3 | distributionUrl=https\://services.gradle.org/distributions/gradle-8.1-bin.zip
4 | networkTimeout=10000
5 | zipStoreBase=GRADLE_USER_HOME
6 | zipStorePath=wrapper/dists
7 | 


--------------------------------------------------------------------------------
/bindings/java/src/main/java/io/github/ggerganov/whispercpp/params/WhisperFilters.java:
--------------------------------------------------------------------------------
 1 | package io.github.ggerganov.whispercpp.params;
 2 | 
 3 | import java.util.List;
 4 | 
 5 | public class WhisperFilters {
 6 |     int n_mel;
 7 |     int n_fft;
 8 | 
 9 |     List<Float> data;
10 | }
11 | 


--------------------------------------------------------------------------------
/examples/sycl/ls-sycl-device.cpp:
--------------------------------------------------------------------------------
 1 | /*MIT license
 2 |   Copyright (C) 2024 Intel Corporation
 3 |   SPDX-License-Identifier: MIT
 4 | */
 5 | 
 6 | #include "ggml-sycl.h"
 7 | // Calls ggml_backend_sycl_print_sycl_devices() (declared in ggml-sycl.h) and exits with status 0.
 8 | int main(int /*argc*/, char ** /*argv*/) {  // arguments are intentionally ignored
 9 |     ggml_backend_sycl_print_sycl_devices();
10 |     return 0;
11 | }


--------------------------------------------------------------------------------
/examples/whisper.objc/whisper.objc/AppDelegate.h:
--------------------------------------------------------------------------------
 1 | //
 2 | //  AppDelegate.h
 3 | //  whisper.objc
 4 | //
 5 | //  Created by Georgi Gerganov on 23.10.22.
 6 | //
 7 | 
 8 | #import <UIKit/UIKit.h>
 9 | 
10 | @interface AppDelegate : UIResponder <UIApplicationDelegate>
11 | 
12 | 
13 | @end
14 | 
15 | 


--------------------------------------------------------------------------------
/bindings/java/src/main/java/io/github/ggerganov/whispercpp/model/EModel.java:
--------------------------------------------------------------------------------
 1 | package io.github.ggerganov.whispercpp.model;
 2 | 
 3 | public enum EModel {
 4 |     MODEL_UNKNOWN,
 5 |     MODEL_TINY,
 6 |     MODEL_BASE,
 7 |     MODEL_SMALL,
 8 |     MODEL_MEDIUM,
 9 |     MODEL_LARGE,
10 | }
11 | 


--------------------------------------------------------------------------------
/examples/lsp/CMakeLists.txt:
--------------------------------------------------------------------------------
 1 | if (WHISPER_SDL2)
 2 |     # stream
 3 |     set(TARGET lsp)
 4 |     add_executable(${TARGET} lsp.cpp)
 5 | 
 6 |     include(DefaultTargetOptions)
 7 | 
 8 |     target_link_libraries(${TARGET} PRIVATE common json_cpp common-sdl whisper ${CMAKE_THREAD_LIBS_INIT})
 9 | endif ()
10 | 


--------------------------------------------------------------------------------
/examples/whisper.android/gradle/wrapper/gradle-wrapper.properties:
--------------------------------------------------------------------------------
1 | #Wed Dec 14 10:37:24 EST 2022
2 | distributionBase=GRADLE_USER_HOME
3 | distributionUrl=https\://services.gradle.org/distributions/gradle-8.2-bin.zip
4 | distributionPath=wrapper/dists
5 | zipStorePath=wrapper/dists
6 | zipStoreBase=GRADLE_USER_HOME
7 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/cross-entropy-loss.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | #define CUDA_CROSS_ENTROPY_LOSS_BLOCK_SIZE 256
4 | 
5 | void ggml_cuda_cross_entropy_loss(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
6 | 
7 | void ggml_cuda_cross_entropy_loss_back(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
8 | 


--------------------------------------------------------------------------------
/examples/whisper.android.java/gradle/wrapper/gradle-wrapper.properties:
--------------------------------------------------------------------------------
1 | #Fri Oct 20 11:07:15 HST 2023
2 | distributionBase=GRADLE_USER_HOME
3 | distributionPath=wrapper/dists
4 | zipStoreBase=GRADLE_USER_HOME
5 | zipStorePath=wrapper/dists
6 | distributionUrl=https\://services.gradle.org/distributions/gradle-6.5-all.zip
7 | 


--------------------------------------------------------------------------------
/examples/whisper.objc/whisper.objc/Assets.xcassets/AppIcon.appiconset/Contents.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "images" : [
 3 |     {
 4 |       "idiom" : "universal",
 5 |       "platform" : "ios",
 6 |       "size" : "1024x1024"
 7 |     }
 8 |   ],
 9 |   "info" : {
10 |     "author" : "xcode",
11 |     "version" : 1
12 |   }
13 | }
14 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/getrows.cuh:
--------------------------------------------------------------------------------
1 | #include "common.cuh"
2 | 
3 | #define CUDA_GET_ROWS_BLOCK_SIZE 256
4 | #define CUDA_GET_ROWS_BACK_BLOCK_SIZE 256
5 | 
6 | void ggml_cuda_op_get_rows(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
7 | 
8 | void ggml_cuda_op_get_rows_back(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
9 | 


--------------------------------------------------------------------------------
/bindings/ruby/ext/cpu.mk:
--------------------------------------------------------------------------------
 1 | ggml/src/ggml-cpu/ggml-cpu-cpp.o: \
 2 | 	ggml/src/ggml-cpu/ggml-cpu.cpp \
 3 | 	ggml/include/ggml-backend.h \
 4 | 	ggml/include/ggml.h \
 5 | 	ggml/include/ggml-alloc.h \
 6 | 	ggml/src/ggml-backend-impl.h \
 7 | 	ggml/include/ggml-cpu.h \
 8 | 	ggml/src/ggml-impl.h
 9 | 	$(CXX) $(CXXFLAGS)   -c $< -o $@
10 | 


--------------------------------------------------------------------------------
/examples/whisper.android/.gitignore:
--------------------------------------------------------------------------------
 1 | *.iml
 2 | .gradle
 3 | /local.properties
 4 | /.idea/caches
 5 | /.idea/libraries
 6 | /.idea/modules.xml
 7 | /.idea/workspace.xml
 8 | /.idea/navEditor.xml
 9 | /.idea/assetWizardSettings.xml
10 | .DS_Store
11 | /build
12 | /captures
13 | .externalNativeBuild
14 | .cxx
15 | local.properties
16 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-threading.cpp:
--------------------------------------------------------------------------------
 1 | #include "ggml-threading.h"
 2 | #include <mutex>
 3 | // Single namespace-scope mutex shared by ggml_critical_section_start()/ggml_critical_section_end().
 4 | std::mutex ggml_critical_section_mutex;
 5 | // Enters the critical section: blocks until ggml_critical_section_mutex is acquired (std::mutex is not recursive).
 6 | void ggml_critical_section_start() {
 7 |     ggml_critical_section_mutex.lock();
 8 | }
 9 | // Leaves the critical section: releases the mutex taken by a matching ggml_critical_section_start() call.
10 | void ggml_critical_section_end(void) {
11 |     ggml_critical_section_mutex.unlock();
12 | }
13 | 


--------------------------------------------------------------------------------
/examples/whisper.android.java/.gitignore:
--------------------------------------------------------------------------------
 1 | *.iml
 2 | .gradle
 3 | /local.properties
 4 | /.idea/caches
 5 | /.idea/libraries
 6 | /.idea/modules.xml
 7 | /.idea/workspace.xml
 8 | /.idea/navEditor.xml
 9 | /.idea/assetWizardSettings.xml
10 | .DS_Store
11 | /build
12 | /captures
13 | .externalNativeBuild
14 | .cxx
15 | local.properties
16 | 


--------------------------------------------------------------------------------
/bindings/ruby/extsources.rb:
--------------------------------------------------------------------------------
1 | require "yaml"
2 | # Builds EXTSOURCES from the push path patterns of the bindings-ruby workflow, restricted to git-tracked files.
3 | sources = `git ls-files -z ../..`.split("\x0") # NUL-separated `git ls-files` output for ../.., split into an array
4 | paths = YAML.load_file("../../.github/workflows/bindings-ruby.yml")[true]["push"]["paths"] # top-level key is `true`; presumably the loader reads the workflow's bare `on:` key as a boolean -- confirm
5 | paths.delete "bindings/ruby/**" # drop this one glob pattern from the list before expanding
6 | EXTSOURCES = (Dir.glob(paths, base: "../..").collect {|path| "../../#{path}"} << "../../LICENSE") & sources # expand globs relative to ../.., re-prefix with ../.., append LICENSE, keep only entries also present in `sources`
7 | 


--------------------------------------------------------------------------------
/cmake/whisper.pc.in:
--------------------------------------------------------------------------------
 1 | prefix=@CMAKE_INSTALL_PREFIX@
 2 | exec_prefix=${prefix}
 3 | libdir=${exec_prefix}/lib
 4 | includedir=${prefix}/include
 5 | # Libs lists whisper before the ggml libraries it is built on: static archives resolve left to right.
 6 | Name: whisper
 7 | Description: Port of OpenAI's Whisper model in C/C++
 8 | Version: @PROJECT_VERSION@
 9 | Libs: -L${libdir} -lwhisper -lggml -lggml-base
10 | Cflags: -I${includedir}
11 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-sycl/wkv.hpp:
--------------------------------------------------------------------------------
 1 | #ifndef GGML_SYCL_WKV_HPP
 2 | #define GGML_SYCL_WKV_HPP
 3 | 
 4 | #include "common.hpp"
 5 | 
 6 | void ggml_sycl_op_rwkv_wkv6(ggml_backend_sycl_context & ctx, ggml_tensor * dst);
 7 | 
 8 | void ggml_sycl_op_rwkv_wkv7(ggml_backend_sycl_context & ctx, ggml_tensor * dst);
 9 | 
10 | #endif // GGML_SYCL_WKV_HPP
11 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/CMakeLists.txt:
--------------------------------------------------------------------------------
1 | find_package (Threads REQUIRED)
2 | 
3 | set(TARGET vulkan-shaders-gen)
4 | add_executable(${TARGET} vulkan-shaders-gen.cpp)
5 | install(TARGETS ${TARGET} RUNTIME)
6 | target_compile_features(${TARGET} PRIVATE cxx_std_17)
7 | target_link_libraries(vulkan-shaders-gen PUBLIC Threads::Threads)
8 | 


--------------------------------------------------------------------------------
/bindings/java/gradle.properties:
--------------------------------------------------------------------------------
1 | org.gradle.jvmargs=-Xms256m -Xmx1024m
2 | system.include.dir=/usr/include
3 | #system.local.include.dir=../../include
4 | system.local.include.dir=./build/generated/sources/headers/java/main
5 | jni.include.dir=/usr/lib/jvm/java-8-openjdk-amd64/include/
6 | jni.lib.dir=/usr/lib/jvm/java-8-openjdk-amd64/lib/
7 | 


--------------------------------------------------------------------------------
/examples/stream/CMakeLists.txt:
--------------------------------------------------------------------------------
 1 | if (WHISPER_SDL2)
 2 |     set(TARGET whisper-stream)
 3 |     add_executable(${TARGET} stream.cpp)
 4 | 
 5 |     include(DefaultTargetOptions)
 6 | 
 7 |     target_link_libraries(${TARGET} PRIVATE common common-sdl whisper ${CMAKE_THREAD_LIBS_INIT})
 8 | 
 9 |     install(TARGETS ${TARGET} RUNTIME)
10 | endif ()
11 | 


--------------------------------------------------------------------------------
/examples/whisper.android/build.gradle:
--------------------------------------------------------------------------------
1 | // Top-level build file where you can add configuration options common to all sub-projects/modules.
2 | plugins {
3 |     id 'com.android.application' version '8.1.1' apply false
4 |     id 'com.android.library' version '8.1.1' apply false
5 |     id 'org.jetbrains.kotlin.android' version '1.9.0' apply false
6 | }


--------------------------------------------------------------------------------
/examples/command/CMakeLists.txt:
--------------------------------------------------------------------------------
 1 | if (WHISPER_SDL2)
 2 |     set(TARGET whisper-command)
 3 |     add_executable(${TARGET} command.cpp)
 4 | 
 5 |     include(DefaultTargetOptions)
 6 | 
 7 |     target_link_libraries(${TARGET} PRIVATE common common-sdl whisper ${CMAKE_THREAD_LIBS_INIT})
 8 | 
 9 |     install(TARGETS ${TARGET} RUNTIME)
10 | endif ()
11 | 


--------------------------------------------------------------------------------
/examples/whisper.android/app/src/main/res/mipmap-anydpi/ic_launcher.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="utf-8"?>
2 | <adaptive-icon xmlns:android="http://schemas.android.com/apk/res/android">
3 |     <background android:drawable="@drawable/ic_launcher_background" />
4 |     <foreground android:drawable="@drawable/ic_launcher_foreground" />
5 | </adaptive-icon>


--------------------------------------------------------------------------------
/examples/whisper.objc/whisper.objc/SceneDelegate.h:
--------------------------------------------------------------------------------
 1 | //
 2 | //  SceneDelegate.h
 3 | //  whisper.objc
 4 | //
 5 | //  Created by Georgi Gerganov on 23.10.22.
 6 | //
 7 | 
 8 | #import <UIKit/UIKit.h>
 9 | 
10 | @interface SceneDelegate : UIResponder <UIWindowSceneDelegate>
11 | 
12 | @property (strong, nonatomic) UIWindow * window;
13 | 
14 | @end
15 | 
16 | 


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/src/main/res/mipmap-anydpi-v26/ic_launcher.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="utf-8"?>
2 | <adaptive-icon xmlns:android="http://schemas.android.com/apk/res/android">
3 |   <background android:drawable="@drawable/ic_launcher_background" />
4 |   <foreground android:drawable="@drawable/ic_launcher_foreground" />
5 | </adaptive-icon>


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/dequant_head.comp:
--------------------------------------------------------------------------------
 1 | #extension GL_EXT_control_flow_attributes : require
 2 | #extension GL_EXT_shader_16bit_storage : require
 3 | 
 4 | layout (push_constant) uniform parameter
 5 | {
 6 |     uint M;
 7 |     uint K;
 8 |     uint stride_a;
 9 |     uint stride_b;
10 |     uint nel;
11 | } p;
12 | 
13 | #include "types.comp"
14 | 


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/src/main/res/mipmap-anydpi-v26/ic_launcher_round.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="utf-8"?>
2 | <adaptive-icon xmlns:android="http://schemas.android.com/apk/res/android">
3 |   <background android:drawable="@drawable/ic_launcher_background" />
4 |   <foreground android:drawable="@drawable/ic_launcher_foreground" />
5 | </adaptive-icon>


--------------------------------------------------------------------------------
/examples/whisper.objc/whisper.objc.xcodeproj/project.xcworkspace/xcshareddata/IDEWorkspaceChecks.plist:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="UTF-8"?>
2 | <!DOCTYPE plist PUBLIC "-//Apple//DTD PLIST 1.0//EN" "http://www.apple.com/DTDs/PropertyList-1.0.dtd">
3 | <plist version="1.0">
4 | <dict>
5 | 	<key>IDEDidComputeMac32BitWarning</key>
6 | 	<true/>
7 | </dict>
8 | </plist>
9 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/cpy.cuh:
--------------------------------------------------------------------------------
 1 | #include "common.cuh"
 2 | 
 3 | #define CUDA_CPY_BLOCK_SIZE 64
 4 | 
 5 | void ggml_cuda_cpy(ggml_backend_cuda_context & ctx, const ggml_tensor * src0, ggml_tensor * src1);
 6 | 
 7 | void ggml_cuda_dup(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
 8 | 
 9 | void* ggml_cuda_cpy_fn(const ggml_tensor * src0, ggml_tensor * src1);
10 | 


--------------------------------------------------------------------------------
/examples/whisper.swiftui/whisper.swiftui.xcodeproj/project.xcworkspace/xcshareddata/IDEWorkspaceChecks.plist:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="UTF-8"?>
2 | <!DOCTYPE plist PUBLIC "-//Apple//DTD PLIST 1.0//EN" "http://www.apple.com/DTDs/PropertyList-1.0.dtd">
3 | <plist version="1.0">
4 | <dict>
5 | 	<key>IDEDidComputeMac32BitWarning</key>
6 | 	<true/>
7 | </dict>
8 | </plist>
9 | 


--------------------------------------------------------------------------------
/scripts/convert-all.sh:
--------------------------------------------------------------------------------
1 | #!/bin/bash
2 | 
3 | models=( "tiny.en" "tiny" "base.en" "base" "small.en" "small" "medium.en" "medium" "large-v1" "large-v2" "large-v3" "large-v3-turbo" )
4 | 
5 | for model in "${models[@]}"; do
6 |     python3 models/convert-pt-to-ggml.py ~/.cache/whisper/$model.pt ../whisper models/
7 |     mv -v models/ggml-model.bin models/ggml-$model.bin
8 | done
9 | 


--------------------------------------------------------------------------------
/examples/wchess/CMakeLists.txt:
--------------------------------------------------------------------------------
 1 | add_subdirectory(libwchess)
 2 | set_target_properties(wchess-core PROPERTIES FOLDER "libs")
 3 | 
 4 | if (EMSCRIPTEN)
 5 |     add_subdirectory(wchess.wasm)
 6 |     set_target_properties(wchess.wasm PROPERTIES FOLDER "libs")
 7 | else()
 8 |     add_subdirectory(wchess.cmd)
 9 |     set_target_properties(wchess PROPERTIES FOLDER "libs")
10 | endif()
11 | 


--------------------------------------------------------------------------------
/examples/addon.node/package.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "name": "addon.node",
 3 |   "version": "0.0.0",
 4 |   "description": "",
 5 |   "main": "index.js",
 6 |   "author": "Qanhe Chen",
 7 |   "license": "MIT",
 8 |   "scripts": {
 9 |     "test": "jest"
10 |   },
11 |   "devDependencies": {
12 |     "cmake-js": "^7.1.1",
13 |     "jest": "^29.4.0",
14 |     "node-addon-api": "^5.0.0"
15 |   }
16 | }
17 | 


--------------------------------------------------------------------------------
/examples/server/CMakeLists.txt:
--------------------------------------------------------------------------------
 1 | set(TARGET whisper-server)
 2 | add_executable(${TARGET} server.cpp httplib.h)
 3 | 
 4 | include(DefaultTargetOptions)
 5 | 
 6 | target_link_libraries(${TARGET} PRIVATE common json_cpp whisper ${CMAKE_THREAD_LIBS_INIT})
 7 | 
 8 | if (WIN32)
 9 |     target_link_libraries(${TARGET} PRIVATE ws2_32)
10 | endif()
11 | 
12 | install(TARGETS ${TARGET} RUNTIME)
13 | 


--------------------------------------------------------------------------------
/samples/README.md:
--------------------------------------------------------------------------------
1 | # Audio samples
2 | 
3 | This folder contains various audio files used for testing.
4 | If you want to quickly get some more samples, simply run `make samples`. This will download several public audio files and convert them to the appropriate 16-bit WAV format using `ffmpeg`.
5 | 
6 | https://github.com/ggerganov/whisper.cpp/blob/a09ce6e8899198015729ffc49ae10f67370906b1/Makefile#L104-L123
7 | 


--------------------------------------------------------------------------------
/scripts/gen-authors.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/bash
 2 | #
 3 | # Regenerates the AUTHORS file from the commit history of the master branch.
 4 | 
 5 | # pass $(date) as an argument so a '%' or '\' in its output is never treated as a printf directive
 6 | printf '# date: %s\n' "$(date)" > AUTHORS
 7 | printf "# this file is auto-generated by scripts/gen-authors.sh\n\n" >> AUTHORS
 8 | 
 9 | git log --format='%an <%ae>' --reverse --date=short master | awk '!seen[$0]++' | sort >> AUTHORS
10 | 
11 | # if necessary, update your name here. for example: jdoe -> John Doe
12 | # "-i.bak" is accepted by both GNU and BSD sed, whereas "-i ''" only works with BSD sed
13 | sed -i.bak 's/^jdoe/John Doe/g' AUTHORS && rm -f AUTHORS.bak
14 | 


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/src/main/java/com/litongjava/whisper/android/java/app/App.java:
--------------------------------------------------------------------------------
 1 | package com.litongjava.whisper.android.java.app;
 2 | 
 3 | import android.app.Application;
 4 | 
 5 | import com.blankj.utilcode.util.Utils;
 6 | /** Application subclass that passes itself to utilcode's {@code Utils.init} when it is created. */
 7 | public class App extends Application {
 8 |   @Override
 9 |   public void onCreate() {
10 |     super.onCreate();
11 |     Utils.init(this); // hand this Application instance to com.blankj.utilcode
12 |   }
13 | }
14 | 


--------------------------------------------------------------------------------
/examples/whisper.android/app/src/main/java/com/whispercppdemo/ui/theme/Color.kt:
--------------------------------------------------------------------------------
 1 | package com.whispercppdemo.ui.theme
 2 | 
 3 | import androidx.compose.ui.graphics.Color
 4 | 
 5 | val Purple80 = Color(0xFFD0BCFF)
 6 | val PurpleGrey80 = Color(0xFFCCC2DC)
 7 | val Pink80 = Color(0xFFEFB8C8)
 8 | 
 9 | val Purple40 = Color(0xFF6650a4)
10 | val PurpleGrey40 = Color(0xFF625b71)
11 | val Pink40 = Color(0xFF7D5260)


--------------------------------------------------------------------------------
/examples/sycl/CMakeLists.txt:
--------------------------------------------------------------------------------
 1 | #  MIT license
 2 | #  Copyright (C) 2024 Intel Corporation
 3 | #  SPDX-License-Identifier: MIT
 4 | 
 5 | set(TARGET ls-sycl-device)
 6 | add_executable(${TARGET} ls-sycl-device.cpp)
 7 | install(TARGETS ${TARGET} RUNTIME)
 8 | target_link_libraries(${TARGET} PRIVATE common whisper ${CMAKE_THREAD_LIBS_INIT})
 9 | target_compile_features(${TARGET} PRIVATE cxx_std_17)
10 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-sycl/cpy.hpp:
--------------------------------------------------------------------------------
 1 | #ifndef GGML_SYCL_CPY_HPP
 2 | #define GGML_SYCL_CPY_HPP
 3 | 
 4 | #include "common.hpp"
 5 | 
 6 | typedef void (*cpy_kernel_t)(const char * cx, char * cdst);
 7 | 
 8 | void ggml_sycl_cpy(ggml_backend_sycl_context & ctx, const ggml_tensor * src0, const ggml_tensor * src1);
 9 | void ggml_sycl_dup(ggml_backend_sycl_context & ctx, ggml_tensor * dst);
10 | 
11 | #endif // GGML_SYCL_CPY_HPP
12 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-sycl/sycl_hw.cpp:
--------------------------------------------------------------------------------
 1 | #include "sycl_hw.hpp"
 2 | 
 3 | // Reads the Intel device id and the architecture of the given SYCL device into a sycl_hw_info.
 4 | sycl_hw_info get_device_hw_info(sycl::device *device_ptr) {
 5 |   sycl_hw_info hw_info;
 6 | 
 7 |   // The queried id is converted to int32_t before it is stored.
 8 |   hw_info.device_id = static_cast<int32_t>(
 9 |       device_ptr->get_info<sycl::ext::intel::info::device::device_id>());
10 |   hw_info.arch = device_ptr->get_info<syclex::info::device::architecture>();
11 | 
12 |   return hw_info;
13 | }
14 | 


--------------------------------------------------------------------------------
/bindings/java/src/main/java/io/github/ggerganov/whispercpp/params/WhisperSamplingStrategy.java:
--------------------------------------------------------------------------------
 1 | package io.github.ggerganov.whispercpp.params;
 2 | 
 3 | /** Available sampling strategies. NOTE(review): constant order presumably mirrors the native whisper_sampling_strategy enum - confirm before reordering. */
 4 | public enum WhisperSamplingStrategy {
 5 |     /** Greedy sampling; similar to OpenAI's GreedyDecoder. */
 6 |     WHISPER_SAMPLING_GREEDY,
 7 | 
 8 |     /** Beam search; similar to OpenAI's BeamSearchDecoder. */
 9 |     WHISPER_SAMPLING_BEAM_SEARCH
10 | }
11 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cpu/llamafile/sgemm.h:
--------------------------------------------------------------------------------
 1 | #pragma once
 2 | #include <stdint.h>
 3 | #include <stdbool.h>
 4 | #ifdef __cplusplus
 5 | extern "C" {
 6 | #endif
 7 | 
 8 | bool llamafile_sgemm(const struct ggml_compute_params * params, int64_t, int64_t, int64_t,
 9 |                      const void *, int64_t, const void *, int64_t, void *, int64_t,
10 |                      int, int, int);
11 | 
12 | #ifdef __cplusplus
13 | }
14 | #endif
15 | 


--------------------------------------------------------------------------------
/grammars/colors.gbnf:
--------------------------------------------------------------------------------
 1 | # - red
 2 | # - green
 3 | # - blue
 4 | #
 5 | # example:
 6 | #
 7 | #   ./command -m ./models/ggml-tiny.en.bin -t 8 --grammar ./grammars/colors.gbnf --prompt "red, green, blue," --context "green, red, blue,"
 8 | #
 9 | 
10 | root   ::= init color "."
11 | prompt ::= init "."
12 | 
13 | # leading space is very important!
14 | init ::= " red, green, blue"
15 | 
16 | color ::= ", " ("red" | "green" | "blue")
17 | 


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/src/main/java/com/whispercpp/java/whisper/WhisperCpuConfig.java:
--------------------------------------------------------------------------------
 1 | package com.whispercpp.java.whisper;
 2 | 
 3 | import android.os.Build;
 4 | 
 5 | import androidx.annotation.RequiresApi;
 6 | 
 7 | public class WhisperCpuConfig {
 8 |   /** Returns the high-performance core count reported by CpuInfo, raised to 2 when it is lower. */
 9 |   @RequiresApi(api = Build.VERSION_CODES.N)
10 |   public static int getPreferredThreadCount() {
11 |     final int highPerfCores = CpuInfo.getHighPerfCpuCount();
12 |     return highPerfCores < 2 ? 2 : highPerfCores;
13 |   }
14 | }
15 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cpu/kleidiai/kleidiai.h:
--------------------------------------------------------------------------------
 1 | // SPDX-FileCopyrightText: Copyright 2025 Arm Limited and/or its affiliates <open-source-office@arm.com>
 2 | // SPDX-License-Identifier: MIT
 3 | //
 4 | 
 5 | #pragma once
 6 | 
 7 | #include "ggml-alloc.h"
 8 | 
 9 | #ifdef  __cplusplus
10 | extern "C" {
11 | #endif
12 | 
13 | ggml_backend_buffer_type_t ggml_backend_cpu_kleidiai_buffer_type(void);
14 | 
15 | #ifdef  __cplusplus
16 | }
17 | #endif
18 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-mma-f16-instance-ncols1_1-ncols2_8.cu:
--------------------------------------------------------------------------------
 1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
 2 | 
 3 | #include "../fattn-mma-f16.cuh"
 4 | 
 5 | DECL_FATTN_MMA_F16_CASE(64, 1, 8);
 6 | DECL_FATTN_MMA_F16_CASE(80, 1, 8);
 7 | DECL_FATTN_MMA_F16_CASE(96, 1, 8);
 8 | DECL_FATTN_MMA_F16_CASE(112, 1, 8);
 9 | DECL_FATTN_MMA_F16_CASE(128, 1, 8);
10 | DECL_FATTN_MMA_F16_CASE(256, 1, 8);
11 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-mma-f16-instance-ncols1_2-ncols2_4.cu:
--------------------------------------------------------------------------------
 1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
 2 | 
 3 | #include "../fattn-mma-f16.cuh"
 4 | 
 5 | DECL_FATTN_MMA_F16_CASE(64, 2, 4);
 6 | DECL_FATTN_MMA_F16_CASE(80, 2, 4);
 7 | DECL_FATTN_MMA_F16_CASE(96, 2, 4);
 8 | DECL_FATTN_MMA_F16_CASE(112, 2, 4);
 9 | DECL_FATTN_MMA_F16_CASE(128, 2, 4);
10 | DECL_FATTN_MMA_F16_CASE(256, 2, 4);
11 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-mma-f16-instance-ncols1_2-ncols2_8.cu:
--------------------------------------------------------------------------------
 1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
 2 | 
 3 | #include "../fattn-mma-f16.cuh"
 4 | 
 5 | DECL_FATTN_MMA_F16_CASE(64, 2, 8);
 6 | DECL_FATTN_MMA_F16_CASE(80, 2, 8);
 7 | DECL_FATTN_MMA_F16_CASE(96, 2, 8);
 8 | DECL_FATTN_MMA_F16_CASE(112, 2, 8);
 9 | DECL_FATTN_MMA_F16_CASE(128, 2, 8);
10 | DECL_FATTN_MMA_F16_CASE(256, 2, 8);
11 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-mma-f16-instance-ncols1_4-ncols2_2.cu:
--------------------------------------------------------------------------------
 1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
 2 | 
 3 | #include "../fattn-mma-f16.cuh"
 4 | 
 5 | DECL_FATTN_MMA_F16_CASE(64, 4, 2);
 6 | DECL_FATTN_MMA_F16_CASE(80, 4, 2);
 7 | DECL_FATTN_MMA_F16_CASE(96, 4, 2);
 8 | DECL_FATTN_MMA_F16_CASE(112, 4, 2);
 9 | DECL_FATTN_MMA_F16_CASE(128, 4, 2);
10 | DECL_FATTN_MMA_F16_CASE(256, 4, 2);
11 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-mma-f16-instance-ncols1_4-ncols2_4.cu:
--------------------------------------------------------------------------------
 1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
 2 | 
 3 | #include "../fattn-mma-f16.cuh"
 4 | 
 5 | DECL_FATTN_MMA_F16_CASE(64, 4, 4);
 6 | DECL_FATTN_MMA_F16_CASE(80, 4, 4);
 7 | DECL_FATTN_MMA_F16_CASE(96, 4, 4);
 8 | DECL_FATTN_MMA_F16_CASE(112, 4, 4);
 9 | DECL_FATTN_MMA_F16_CASE(128, 4, 4);
10 | DECL_FATTN_MMA_F16_CASE(256, 4, 4);
11 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-mma-f16-instance-ncols1_4-ncols2_8.cu:
--------------------------------------------------------------------------------
 1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
 2 | 
 3 | #include "../fattn-mma-f16.cuh"
 4 | 
 5 | DECL_FATTN_MMA_F16_CASE(64, 4, 8);
 6 | DECL_FATTN_MMA_F16_CASE(80, 4, 8);
 7 | DECL_FATTN_MMA_F16_CASE(96, 4, 8);
 8 | DECL_FATTN_MMA_F16_CASE(112, 4, 8);
 9 | DECL_FATTN_MMA_F16_CASE(128, 4, 8);
10 | DECL_FATTN_MMA_F16_CASE(256, 4, 8);
11 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-mma-f16-instance-ncols1_8-ncols2_1.cu:
--------------------------------------------------------------------------------
 1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
 2 | 
 3 | #include "../fattn-mma-f16.cuh"
 4 | 
 5 | DECL_FATTN_MMA_F16_CASE(64, 8, 1);
 6 | DECL_FATTN_MMA_F16_CASE(80, 8, 1);
 7 | DECL_FATTN_MMA_F16_CASE(96, 8, 1);
 8 | DECL_FATTN_MMA_F16_CASE(112, 8, 1);
 9 | DECL_FATTN_MMA_F16_CASE(128, 8, 1);
10 | DECL_FATTN_MMA_F16_CASE(256, 8, 1);
11 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-mma-f16-instance-ncols1_8-ncols2_2.cu:
--------------------------------------------------------------------------------
 1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
 2 | 
 3 | #include "../fattn-mma-f16.cuh"
 4 | 
 5 | DECL_FATTN_MMA_F16_CASE(64, 8, 2);
 6 | DECL_FATTN_MMA_F16_CASE(80, 8, 2);
 7 | DECL_FATTN_MMA_F16_CASE(96, 8, 2);
 8 | DECL_FATTN_MMA_F16_CASE(112, 8, 2);
 9 | DECL_FATTN_MMA_F16_CASE(128, 8, 2);
10 | DECL_FATTN_MMA_F16_CASE(256, 8, 2);
11 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-mma-f16-instance-ncols1_8-ncols2_4.cu:
--------------------------------------------------------------------------------
 1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
 2 | 
 3 | #include "../fattn-mma-f16.cuh"
 4 | 
 5 | DECL_FATTN_MMA_F16_CASE(64, 8, 4);
 6 | DECL_FATTN_MMA_F16_CASE(80, 8, 4);
 7 | DECL_FATTN_MMA_F16_CASE(96, 8, 4);
 8 | DECL_FATTN_MMA_F16_CASE(112, 8, 4);
 9 | DECL_FATTN_MMA_F16_CASE(128, 8, 4);
10 | DECL_FATTN_MMA_F16_CASE(256, 8, 4);
11 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-mma-f16-instance-ncols1_8-ncols2_8.cu:
--------------------------------------------------------------------------------
 1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
 2 | 
 3 | #include "../fattn-mma-f16.cuh"
 4 | 
 5 | DECL_FATTN_MMA_F16_CASE(64, 8, 8);
 6 | DECL_FATTN_MMA_F16_CASE(80, 8, 8);
 7 | DECL_FATTN_MMA_F16_CASE(96, 8, 8);
 8 | DECL_FATTN_MMA_F16_CASE(112, 8, 8);
 9 | DECL_FATTN_MMA_F16_CASE(128, 8, 8);
10 | DECL_FATTN_MMA_F16_CASE(256, 8, 8);
11 | 


--------------------------------------------------------------------------------
/examples/whisper.android/settings.gradle:
--------------------------------------------------------------------------------
 1 | pluginManagement {
 2 |     repositories {
 3 |         gradlePluginPortal()
 4 |         google()
 5 |         mavenCentral()
 6 |     }
 7 | }
 8 | dependencyResolutionManagement {
 9 |     repositoriesMode.set(RepositoriesMode.FAIL_ON_PROJECT_REPOS)
10 |     repositories {
11 |         google()
12 |         mavenCentral()
13 |     }
14 | }
15 | rootProject.name = "WhisperCppDemo"
16 | include ':app'
17 | include ':lib'
18 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-mma-f16-instance-ncols1_16-ncols2_1.cu:
--------------------------------------------------------------------------------
 1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
 2 | 
 3 | #include "../fattn-mma-f16.cuh"
 4 | 
 5 | DECL_FATTN_MMA_F16_CASE(64, 16, 1);
 6 | DECL_FATTN_MMA_F16_CASE(80, 16, 1);
 7 | DECL_FATTN_MMA_F16_CASE(96, 16, 1);
 8 | DECL_FATTN_MMA_F16_CASE(112, 16, 1);
 9 | DECL_FATTN_MMA_F16_CASE(128, 16, 1);
10 | DECL_FATTN_MMA_F16_CASE(256, 16, 1);
11 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-mma-f16-instance-ncols1_16-ncols2_2.cu:
--------------------------------------------------------------------------------
 1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
 2 | 
 3 | #include "../fattn-mma-f16.cuh"
 4 | 
 5 | DECL_FATTN_MMA_F16_CASE(64, 16, 2);
 6 | DECL_FATTN_MMA_F16_CASE(80, 16, 2);
 7 | DECL_FATTN_MMA_F16_CASE(96, 16, 2);
 8 | DECL_FATTN_MMA_F16_CASE(112, 16, 2);
 9 | DECL_FATTN_MMA_F16_CASE(128, 16, 2);
10 | DECL_FATTN_MMA_F16_CASE(256, 16, 2);
11 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-mma-f16-instance-ncols1_16-ncols2_4.cu:
--------------------------------------------------------------------------------
 1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
 2 | 
 3 | #include "../fattn-mma-f16.cuh"
 4 | 
 5 | DECL_FATTN_MMA_F16_CASE(64, 16, 4);
 6 | DECL_FATTN_MMA_F16_CASE(80, 16, 4);
 7 | DECL_FATTN_MMA_F16_CASE(96, 16, 4);
 8 | DECL_FATTN_MMA_F16_CASE(112, 16, 4);
 9 | DECL_FATTN_MMA_F16_CASE(128, 16, 4);
10 | DECL_FATTN_MMA_F16_CASE(256, 16, 4);
11 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-mma-f16-instance-ncols1_32-ncols2_1.cu:
--------------------------------------------------------------------------------
 1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
 2 | 
 3 | #include "../fattn-mma-f16.cuh"
 4 | 
 5 | DECL_FATTN_MMA_F16_CASE(64, 32, 1);
 6 | DECL_FATTN_MMA_F16_CASE(80, 32, 1);
 7 | DECL_FATTN_MMA_F16_CASE(96, 32, 1);
 8 | DECL_FATTN_MMA_F16_CASE(112, 32, 1);
 9 | DECL_FATTN_MMA_F16_CASE(128, 32, 1);
10 | DECL_FATTN_MMA_F16_CASE(256, 32, 1);
11 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-mma-f16-instance-ncols1_32-ncols2_2.cu:
--------------------------------------------------------------------------------
 1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
 2 | 
 3 | #include "../fattn-mma-f16.cuh"
 4 | 
 5 | DECL_FATTN_MMA_F16_CASE(64, 32, 2);
 6 | DECL_FATTN_MMA_F16_CASE(80, 32, 2);
 7 | DECL_FATTN_MMA_F16_CASE(96, 32, 2);
 8 | DECL_FATTN_MMA_F16_CASE(112, 32, 2);
 9 | DECL_FATTN_MMA_F16_CASE(128, 32, 2);
10 | DECL_FATTN_MMA_F16_CASE(256, 32, 2);
11 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/template-instances/fattn-mma-f16-instance-ncols1_64-ncols2_1.cu:
--------------------------------------------------------------------------------
 1 | // This file has been autogenerated by generate_cu_files.py, do not edit manually.
 2 | 
 3 | #include "../fattn-mma-f16.cuh"
 4 | 
 5 | DECL_FATTN_MMA_F16_CASE(64, 64, 1);
 6 | DECL_FATTN_MMA_F16_CASE(80, 64, 1);
 7 | DECL_FATTN_MMA_F16_CASE(96, 64, 1);
 8 | DECL_FATTN_MMA_F16_CASE(112, 64, 1);
 9 | DECL_FATTN_MMA_F16_CASE(128, 64, 1);
10 | DECL_FATTN_MMA_F16_CASE(256, 64, 1);
11 | 


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/src/main/res/values/colors.xml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="utf-8"?>
 2 | <resources>
 3 |   <color name="purple_200">#FFBB86FC</color>
 4 |   <color name="purple_500">#FF6200EE</color>
 5 |   <color name="purple_700">#FF3700B3</color>
 6 |   <color name="teal_200">#FF03DAC5</color>
 7 |   <color name="teal_700">#FF018786</color>
 8 |   <color name="black">#FF000000</color>
 9 |   <color name="white">#FFFFFFFF</color>
10 | </resources>


--------------------------------------------------------------------------------
/ggml/src/ggml-cpu/amx/mmq.h:
--------------------------------------------------------------------------------
 1 | #pragma once
 2 | #include "common.h"
 3 | 
 4 | size_t ggml_backend_amx_desired_wsize(const struct ggml_tensor * dst);
 5 | 
 6 | size_t ggml_backend_amx_get_alloc_size(const struct ggml_tensor * tensor);
 7 | 
 8 | void ggml_backend_amx_convert_weight(struct ggml_tensor * tensor, const void * data, size_t offset, size_t size);
 9 | 
10 | void ggml_backend_amx_mul_mat(const struct ggml_compute_params * params, struct ggml_tensor * dst);
11 | 


--------------------------------------------------------------------------------
/bindings/go/go.mod:
--------------------------------------------------------------------------------
 1 | module github.com/ggerganov/whisper.cpp/bindings/go
 2 | 
 3 | go 1.23
 4 | 
 5 | require (
 6 | 	github.com/go-audio/wav v1.1.0
 7 | 	github.com/stretchr/testify v1.9.0
 8 | )
 9 | 
10 | require (
11 | 	github.com/davecgh/go-spew v1.1.1 // indirect
12 | 	github.com/go-audio/audio v1.0.0 // indirect
13 | 	github.com/go-audio/riff v1.0.0 // indirect
14 | 	github.com/pmezard/go-difflib v1.0.0 // indirect
15 | 	gopkg.in/yaml.v3 v3.0.1 // indirect
16 | )
17 | 


--------------------------------------------------------------------------------
/examples/wchess/libwchess/CMakeLists.txt:
--------------------------------------------------------------------------------
 1 | add_library(wchess-core STATIC
 2 |     WChess.cpp
 3 |     WChess.h
 4 |     Chessboard.cpp
 5 |     Chessboard.h
 6 | )
 7 | 
 8 | target_link_libraries(wchess-core
 9 |     PUBLIC
10 |     whisper
11 |     common
12 | )
13 | 
14 | target_include_directories(wchess-core
15 |     PUBLIC
16 |     "$<BUILD_INTERFACE:${CMAKE_CURRENT_SOURCE_DIR}>"
17 | )
18 | 
19 | # add_executable(test-chessboard test-chessboard.cpp Chessboard.cpp)
20 | 


--------------------------------------------------------------------------------
/examples/talk-llama/llama-io.cpp:
--------------------------------------------------------------------------------
 1 | #include "llama-io.h"
 2 | 
 3 | void llama_io_write_i::write_string(const std::string & str) {
 4 |     // Written as a 32-bit length followed by the string's bytes (no terminator).
 5 |     const uint32_t n_bytes = str.size();
 6 |     write(&n_bytes,   sizeof(n_bytes));
 7 |     write(str.data(), n_bytes);
 8 | }
 9 | 
10 | void llama_io_read_i::read_string(std::string & str) {
11 |     uint32_t n_bytes; // 32-bit length, filled in by read_to()
12 |     read_to(&n_bytes, sizeof(n_bytes));
13 |     const char * bytes = (const char *) read(n_bytes); // then that many bytes of payload
14 |     str.assign(bytes, n_bytes);
15 | }
16 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/convert.cuh:
--------------------------------------------------------------------------------
 1 | #include "common.cuh"
 2 | 
 3 | #define CUDA_DEQUANTIZE_BLOCK_SIZE 256
 4 | 
 5 | template<typename T>
 6 | using to_t_cuda_t = void (*)(const void * __restrict__ x, T * __restrict__ y, int64_t k, cudaStream_t stream);
 7 | 
 8 | typedef to_t_cuda_t<float> to_fp32_cuda_t;
 9 | typedef to_t_cuda_t<half> to_fp16_cuda_t;
10 | 
11 | to_fp16_cuda_t ggml_get_to_fp16_cuda(ggml_type type);
12 | 
13 | to_fp32_cuda_t ggml_get_to_fp32_cuda(ggml_type type);
14 | 


--------------------------------------------------------------------------------
/cmake/DefaultTargetOptions.cmake:
--------------------------------------------------------------------------------
 1 | # Set the default compile features and properties for a target.
 2 | 
 3 | if (NOT TARGET)  # the including script must set the TARGET variable before include()
 4 |     message(FATAL_ERROR "TARGET not set before including DefaultTargetOptions")
 5 | endif()
 6 | 
 7 | target_compile_features(${TARGET}
 8 |     PRIVATE
 9 |         cxx_std_11  # require at least C++11 for this target's own sources (not propagated to dependents)
10 |     )
11 | 
12 | set_target_properties(${TARGET}
13 |     PROPERTIES
14 |         EXPORT_COMPILE_COMMANDS ON
15 |         RUNTIME_OUTPUT_DIRECTORY "${CMAKE_BINARY_DIR}/bin"  # runtime artifacts are placed in <build dir>/bin
16 | )
17 | 


--------------------------------------------------------------------------------
/examples/whisper.android/app/src/test/java/com/whispercppdemo/ExampleUnitTest.kt:
--------------------------------------------------------------------------------
 1 | package com.whispercppdemo
 2 | 
 3 | import org.junit.Test
 4 | 
 5 | import org.junit.Assert.*
 6 | 
 7 | /**
 8 |  * Example local unit test, which will execute on the development machine (host).
 9 |  *
10 |  * See [testing documentation](http://d.android.com/tools/testing).
11 |  */
12 | class ExampleUnitTest {
13 |     /** Trivial arithmetic check: 2 + 2 must equal 4. */
14 |     @Test
15 |     fun addition_isCorrect() = assertEquals(4, 2 + 2)
16 | }


--------------------------------------------------------------------------------
/SDL2/README-SDL.txt:
--------------------------------------------------------------------------------
 1 | 
 2 | Please distribute this file with the SDL runtime environment:
 3 | 
 4 | The Simple DirectMedia Layer (SDL for short) is a cross-platform library
 5 | designed to make it easy to write multi-media software, such as games
 6 | and emulators.
 7 | 
 8 | The Simple DirectMedia Layer library source code is available from:
 9 | https://www.libsdl.org/
10 | 
11 | This library is distributed under the terms of the zlib license:
12 | http://www.zlib.net/zlib_license.html
13 | 
14 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/cos.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "types.comp"
 4 | #include "generic_unary_head.comp"
 5 | 
 6 | layout(local_size_x = 512, local_size_y = 1, local_size_z = 1) in;
 7 | 
 8 | void main() {
 9 |     // Element handled by this invocation; indices at or beyond p.ne are left untouched.
10 |     const uint elem = get_idx();
11 |     if (elem < p.ne) {
12 |         // Load through the source indexing helpers, convert to FLOAT_TYPE, then apply cos().
13 |         const FLOAT_TYPE x = FLOAT_TYPE(data_a[get_aoffset() + src0_idx(elem)]);
14 | 
15 |         data_d[get_doffset() + dst_idx(elem)] = D_TYPE(cos(x));
16 |     }
17 | }
18 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/sin.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "types.comp"
 4 | #include "generic_unary_head.comp"
 5 | 
 6 | layout(local_size_x = 512, local_size_y = 1, local_size_z = 1) in;
 7 | 
 8 | void main() {
 9 |     // Element handled by this invocation; indices at or beyond p.ne are left untouched.
10 |     const uint elem = get_idx();
11 |     if (elem < p.ne) {
12 |         // Load through the source indexing helpers, convert to FLOAT_TYPE, then apply sin().
13 |         const FLOAT_TYPE x = FLOAT_TYPE(data_a[get_aoffset() + src0_idx(elem)]);
14 | 
15 |         data_d[get_doffset() + dst_idx(elem)] = D_TYPE(sin(x));
16 |     }
17 | }
18 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/square.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "types.comp"
 4 | #include "generic_unary_head.comp"
 5 | 
 6 | layout(local_size_x = 512, local_size_y = 1, local_size_z = 1) in;
 7 | 
 8 | void main() {
 9 |     // Element handled by this invocation; indices at or beyond p.ne are left untouched.
10 |     const uint elem = get_idx();
11 |     if (elem < p.ne) {
12 |         // Load through the source indexing helpers, convert to FLOAT_TYPE, then multiply the value by itself.
13 |         const FLOAT_TYPE x = FLOAT_TYPE(data_a[get_aoffset() + src0_idx(elem)]);
14 | 
15 |         data_d[get_doffset() + dst_idx(elem)] = D_TYPE(x * x);
16 |     }
17 | }
18 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-amx/mmq.h:
--------------------------------------------------------------------------------
 1 | #pragma once
 2 | #include "common.h"
 3 | #include <stdint.h>
 4 | 
 5 | #ifdef __cplusplus
 6 | extern "C" {
 7 | #endif
 8 | 
 9 | size_t ggml_backend_amx_get_alloc_size(const struct ggml_tensor * tensor);
10 | 
11 | void ggml_backend_amx_convert_weight(struct ggml_tensor * tensor, const void * data, size_t offset, size_t size);
12 | 
13 | void ggml_backend_amx_mul_mat(ggml_backend_amx_context * ctx, struct ggml_tensor * dst);
14 | 
15 | #ifdef __cplusplus
16 | }
17 | #endif
18 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/norm.cuh:
--------------------------------------------------------------------------------
 1 | #include "common.cuh"
 2 | 
 3 | void ggml_cuda_op_norm(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
 4 | 
 5 | void ggml_cuda_op_group_norm(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
 6 | 
 7 | void ggml_cuda_op_rms_norm(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
 8 | 
 9 | void ggml_cuda_op_rms_norm_back(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
10 | 
11 | void ggml_cuda_op_l2_norm(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
12 | 


--------------------------------------------------------------------------------
/examples/common-ggml.h:
--------------------------------------------------------------------------------
 1 | #pragma once
 2 | 
 3 | #include "ggml.h"
 4 | 
 5 | #include <fstream>
 6 | #include <vector>
 7 | #include <string>
 8 | 
 9 | enum ggml_ftype ggml_parse_ftype(const char * str);
10 | 
11 | void ggml_print_ftypes(FILE * fp = stderr);
12 | 
13 | bool ggml_common_quantize_0(
14 |         std::ifstream & finp,
15 |         std::ofstream & fout,
16 |         const ggml_ftype ftype,
17 |         const std::vector<std::string> & to_quant,
18 |         const std::vector<std::string> & to_skip);
19 | 


--------------------------------------------------------------------------------
/examples/whisper.swiftui/whisper.swiftui.demo/Supporting files/WhisperCppDemo.entitlements:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="UTF-8"?>
 2 | <!DOCTYPE plist PUBLIC "-//Apple//DTD PLIST 1.0//EN" "http://www.apple.com/DTDs/PropertyList-1.0.dtd">
 3 | <plist version="1.0">
 4 | <dict>
 5 | 	<key>com.apple.security.app-sandbox</key>
 6 | 	<true/>
 7 | 	<key>com.apple.security.device.audio-input</key>
 8 | 	<true/>
 9 | 	<key>com.apple.security.files.user-selected.read-only</key>
10 | 	<true/>
11 | </dict>
12 | </plist>
13 | 


--------------------------------------------------------------------------------
/examples/whisper.swiftui/whisper.swiftui.demo/Utils/RiffWaveUtils.swift:
--------------------------------------------------------------------------------
 1 | import Foundation
 2 | 
 3 | /// Decodes the sample data of a WAV file into floats.
 4 | ///
 5 | /// The first 44 bytes are skipped and the remainder is read as 16-bit little-endian
 6 | /// integers, each divided by 32767 and clamped to [-1, 1]. Throws if the file cannot be read.
 7 | func decodeWaveFile(_ url: URL) throws -> [Float] {
 8 |     let data = try Data(contentsOf: url)
 9 |     // Stop at count - 1: with an odd byte count the last 2-byte slice would otherwise run past the end and trap.
10 |     let floats = stride(from: 44, to: data.count - 1, by: 2).map {
11 |         return data[$0..<$0 + 2].withUnsafeBytes {
12 |             let short = Int16(littleEndian: $0.load(as: Int16.self))
13 |             return max(-1.0, min(Float(short) / 32767.0, 1.0))
14 |         }
15 |     }
16 |     return floats
17 | }
18 | 


--------------------------------------------------------------------------------
/.github/workflows/bindings-go.yml:
--------------------------------------------------------------------------------
 1 | name: Bindings Tests (Go)
 2 | on:
 3 |   push:
 4 |     paths:
 5 |       - bindings/go/**
 6 |       - whisper.h
 7 |   pull_request:
 8 |     paths:
 9 |       - bindings/go/**
10 |       - whisper.h
11 | 
12 | jobs:
13 |   ubuntu-22:
14 |     runs-on: ubuntu-22.04
15 |     steps:
16 |       - uses: actions/setup-go@v5
17 |         with:
18 |           go-version: '^1.23'
19 |       - uses: actions/checkout@v4
20 |       - run: |
21 |           cd bindings/go
22 |           make test
23 | 


--------------------------------------------------------------------------------
/examples/whisper.android/.idea/misc.xml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="UTF-8"?>
 2 | <project version="4">
 3 |   <component name="ExternalStorageConfigurationManager" enabled="true" />
 4 |   <component name="ProjectRootManager" version="2" languageLevel="JDK_17" default="true" project-jdk-name="jbr-17" project-jdk-type="JavaSDK">
 5 |     <output url="file://$PROJECT_DIR$/build/classes" />
 6 |   </component>
 7 |   <component name="ProjectType">
 8 |     <option name="id" value="Android" />
 9 |   </component>
10 | </project>


--------------------------------------------------------------------------------
/examples/sycl/run-whisper.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/bash
 2 | 
 3 | #  MIT license
 4 | #  Copyright (C) 2024 Intel Corporation
 5 | #  SPDX-License-Identifier: MIT
 6 | 
 7 | INPUT2="Building a website can be done in 10 simple steps:\nStep 1:"
 8 | source /opt/intel/oneapi/setvars.sh
 9 | 
10 | if [ $# -gt 0 ]; then
11 |     export GGML_SYCL_DEVICE=$1
12 | else
13 |     export GGML_SYCL_DEVICE=0
14 | fi
15 | echo GGML_SYCL_DEVICE=$GGML_SYCL_DEVICE
16 | #export GGML_SYCL_DEBUG=1
17 | ./build/bin/main -m models/ggml-base.en.bin -f samples/jfk.wav


--------------------------------------------------------------------------------
/examples/whisper.swiftui/whisper.swiftui.demo/Models/Model.swift:
--------------------------------------------------------------------------------
 1 | import Foundation
 2 | 
 3 | struct Model: Identifiable {
 4 |     var id = UUID()
 5 |     var name: String
 6 |     var info: String
 7 |     var url: String
 8 |     var filename: String
 9 | 
10 |     /// Location of `filename` inside the first user-domain documents directory.
11 |     var fileURL: URL {
12 |         let documents = FileManager.default.urls(for: .documentDirectory, in: .userDomainMask)[0]
13 |         return documents.appendingPathComponent(filename)
14 |     }
15 |     /// Whether a file currently exists at `fileURL`.
16 |     func fileExists() -> Bool { return FileManager.default.fileExists(atPath: fileURL.path) }
17 | }
18 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-sycl/sycl_hw.hpp:
--------------------------------------------------------------------------------
 1 | #ifndef SYCL_HW_HPP
 2 | #define SYCL_HW_HPP
 3 | 
 4 | #include <algorithm>
 5 | #include <stdio.h>
 6 | #include <vector>
 7 | #include <map>
 8 | 
 9 | #include <sycl/sycl.hpp>
10 | 
11 | namespace syclex = sycl::ext::oneapi::experimental;
12 | 
13 | struct sycl_hw_info {
14 |   syclex::architecture arch;
15 |   int32_t device_id;
16 | };
17 | 
18 | bool is_in_vector(std::vector<int> &vec, int item);
19 | 
20 | sycl_hw_info get_device_hw_info(sycl::device *device_ptr);
21 | 
22 | 
23 | #endif // SYCL_HW_HPP
24 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/mmvq.cuh:
--------------------------------------------------------------------------------
 1 | #include "common.cuh"
 2 | 
 3 | #define MMVQ_MAX_BATCH_SIZE 8 // Max. batch size for which to use MMVQ kernels.
 4 | 
 5 | void ggml_cuda_op_mul_mat_vec_q(
 6 |     ggml_backend_cuda_context & ctx,
 7 |     const ggml_tensor * src0, const ggml_tensor * src1, ggml_tensor * dst, const char * src0_dd_i, const float * src1_ddf_i,
 8 |     const char * src1_ddq_i, float * dst_dd_i, const int64_t row_low, const int64_t row_high, const int64_t src1_ncols,
 9 |     const int64_t src1_padded_row_size, cudaStream_t stream);
10 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/binbcast.cuh:
--------------------------------------------------------------------------------
 1 | #include "common.cuh"
 2 | 
 3 | void ggml_cuda_op_repeat(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
 4 | void ggml_cuda_op_add(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
 5 | void ggml_cuda_op_sub(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
 6 | void ggml_cuda_op_mul(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
 7 | void ggml_cuda_op_div(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
 8 | 
 9 | void ggml_cuda_op_repeat_back(ggml_backend_cuda_context & ctx, ggml_tensor * dst);
10 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/clamp.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "types.comp"
 4 | #include "generic_unary_head.comp"
 5 | 
 6 | layout(local_size_x = 512, local_size_y = 1, local_size_z = 1) in;
 7 | 
 8 | void main() {
 9 |     const uint idx = get_idx();
10 |     // Nothing to do for indices at or beyond p.ne.
11 |     if (idx >= p.ne) {
12 |         return;
13 |     }
14 |     // Values below p.param1 become p.param1, values above p.param2 become p.param2, all others pass through.
15 |     const FLOAT_TYPE val = FLOAT_TYPE(data_a[get_aoffset() + src0_idx(idx)]);
16 |     data_d[get_doffset() + dst_idx(idx)] = D_TYPE(val < p.param1 ? p.param1 : (val > p.param2 ? p.param2 : val));
17 | }
18 | 


--------------------------------------------------------------------------------
/SDL2/BUGS.txt:
--------------------------------------------------------------------------------
 1 | 
 2 | Bugs are now managed in the SDL issue tracker, here:
 3 | 
 4 |     https://github.com/libsdl-org/SDL/issues
 5 | 
 6 | You may report bugs there, and search to see if a given issue has already
 7 |  been reported, discussed, and maybe even fixed.
 8 | 
 9 | 
10 | You may also find help at the SDL forums/mailing list:
11 | 
12 |     https://discourse.libsdl.org/
13 | 
14 | Bug reports are welcome here, but we really appreciate if you use the issue
15 |  tracker, as bugs discussed on the mailing list may be forgotten or missed.
16 | 
17 | 


--------------------------------------------------------------------------------
/bindings/java/src/main/java/io/github/ggerganov/whispercpp/params/WhisperHParams.java:
--------------------------------------------------------------------------------
 1 | package io.github.ggerganov.whispercpp.params;
 2 | 
 3 | public class WhisperHParams { // plain holder of package-private int fields, each with a hard-coded default
 4 |     int n_vocab       = 51864;
 5 |     int n_audio_ctx   = 1500;
 6 |     int n_audio_state = 384;
 7 |     int n_audio_head  = 6;
 8 |     int n_audio_layer = 4;
 9 |     int n_text_ctx    = 448;
10 |     int n_text_state  = 384;
11 |     int n_text_head   = 6;
12 |     int n_text_layer  = 4;
13 |     int n_mels        = 80;
14 |     int ftype         = 1; // NOTE(review): presumably a ggml file-type id — confirm against the native hparams
15 | }
16 | 


--------------------------------------------------------------------------------
/.devops/main.Dockerfile:
--------------------------------------------------------------------------------
 1 | FROM ubuntu:22.04 AS build
 2 | WORKDIR /app
 3 | # Compiler toolchain plus wget/cmake/git; the apt caches are removed in the same layer.
 4 | RUN apt-get update && \
 5 |   apt-get install -y build-essential wget cmake git \
 6 |   && rm -rf /var/lib/apt/lists/* /var/cache/apt/archives/*
 7 | # Copy the build context itself; a ".." source names a path outside the context and is not portable across builders.
 8 | COPY . .
 9 | RUN make base.en
10 | 
11 | FROM ubuntu:22.04 AS runtime
12 | WORKDIR /app
13 | # Installs curl, ffmpeg, libsdl2-dev, wget, cmake and git; the apt caches are removed in the same layer.
14 | RUN apt-get update && \
15 |   apt-get install -y curl ffmpeg libsdl2-dev wget cmake git \
16 |   && rm -rf /var/lib/apt/lists/* /var/cache/apt/archives/*
17 | # Bring over the whole /app tree from the build stage; container arguments are run through `bash -c`.
18 | COPY --from=build /app /app
19 | ENTRYPOINT [ "bash", "-c" ]
20 | 


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/src/test/java/com/litongjava/whisper/android/java/ExampleUnitTest.java:
--------------------------------------------------------------------------------
 1 | package com.litongjava.whisper.android.java;
 2 | 
 3 | import org.junit.Test;
 4 | 
 5 | import static org.junit.Assert.*;
 6 | 
 7 | /**
 8 |  * Example local unit test, which will execute on the development machine (host).
 9 |  *
10 |  * @see <a href="http://d.android.com/tools/testing">Testing documentation</a>
11 |  */
12 | public class ExampleUnitTest {
13 |   /** Trivial arithmetic check: 2 + 2 must equal 4. */
14 |   @Test
15 |   public void addition_isCorrect() {
16 |     final int sum = 2 + 2;
17 |     assertEquals(4, sum);
18 |   }
19 | }


--------------------------------------------------------------------------------
/examples/stream.wasm/README.md:
--------------------------------------------------------------------------------
 1 | # stream.wasm
 2 | 
 3 | Real-time transcription in the browser using WebAssembly
 4 | 
 5 | Online demo: https://whisper.ggerganov.com/stream/
 6 | 
 7 | ## Build instructions
 8 | 
 9 | ```bash
10 | # build using Emscripten (v3.1.2)
11 | git clone https://github.com/ggerganov/whisper.cpp
12 | cd whisper.cpp
13 | mkdir build-em && cd build-em
14 | emcmake cmake ..
15 | make -j
16 | 
17 | # copy the produced page to your HTTP path
18 | cp bin/stream.wasm/*       /path/to/html/
19 | cp bin/libstream.worker.js /path/to/html/
20 | ```
21 | 


--------------------------------------------------------------------------------
/bindings/ruby/tests/test_error.rb:
--------------------------------------------------------------------------------
 1 | require_relative "helper"
 2 | 
 3 | class TestError < TestBase
 4 |   def test_error
 5 |     error = Whisper::Error.new(-2)
 6 |     assert_equal "failed to compute log mel spectrogram", error.message
 7 |     assert_equal -2, error.code
 8 |   end
 9 | 
10 |   def test_unknown_error
11 |     error = Whisper::Error.new(-20)
12 |     assert_equal "unknown error", error.message
13 |   end
14 | 
15 |   def test_non_int_code
16 |     assert_raise TypeError do
17 |       error = Whisper::Error.new("non int")
18 |     end
19 |   end
20 | end
21 | 


--------------------------------------------------------------------------------
/examples/whisper.objc/whisper.objc/main.m:
--------------------------------------------------------------------------------
 1 | //
 2 | //  main.m
 3 | //  whisper.objc
 4 | //
 5 | //  Created by Georgi Gerganov on 23.10.22.
 6 | //
 7 | 
 8 | #import <UIKit/UIKit.h>
 9 | #import "AppDelegate.h"
10 | 
11 | int main(int argc, char * argv[]) {
12 |     NSString * delegateClassName = nil;
13 |     @autoreleasepool {
14 |         // Objects autoreleased while resolving the delegate class name are drained when this pool ends.
15 |         delegateClassName = NSStringFromClass([AppDelegate class]);
16 |     }
17 |     return UIApplicationMain(argc, argv, nil, delegateClassName);
18 | }
19 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-kompute/kompute-shaders/op_scale.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "common.comp"
 4 | 
 5 | layout(local_size_x = 1) in;
 6 | 
 7 | layout(binding = 0) buffer restrict readonly tensorIn { float in_[]; };
 8 | layout(binding = 1) buffer restrict writeonly tensorOut { float out_[]; };
 9 | 
10 | layout(push_constant) uniform PushConstants {
11 |     uint inOff;
12 |     uint outOff;
13 |     float scale;
14 | } pcs;
15 | 
16 | void main() {
17 |     // local_size_x is 1, so the work-group x index selects the single element this invocation scales
18 |     out_[gl_WorkGroupID.x + pcs.outOff] = pcs.scale * in_[gl_WorkGroupID.x + pcs.inOff];
19 | }
20 | 


--------------------------------------------------------------------------------
/scripts/sync-llama.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/bash
 2 | # Copies llama.cpp sources from ../llama.cpp into ./examples/talk-llama; both paths are relative to the current directory.
 3 | cp -rpv ../llama.cpp/include/llama.h ./examples/talk-llama/llama.h
 4 | # cp flags: -r recursive, -p preserve mode/ownership/timestamps, -v print each copied file
 5 | cp -rpv ../llama.cpp/src/llama*.cpp       ./examples/talk-llama/
 6 | cp -rpv ../llama.cpp/src/llama*.h         ./examples/talk-llama/
 7 | cp -rpv ../llama.cpp/src/unicode.h        ./examples/talk-llama/unicode.h
 8 | cp -rpv ../llama.cpp/src/unicode.cpp      ./examples/talk-llama/unicode.cpp
 9 | cp -rpv ../llama.cpp/src/unicode-data.h   ./examples/talk-llama/unicode-data.h
10 | cp -rpv ../llama.cpp/src/unicode-data.cpp ./examples/talk-llama/unicode-data.cpp
11 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/vendors/cuda.h:
--------------------------------------------------------------------------------
 1 | #pragma once
 2 | 
 3 | #include <cuda_runtime.h>
 4 | #include <cuda.h>
 5 | #include <cublas_v2.h>
 6 | #include <cuda_bf16.h>
 7 | #include <cuda_fp16.h>
 8 | 
 9 | #if CUDART_VERSION < 11020
10 | #define CU_DEVICE_ATTRIBUTE_VIRTUAL_MEMORY_MANAGEMENT_SUPPORTED CU_DEVICE_ATTRIBUTE_VIRTUAL_ADDRESS_MANAGEMENT_SUPPORTED
11 | #define CUBLAS_TF32_TENSOR_OP_MATH CUBLAS_TENSOR_OP_MATH
12 | #define CUBLAS_COMPUTE_16F CUDA_R_16F
13 | #define CUBLAS_COMPUTE_32F CUDA_R_32F
14 | #define cublasComputeType_t cudaDataType_t
15 | #endif // CUDART_VERSION < 11020
16 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/dequant_f32.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "dequant_head.comp"
 4 | 
 5 | layout(local_size_x = 256, local_size_y = 1, local_size_z = 1) in;
 6 | 
 7 | layout (binding = 0) readonly buffer A {float data_a[];};
 8 | layout (binding = 1) writeonly buffer D {D_TYPE data_b[];};
 9 | 
10 | void main() {
11 |     // Each invocation converts a run of 16 consecutive floats starting at i into D_TYPE.
12 |     const uint i = gl_GlobalInvocationID.x * 16;
13 |     if (i >= p.nel) {
14 |         return;
15 |     }
16 |     [[unroll]] for (uint l = 0; l < 16; l++) {
17 |         // Guard every element: when p.nel is not a multiple of 16 the last run must not touch indices >= p.nel.
18 |         if (i + l < p.nel) { data_b[i + l] = D_TYPE(data_a[i + l]); }
19 |     }
20 | }
21 | 


--------------------------------------------------------------------------------
/examples/console.h:
--------------------------------------------------------------------------------
 1 | // Console functions
 2 | 
 3 | #pragma once
 4 | 
 5 | #include <string>
 6 | 
 7 | namespace console {
 8 |     enum display_t {
 9 |         reset = 0,
10 |         prompt,
11 |         user_input,
12 |         error
13 |     };
14 | 
15 |     void init(bool use_simple_io, bool use_advanced_display);
16 |     void cleanup();
17 |     void set_display(display_t display);
18 |     bool readline(std::string & line, bool multiline_input);
19 |     std::wstring UTF8toUTF16(const std::string& utf8Str);
20 |     std::string UTF16toUTF8(const std::wstring & utf16Str);
21 | }
22 | 


--------------------------------------------------------------------------------
/examples/whisper.android/app/src/main/res/xml/backup_rules.xml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="utf-8"?><!--
 2 |    Sample backup rules file; uncomment and customize as necessary.
 3 |    See https://developer.android.com/guide/topics/data/autobackup
 4 |    for details.
 5 |    Note: This file is ignored for devices older than API 31
 6 |    See https://developer.android.com/about/versions/12/backup-restore
 7 | -->
 8 | <full-backup-content>
 9 |     <!--
10 |    <include domain="sharedpref" path="."/>
11 |    <exclude domain="sharedpref" path="device.xml"/>
12 | -->
13 | </full-backup-content>


--------------------------------------------------------------------------------
/bindings/java/src/main/java/io/github/ggerganov/whispercpp/ggml/GgmlType.java:
--------------------------------------------------------------------------------
 1 | package io.github.ggerganov.whispercpp.ggml;
 2 | 
 3 | public enum GgmlType { // NOTE(review): constant order presumably mirrors the native ggml type ids — confirm before reordering
 4 |     GGML_TYPE_F32,
 5 |     GGML_TYPE_F16,
 6 |     GGML_TYPE_Q4_0,
 7 |     GGML_TYPE_Q4_1,
 8 |     REMOVED_GGML_TYPE_Q4_2,  // support has been removed; the placeholder keeps the ordinals of later constants unchanged
 9 |     REMOVED_GGML_TYPE_Q4_3, // support has been removed; the placeholder keeps the ordinals of later constants unchanged
10 |     GGML_TYPE_Q5_0,
11 |     GGML_TYPE_Q5_1,
12 |     GGML_TYPE_Q8_0,
13 |     GGML_TYPE_Q8_1,
14 |     GGML_TYPE_I8,
15 |     GGML_TYPE_I16,
16 |     GGML_TYPE_I32,
17 |     GGML_TYPE_COUNT, // last constant; its ordinal equals the number of constants declared before it
18 | }
19 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/copy.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "types.comp"
 4 | #include "generic_unary_head.comp"
 5 | 
 6 | layout(local_size_x = 512, local_size_y = 1, local_size_z = 1) in;
 7 | 
 8 | void main() {
 9 |     const uint idx = get_idx();
10 |     // Nothing to do for indices at or beyond p.ne.
11 |     if (idx >= p.ne) {
12 |         return;
13 |     }
14 |     // Default path converts explicitly to D_TYPE; with OPTIMIZATION_ERROR_WORKAROUND defined the value is assigned without the constructor.
15 | #ifndef OPTIMIZATION_ERROR_WORKAROUND
16 |     data_d[get_doffset() + dst_idx(idx)] = D_TYPE(data_a[get_aoffset() + src0_idx(idx)]);
17 | #else
18 |     data_d[get_doffset() + dst_idx(idx)] = data_a[get_aoffset() + src0_idx(idx)];
19 | #endif
20 | }
21 | 


--------------------------------------------------------------------------------
/examples/talk-llama/speak.ps1:
--------------------------------------------------------------------------------
 1 | # Set-ExecutionPolicy -ExecutionPolicy Bypass -Scope CurrentUser
 2 | param(
 3 |   [Parameter(Mandatory=$true)][int]$voicenum, # index of the voice to use; wrapped by the modulo below
 4 |   [Parameter(Mandatory=$true)][string]$textfile # path of the text file to read aloud
 5 | )
 6 | 
 7 | Add-Type -AssemblyName System.Speech;
 8 | $speak = New-Object System.Speech.Synthesis.SpeechSynthesizer;
 9 | $voiceoptions = $speak.GetInstalledVoices("en-US"); # only voices for the en-US culture are considered
10 | $voice = $voiceoptions[$voicenum % $voiceoptions.count]; # NOTE(review): divides by zero when no en-US voice is installed
11 | $speak.SelectVoice($voice.VoiceInfo.Name);
12 | $speak.Rate="0";
13 | $text = Get-Content -Path $textfile; # file contents, passed to Speak below
14 | $speak.Speak($text);
15 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-sycl/concat.hpp:
--------------------------------------------------------------------------------
 1 | //
 2 | // MIT license
 3 | // Copyright (C) 2024 Intel Corporation
 4 | // SPDX-License-Identifier: MIT
 5 | //
 6 | 
 7 | //
 8 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 9 | // See https://llvm.org/LICENSE.txt for license information.
10 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
11 | //
12 | 
13 | #ifndef GGML_SYCL_CONCAT_HPP
14 | #define GGML_SYCL_CONCAT_HPP
15 | 
16 | #include "common.hpp"
17 | 
18 | void ggml_sycl_op_concat(ggml_backend_sycl_context & ctx, ggml_tensor *dst);
19 | 
20 | #endif // GGML_SYCL_CONCAT_HPP
21 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-sycl/conv.hpp:
--------------------------------------------------------------------------------
 1 | //
 2 | // MIT license
 3 | // Copyright (C) 2024 Intel Corporation
 4 | // SPDX-License-Identifier: MIT
 5 | //
 6 | 
 7 | //
 8 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 9 | // See https://llvm.org/LICENSE.txt for license information.
10 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
11 | //
12 | 
13 | #ifndef GGML_SYCL_CONV_HPP
14 | #define GGML_SYCL_CONV_HPP
15 | 
16 | #include "common.hpp"
17 | 
18 | void ggml_sycl_op_conv_transpose_1d(ggml_backend_sycl_context & ctx, ggml_tensor *dst);
19 | 
20 | #endif // GGML_SYCL_CONV_HPP
21 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-sycl/softmax.hpp:
--------------------------------------------------------------------------------
 1 | //
 2 | // MIT license
 3 | // Copyright (C) 2024 Intel Corporation
 4 | // SPDX-License-Identifier: MIT
 5 | //
 6 | 
 7 | //
 8 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 9 | // See https://llvm.org/LICENSE.txt for license information.
10 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
11 | //
12 | 
13 | #ifndef GGML_SYCL_SOFTMAX_HPP
14 | #define GGML_SYCL_SOFTMAX_HPP
15 | 
16 | #include "common.hpp"
17 | 
18 | void ggml_sycl_op_soft_max(ggml_backend_sycl_context &ctx, ggml_tensor *dst);
19 | 
20 | #endif // GGML_SYCL_SOFTMAX_HPP
21 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-sycl/tsembd.hpp:
--------------------------------------------------------------------------------
 1 | //
 2 | // MIT license
 3 | // Copyright (C) 2024 Intel Corporation
 4 | // SPDX-License-Identifier: MIT
 5 | //
 6 | 
 7 | //
 8 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 9 | // See https://llvm.org/LICENSE.txt for license information.
10 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
11 | //
12 | 
13 | #ifndef GGML_SYCL_TSEMBD_HPP
14 | #define GGML_SYCL_TSEMBD_HPP
15 | 
16 | #include "common.hpp"
17 | 
18 | void ggml_sycl_op_timestep_embedding(ggml_backend_sycl_context & ctx, ggml_tensor * dst);
19 | 
20 | #endif // GGML_SYCL_TSEMBD_HPP
21 | 


--------------------------------------------------------------------------------
/bindings/java/src/main/java/io/github/ggerganov/whispercpp/params/GreedyParams.java:
--------------------------------------------------------------------------------
 1 | package io.github.ggerganov.whispercpp.params;
 2 | 
 3 | import com.sun.jna.Structure;
 4 | 
 5 | import java.util.Collections;
 6 | import java.util.List;
 7 | 
 8 | public class GreedyParams extends Structure { // JNA structure with a single int member
 9 |     /** Upstream reference: <a href="https://github.com/openai/whisper/blob/f82bc59f5ea234d4b97fb2860842ed38519f7e65/whisper/transcribe.py#L264">...</a> */
10 |     public int best_of;
11 | 
12 |     @Override
13 |     protected List<String> getFieldOrder() { // reports the structure's field names in declaration order
14 |         return Collections.singletonList("best_of");
15 |     }
16 | }
17 | 


--------------------------------------------------------------------------------
/bindings/ruby/tests/helper.rb:
--------------------------------------------------------------------------------
 1 | require "test/unit"
 2 | require "whisper"
 3 | require_relative "jfk_reader/jfk_reader"
 4 | 
 5 | class TestBase < Test::Unit::TestCase
 6 |   AUDIO = File.join(__dir__, "..", "..", "..", "samples", "jfk.wav")
 7 | 
 8 |   class << self
 9 |     attr_reader :whisper
10 | 
11 |     def startup
12 |       @whisper = Whisper::Context.new("base.en")
13 |       params = Whisper::Params.new
14 |       params.print_timestamps = false
15 |       @whisper.transcribe(TestBase::AUDIO, params)
16 |     end
17 |   end
18 | 
19 |   private
20 | 
21 |   def whisper
22 |     self.class.whisper
23 |   end
24 | end
25 | 


--------------------------------------------------------------------------------
/examples/bench.wasm/README.md:
--------------------------------------------------------------------------------
 1 | # bench.wasm
 2 | 
 3 | Benchmark the performance of whisper.cpp in the browser using WebAssembly
 4 | 
 5 | Link: https://whisper.ggerganov.com/bench/
 6 | 
 7 | Terminal version: [examples/bench](/examples/bench)
 8 | 
 9 | ## Build instructions
10 | 
11 | ```bash
12 | # build using Emscripten (v3.1.2)
13 | git clone https://github.com/ggerganov/whisper.cpp
14 | cd whisper.cpp
15 | mkdir build-em && cd build-em
16 | emcmake cmake ..
17 | make -j
18 | 
19 | # copy the produced page to your HTTP path
20 | cp bin/bench.wasm/*       /path/to/html/
21 | cp bin/libbench.worker.js /path/to/html/
22 | ```
23 | 


--------------------------------------------------------------------------------
/examples/whisper.android.java/build.gradle:
--------------------------------------------------------------------------------
 1 | // Top-level build file where you can add configuration options common to all sub-projects/modules.
 2 | buildscript {
 3 |   repositories {
 4 |     google()
 5 |     jcenter()
 6 |   }
 7 |   dependencies {
 8 |     classpath "com.android.tools.build:gradle:4.1.3"
 9 | 
10 |     // NOTE: Do not place your application dependencies here; they belong
11 |     // in the individual module build.gradle files
12 |   }
13 | }
14 | 
15 | allprojects {
16 |   repositories {
17 |     google()
18 |     jcenter()
19 |   }
20 | }
21 | 
22 | task clean(type: Delete) {
23 |   delete rootProject.buildDir
24 | }


--------------------------------------------------------------------------------
/ggml/src/ggml-opencl/kernels/embed_kernel.py:
--------------------------------------------------------------------------------
 1 | #
 2 | 
 3 | import sys
 4 | import logging
 5 | logger = logging.getLogger("opencl-embed-kernel")
 6 | 
 7 | 
 8 | def main():
 9 |     logging.basicConfig(level=logging.INFO)
10 | 
11 |     if len(sys.argv) != 3:
12 |         logger.info("Usage: python embed_kernel.py <input_file> <output_file>")
13 |         sys.exit(1)
14 | 
15 |     ifile = open(sys.argv[1], "r")
16 |     ofile = open(sys.argv[2], "w")
17 | 
18 |     for i in ifile:
19 |         ofile.write('R"({})"\n'.format(i))
20 | 
21 |     ifile.close()
22 |     ofile.close()
23 | 
24 | 
25 | if __name__ == "__main__":
26 |     main()
27 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-kompute/kompute-shaders/op_relu.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "common.comp"
 4 | 
 5 | layout(local_size_x = 1) in;
 6 | 
 7 | layout(binding = 0) buffer restrict readonly tensorIn { float in_[]; };
 8 | layout(binding = 1) buffer restrict writeonly tensorOut { float out_[]; };
 9 | layout(push_constant) uniform PushConstants {
10 |     uint inOff;
11 |     uint outOff;
12 | } pcs;
13 | // ReLU over floats: each workgroup clamps 4 consecutive elements at zero.
14 | void main() {
15 |     const uint first = gl_WorkGroupID.x * 4;
16 | 
17 |     for (uint k = 0; k < 4; ++k) {
18 |         const uint idx = first + k;
19 |         out_[pcs.outOff + idx] = max(0.0, in_[pcs.inOff + idx]);
20 |     }
21 | }
22 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/relu.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "generic_head.comp"
 4 | #include "types.comp"
 5 | 
 6 | #extension GL_EXT_control_flow_attributes : enable
 7 | 
 8 | layout(local_size_x = 512, local_size_y = 1, local_size_z = 1) in;
 9 | 
10 | layout (binding = 0) readonly buffer X {A_TYPE data_a[];};
11 | layout (binding = 1) writeonly buffer D {D_TYPE data_d[];};
12 | // ReLU: data_d[i] = max(data_a[i], 0) for every element index i below p.KX.
13 | void main() {
14 |     const uint i = gl_GlobalInvocationID.z * 262144 + gl_GlobalInvocationID.y * 512 + gl_GlobalInvocationID.x;
15 | 
16 |     if (i >= p.KX) {
17 |         return;
18 |     }
19 |     // Convert explicitly to D_TYPE, as the other unary shaders do, so the store does not rely on an implicit conversion.
20 |     data_d[i] = D_TYPE(max(float(data_a[i]), 0.0f));
21 | }
22 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/sigmoid.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "generic_head.comp"
 4 | #include "types.comp"
 5 | 
 6 | #extension GL_EXT_control_flow_attributes : enable
 7 | 
 8 | layout(local_size_x = 512, local_size_y = 1, local_size_z = 1) in;
 9 | 
10 | layout (binding = 0) readonly buffer X {A_TYPE data_a[];};
11 | layout (binding = 1) writeonly buffer D {D_TYPE data_d[];};
12 | // Logistic sigmoid: data_d[i] = 1 / (1 + exp(-data_a[i])) for every i below p.KX.
13 | void main() {
14 |     const uint i = gl_GlobalInvocationID.z * 262144 + gl_GlobalInvocationID.y * 512 + gl_GlobalInvocationID.x;
15 | 
16 |     if (i >= p.KX) {
17 |         return;
18 |     }
19 |     data_d[i] = D_TYPE(1.0f / (1.0f + exp(-float(data_a[i])))); // explicit float(), as in the sibling unary shaders
20 | }
21 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/tanh.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "generic_head.comp"
 4 | #include "types.comp"
 5 | 
 6 | #extension GL_EXT_control_flow_attributes : enable
 7 | 
 8 | layout(local_size_x = 512, local_size_y = 1, local_size_z = 1) in;
 9 | 
10 | layout (binding = 0) readonly buffer X {A_TYPE data_a[];};
11 | layout (binding = 1) writeonly buffer D {D_TYPE data_d[];};
12 | // tanh via exp: data_d[i] = 1 - 2 / (exp(2 * data_a[i]) + 1) for every i below p.KX.
13 | void main() {
14 |     const uint i = gl_GlobalInvocationID.z * 262144 + gl_GlobalInvocationID.y * 512 + gl_GlobalInvocationID.x;
15 | 
16 |     if (i >= p.KX) {
17 |         return;
18 |     }
19 |     data_d[i] = D_TYPE(1.0f - 2.0f / (exp(2.0f * float(data_a[i])) + 1.0f)); // explicit float(), as in the sibling unary shaders
20 | }
21 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-kompute/kompute-shaders/op_scale_8.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "common.comp"
 4 | 
 5 | layout(local_size_x = 1) in;
 6 | 
 7 | layout(binding = 0) buffer restrict readonly tensorIn { float in_[]; };
 8 | layout(binding = 1) buffer restrict writeonly tensorOut { float out_[]; };
 9 | 
10 | layout(push_constant) uniform PushConstants {
11 |     uint inOff;
12 |     uint outOff;
13 |     float scale;
14 | } pcs;
15 | // Multiplies floats by pcs.scale: each workgroup handles 8 consecutive elements.
16 | void main() {
17 |     const uint first = gl_WorkGroupID.x * 8;
18 | 
19 |     for (uint k = 0; k < 8; ++k) {
20 |         const uint idx = first + k;
21 |         out_[pcs.outOff + idx] = in_[pcs.inOff + idx] * pcs.scale;
22 |     }
23 | }
24 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-kompute/kompute-shaders/op_silu.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "common.comp"
 4 | 
 5 | layout(local_size_x = 1) in;
 6 | 
 7 | layout(binding = 0) buffer restrict readonly tensorIn { float in_[]; };
 8 | layout(binding = 1) buffer restrict writeonly tensorOut { float out_[]; };
 9 | layout(push_constant) uniform PushConstants {
10 |     uint inOff;
11 |     uint outOff;
12 | } pcs;
13 | // SiLU (v / (1 + exp(-v))) over floats: each workgroup handles 4 consecutive elements.
14 | void main() {
15 |     const uint first = gl_WorkGroupID.x * 4;
16 | 
17 |     for (uint k = 0; k < 4; ++k) {
18 |         const uint idx = first + k;
19 |         const float v = in_[pcs.inOff + idx];
20 |         out_[pcs.outOff + idx] = v / (1.0 + exp(-v));
21 |     }
22 | }
23 | 


--------------------------------------------------------------------------------
/examples/whisper.android/app/src/main/res/xml/data_extraction_rules.xml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="utf-8"?><!--
 2 |    Sample data extraction rules file; uncomment and customize as necessary.
 3 |    See https://developer.android.com/about/versions/12/backup-restore#xml-changes
 4 |    for details.
 5 | -->
 6 | <data-extraction-rules>
 7 |     <cloud-backup>
 8 |         <!-- TODO: Use <include> and <exclude> to control what is backed up.
 9 |         <include .../>
10 |         <exclude .../>
11 |         -->
12 |     </cloud-backup>
13 |     <!--
14 |     <device-transfer>
15 |         <include .../>
16 |         <exclude .../>
17 |     </device-transfer>
18 |     -->
19 | </data-extraction-rules>


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/cmake/host-toolchain.cmake.in:
--------------------------------------------------------------------------------
 1 | set(CMAKE_BUILD_TYPE Release)
 2 | set(CMAKE_C_FLAGS -O2)
 3 | set(CMAKE_CXX_FLAGS -O2)
 4 | set(CMAKE_FIND_ROOT_PATH_MODE_PROGRAM NEVER)
 5 | set(CMAKE_FIND_ROOT_PATH_MODE_LIBRARY NEVER)
 6 | set(CMAKE_FIND_ROOT_PATH_MODE_INCLUDE NEVER)
 7 | set(CMAKE_C_COMPILER "@HOST_C_COMPILER@") # quoted: substituted paths may contain spaces
 8 | set(CMAKE_CXX_COMPILER "@HOST_CXX_COMPILER@")
 9 | set(CMAKE_RUNTIME_OUTPUT_DIRECTORY "@CMAKE_RUNTIME_OUTPUT_DIRECTORY@")
10 | # With MSVC, apply the same output directory to every per-configuration variable.
11 | if("@CMAKE_C_COMPILER_ID@" STREQUAL "MSVC")
12 |     foreach(CONFIG IN ITEMS DEBUG RELEASE MINSIZEREL RELWITHDEBINFO)
13 |         set(CMAKE_RUNTIME_OUTPUT_DIRECTORY_${CONFIG} ${CMAKE_RUNTIME_OUTPUT_DIRECTORY})
14 |     endforeach()
15 | endif()
16 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/silu.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "generic_head.comp"
 4 | #include "types.comp"
 5 | 
 6 | #extension GL_EXT_control_flow_attributes : enable
 7 | 
 8 | layout(local_size_x = 512, local_size_y = 1, local_size_z = 1) in;
 9 | 
10 | layout (binding = 0) readonly buffer X {A_TYPE data_a[];};
11 | layout (binding = 1) writeonly buffer D {D_TYPE data_d[];};
12 | // SiLU: data_d[idx] = v / (1 + exp(-v)) with v = float(data_a[idx]), for idx below p.KX.
13 | void main() {
14 |     const uint idx = gl_GlobalInvocationID.z * 262144 + gl_GlobalInvocationID.y * 512 + gl_GlobalInvocationID.x;
15 | 
16 |     // Invocations past the last element have nothing to do.
17 |     if (idx < p.KX) {
18 |         const float v     = float(data_a[idx]);
19 |         const float denom = 1.0f + exp(-v);
20 |         data_d[idx] = D_TYPE(v / denom);
21 |     }
22 | }
23 | 


--------------------------------------------------------------------------------
/examples/command.wasm/README.md:
--------------------------------------------------------------------------------
 1 | # command.wasm
 2 | 
 3 | This is a basic Voice Assistant example that accepts voice commands from the microphone.
 4 | It runs fully in the browser via WebAssembly.
 5 | 
 6 | Online demo: https://whisper.ggerganov.com/command/
 7 | 
 8 | Terminal version: [examples/command](/examples/command)
 9 | 
10 | ## Build instructions
11 | 
12 | ```bash
13 | # build using Emscripten (v3.1.2)
14 | git clone https://github.com/ggerganov/whisper.cpp
15 | cd whisper.cpp
16 | mkdir build-em && cd build-em
17 | emcmake cmake ..
18 | make -j
19 | 
20 | # copy the produced page to your HTTP path
21 | cp bin/command.wasm/*       /path/to/html/
22 | cp bin/libcommand.worker.js /path/to/html/
23 | ```
24 | 


--------------------------------------------------------------------------------
/ggml/include/ggml-blas.h:
--------------------------------------------------------------------------------
 1 | #pragma once
 2 | 
 3 | #include "ggml.h"
 4 | #include "ggml-backend.h"
 5 | 
 6 | 
 7 | #ifdef  __cplusplus
 8 | extern "C" {
 9 | #endif
10 | 
11 | // backend API
12 | GGML_BACKEND_API ggml_backend_t ggml_backend_blas_init(void);
13 | 
14 | GGML_BACKEND_API bool ggml_backend_is_blas(ggml_backend_t backend);
15 | 
16 | // number of threads used for conversion to float
17 | // for openblas and blis, this will also set the number of threads used for blas operations
18 | GGML_BACKEND_API void ggml_backend_blas_set_n_threads(ggml_backend_t backend_blas, int n_threads);
19 | 
20 | GGML_BACKEND_API ggml_backend_reg_t ggml_backend_blas_reg(void);
21 | 
22 | 
23 | #ifdef  __cplusplus
24 | }
25 | #endif
26 | 


--------------------------------------------------------------------------------
/ggml/include/ggml-opencl.h:
--------------------------------------------------------------------------------
 1 | #ifndef GGML_OPENCL_H
 2 | #define GGML_OPENCL_H
 3 | 
 4 | #include "ggml.h"
 5 | #include "ggml-backend.h"
 6 | 
 7 | #ifdef  __cplusplus
 8 | extern "C" {
 9 | #endif
10 | 
11 | //
12 | // backend API
13 | //
14 | GGML_BACKEND_API ggml_backend_t ggml_backend_opencl_init(void);
15 | GGML_BACKEND_API bool ggml_backend_is_opencl(ggml_backend_t backend);
16 | 
17 | GGML_BACKEND_API ggml_backend_buffer_type_t ggml_backend_opencl_buffer_type(void);
18 | GGML_BACKEND_API ggml_backend_buffer_type_t ggml_backend_opencl_host_buffer_type(void);
19 | 
20 | GGML_BACKEND_API ggml_backend_reg_t ggml_backend_opencl_reg(void);
21 | 
22 | #ifdef  __cplusplus
23 | }
24 | #endif
25 | 
26 | #endif // GGML_OPENCL_H
27 | 


--------------------------------------------------------------------------------
/SDL2/README.txt:
--------------------------------------------------------------------------------
 1 | 
 2 |                          Simple DirectMedia Layer
 3 | 
 4 |                                   (SDL)
 5 | 
 6 |                                 Version 2.0
 7 | 
 8 | ---
 9 | https://www.libsdl.org/
10 | 
11 | Simple DirectMedia Layer is a cross-platform development library designed
12 | to provide low level access to audio, keyboard, mouse, joystick, and graphics
13 | hardware via OpenGL and Direct3D. It is used by video playback software,
14 | emulators, and popular games including Valve's award winning catalog
15 | and many Humble Bundle games.
16 | 
17 | More extensive documentation is available in the docs directory, starting
18 | with README.md
19 | 
20 | Enjoy!
21 | 	Sam Lantinga				(slouken@libsdl.org)
22 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-kompute/kompute-shaders/op_getrows.comp:
--------------------------------------------------------------------------------
 1 | void main() { // each workgroup fills one output row; the source row index is read from inB
 2 |     const uint i = gl_WorkGroupID.x;
 3 |     const int r = inB[i + pcs.inBOff]; // source row index for output row i
 4 |     // NOTE(review): z restarts at 0 in every invocation, independent of gl_LocalInvocationID.x, so a workgroup size above 1 would make invocations write the same output slots — presumably the including shader uses local_size_x = 1; confirm.
 5 |     int z = 0; // number of values written so far by this invocation
 6 |     for (uint ind = gl_LocalInvocationID.x; ind < pcs.ne00/16; ind += gl_WorkGroupSize.x) {
 7 |         const uint inIndex = (r * pcs.nb01 + pcs.inAOff) + ind/NL * SIZE_OF_BLOCK;
 8 |         const mat4 result = dequantize_block(inIndex, ind%NL); // 16 values per call; helper is defined outside this file
 9 |         for (uint j = 0; j < 4; ++j) {
10 |             for (uint k = 0; k < 4; ++k) {
11 |                 const uint outIndex = i * pcs.nb1/BYTES_FOR_TYPE + pcs.outOff + z;
12 |                 out_[outIndex] = result[j][k];
13 |                 ++z;
14 |             }
15 |         }
16 |     }
17 | }
18 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/leaky_relu.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "generic_head.comp"
 4 | #include "types.comp"
 5 | 
 6 | #extension GL_EXT_control_flow_attributes : enable
 7 | 
 8 | layout(local_size_x = 512, local_size_y = 1, local_size_z = 1) in;
 9 | 
10 | layout (binding = 0) readonly buffer X {A_TYPE data_a[];};
11 | layout (binding = 1) writeonly buffer D {D_TYPE data_d[];};
12 | // Leaky ReLU: data_d[idx] = max(v, 0) + min(v, 0) * p.param1, for idx below p.KX.
13 | void main() {
14 |     const uint idx = gl_GlobalInvocationID.z * 262144 + gl_GlobalInvocationID.y * 512 + gl_GlobalInvocationID.x;
15 | 
16 |     // Invocations past the last element have nothing to do.
17 |     if (idx < p.KX) {
18 |         const float v = float(data_a[idx]);
19 |         // The positive part passes through; the negative part is scaled by p.param1.
20 |         data_d[idx] = D_TYPE(max(v, 0.0f) + min(v, 0.0f) * p.param1);
21 |     }
22 | }
23 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cuda/mmv.cuh:
--------------------------------------------------------------------------------
 1 | #include "common.cuh"
 2 | 
 3 | // maximum number of src0 rows with which to use mul_mat_vec over cuBLAS if FP16 tensor cores are available
 4 | #define MMV_MAX_ROWS 512
 5 | 
 6 | void ggml_cuda_mul_mat_vec(ggml_backend_cuda_context & ctx, const ggml_tensor * src0, const ggml_tensor * src1, ggml_tensor * dst);
 7 | 
 8 | void ggml_cuda_op_mul_mat_vec(
 9 |     ggml_backend_cuda_context & ctx,
10 |     const ggml_tensor * src0, const ggml_tensor * src1, ggml_tensor * dst, const char * src0_dd_i, const float * src1_ddf_i,
11 |     const char * src1_ddq_i, float * dst_dd_i, const int64_t row_low, const int64_t row_high, const int64_t src1_ncols,
12 |     const int64_t src1_padded_row_size, cudaStream_t stream);
13 | 


--------------------------------------------------------------------------------
/bindings/javascript/package.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "name": "whisper.cpp",
 3 |   "version": "1.7.4",
 4 |   "description": "Whisper speech recognition",
 5 |   "main": "whisper.js",
 6 |   "scripts": {
 7 |     "test": "echo \"todo: add tests\" && exit 0"
 8 |   },
 9 |   "repository": {
10 |     "type": "git",
11 |     "url": "git+https://github.com/ggerganov/whisper.cpp"
12 |   },
13 |   "keywords": [
14 |     "openai",
15 |     "whisper",
16 |     "speech-to-text",
17 |     "speech-recognition",
18 |     "transformer"
19 |   ],
20 |   "author": "Georgi Gerganov",
21 |   "license": "MIT",
22 |   "bugs": {
23 |     "url": "https://github.com/ggerganov/whisper.cpp/issues"
24 |   },
25 |   "homepage": "https://github.com/ggerganov/whisper.cpp#readme"
26 | }
27 | 


--------------------------------------------------------------------------------
/examples/deprecation-warning/README.md:
--------------------------------------------------------------------------------
 1 | # Migration notice for binary filenames
 2 | 
 3 | > [!IMPORTANT]
 4 | > [2024 Dec 20] Binaries have been renamed with a `whisper-` prefix. `main` is now `whisper-cli`, `server` is `whisper-server`, etc. (https://github.com/ggerganov/whisper.cpp/pull/2648)
 5 | 
 6 | This migration was important, but it is a breaking change that may not always be immediately obvious to users.
 7 | 
 8 | Please update all scripts and workflows to use the new binary names.
 9 | 
10 | | Old Filename | New Filename |
11 | | ---- | ---- |
12 | | main | whisper-cli |
13 | | bench | whisper-bench |
14 | | stream | whisper-stream |
15 | | command | whisper-command |
16 | | server | whisper-server |
17 | | talk-llama | whisper-talk-llama |
18 | 


--------------------------------------------------------------------------------
/examples/talk-llama/unicode-data.h:
--------------------------------------------------------------------------------
 1 | #pragma once
 2 | 
 3 | #include <cstdint>
 4 | #include <vector>
 5 | #include <unordered_map>
 6 | #include <unordered_set>
 7 | // NOTE(review): presumably a codepoint range [first, last] together with its NFD mapping `nfd` — confirm against the table definitions.
 8 | struct range_nfd {
 9 |     uint32_t first;
10 |     uint32_t last;
11 |     uint32_t nfd;
12 | };
13 | 
14 | static const uint32_t MAX_CODEPOINTS = 0x110000;
15 | // NOTE(review): std::initializer_list and std::pair are used below, but <initializer_list> and <utility> are not included by this header; it relies on transitive includes.
16 | extern const std::initializer_list<std::pair<uint32_t, uint16_t>> unicode_ranges_flags;
17 | extern const std::unordered_set<uint32_t> unicode_set_whitespace;
18 | extern const std::initializer_list<std::pair<uint32_t, uint32_t>> unicode_map_lowercase;
19 | extern const std::initializer_list<std::pair<uint32_t, uint32_t>> unicode_map_uppercase;
20 | extern const std::initializer_list<range_nfd> unicode_ranges_nfd;
21 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-kompute/kompute-shaders/op_gelu.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "common.comp"
 4 | 
 5 | layout(local_size_x = 1) in;
 6 | 
 7 | layout(binding = 0) buffer restrict readonly tensorIn { float in_[]; };
 8 | layout(binding = 1) buffer restrict writeonly tensorOut { float out_[]; };
 9 | layout(push_constant) uniform PushConstants {
10 |     uint inOff;
11 |     uint outOff;
12 | } pcs;
13 | // Tanh-based GELU over floats: each workgroup handles 8 consecutive elements.
14 | void main() {
15 |     const uint first = gl_WorkGroupID.x * 8;
16 | 
17 |     for (uint k = 0; k < 8; ++k) {
18 |         const uint idx = first + k;
19 |         const float v = in_[pcs.inOff + idx];
20 |         out_[pcs.outOff + idx] = 0.5*v*(1.0 + tanh(clamp(SQRT_2_OVER_PI*v*(1.0 + GELU_COEF_A*v*v), -15.0, 15.0)));
21 |     }
22 | }
23 | 


--------------------------------------------------------------------------------
/bindings/java/src/main/java/io/github/ggerganov/whispercpp/params/BeamSearchParams.java:
--------------------------------------------------------------------------------
 1 | package io.github.ggerganov.whispercpp.params;
 2 | 
 3 | import com.sun.jna.Structure;
 4 | 
 5 | import java.util.Arrays;
 6 | import java.util.List;
 7 | /** JNA {@link Structure} carrying the two beam-search settings, {@code beam_size} and {@code patience}. */
 8 | public class BeamSearchParams extends Structure {
 9 |     /** ref: <a href="https://github.com/openai/whisper/blob/f82bc59f5ea234d4b97fb2860842ed38519f7e65/whisper/transcribe.py#L265">...</a> */
10 |     public int beam_size;
11 | 
12 |     /** ref: <a href="https://arxiv.org/pdf/2204.05424.pdf">...</a> */
13 |     public float patience;
14 |     /** Returns the field names in declaration order; keep this list in sync with the fields above. */
15 |     @Override
16 |     protected List<String> getFieldOrder() {
17 |         return Arrays.asList("beam_size", "patience");
18 |     }
19 | }
20 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-sycl/rope.hpp:
--------------------------------------------------------------------------------
 1 | //
 2 | // MIT license
 3 | // Copyright (C) 2024 Intel Corporation
 4 | // SPDX-License-Identifier: MIT
 5 | //
 6 | 
 7 | //
 8 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 9 | // See https://llvm.org/LICENSE.txt for license information.
10 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
11 | //
12 | 
13 | #ifndef GGML_SYCL_ROPE_HPP
14 | #define GGML_SYCL_ROPE_HPP
15 | 
16 | #include "common.hpp"
17 | 
18 | void ggml_sycl_op_rope(
19 |     ggml_backend_sycl_context & ctx, const ggml_tensor *src0, const ggml_tensor *src1, ggml_tensor *dst,
20 |     const float *src0_dd, const float *src1_dd, float *dst_dd, const queue_ptr &main_stream);
21 | 
22 | #endif // GGML_SYCL_ROPE_HPP
23 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/scale.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "types.comp"
 4 | #include "generic_unary_head.comp"
 5 | 
 6 | const uint num_threads = 128;
 7 | 
 8 | layout(local_size_x = num_threads, local_size_y = 1, local_size_z = 1) in;
 9 | // Scales every element by p.param1: data_d = data_a * p.param1, for indices below p.ne.
10 | void main() {
11 |     // num_threads * num_iter must equal 512, to match the wg_denoms and get_idx calculation
12 |     const uint num_iter = 4;
13 |     uint idx = get_idx();
14 | 
15 |     [[unroll]] for (uint iter = 0; iter < num_iter; ++iter) {
16 |         // Once idx reaches p.ne it is no longer advanced, so every remaining
17 |         // iteration falls through without storing anything.
18 |         if (idx < p.ne) {
19 |             const FLOAT_TYPE scaled = FLOAT_TYPE(data_a[get_aoffset() + idx]) * FLOAT_TYPE(p.param1);
20 |             data_d[get_doffset() + idx] = D_TYPE(scaled);
21 |             idx += num_threads;
22 |         }
23 |     }
24 | }
25 | 


--------------------------------------------------------------------------------
/bindings/CMakeLists.txt:
--------------------------------------------------------------------------------
 1 | if (EMSCRIPTEN)
 2 |     add_subdirectory(javascript)
 3 |     # Publishes the npm module and records the run in publish.log (the stamp file the target depends on).
 4 |     add_custom_command(
 5 |         OUTPUT ${CMAKE_CURRENT_SOURCE_DIR}/javascript/publish.log
 6 |         DEPENDS ${CMAKE_CURRENT_SOURCE_DIR}/javascript/whisper.js
 7 |         DEPENDS ${CMAKE_CURRENT_SOURCE_DIR}/javascript/libwhisper.worker.js
 8 |         DEPENDS ${CMAKE_CURRENT_SOURCE_DIR}/javascript/package.json
 9 |         WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR}/javascript
10 |         COMMAND npm publish
11 |         COMMAND ${CMAKE_COMMAND} -E touch publish.log
12 |         COMMENT "Publishing npm module v${PROJECT_VERSION}"
13 |         VERBATIM
14 |         )
15 |     # Use the same absolute path as OUTPUT above so the dependency always resolves to that custom command.
16 |     add_custom_target(publish-npm
17 |         DEPENDS ${CMAKE_CURRENT_SOURCE_DIR}/javascript/publish.log
18 |         )
19 | endif()
20 | 


--------------------------------------------------------------------------------
/bindings/go/examples/go-whisper/color.go:
--------------------------------------------------------------------------------
 1 | package main
 2 | 
 3 | import "fmt"
 4 | 
 5 | ///////////////////////////////////////////////////////////////////////////////
 6 | // CONSTANTS
 7 | 
 8 | const (
 9 | 	Reset     = "\033[0m"
10 | 	RGBPrefix = "\033[38;5;" // 8-bit (256-color) foreground selector; followed by a palette index in decimal
11 | 	RGBSuffix = "m"
12 | )
13 | 
14 | ///////////////////////////////////////////////////////////////////////////////
15 | // PUBLIC METHODS
16 | 
17 | // Colorize wraps text in the ANSI escape sequence for one of the 24 grayscale
18 | // shades of the 8-bit palette and appends the reset sequence. v selects the
19 | // shade and is reduced modulo 24, so any integer, including a negative one,
20 | // maps onto the range 0 to 23.
21 | func Colorize(text string, v int) string {
22 | 	// https://en.wikipedia.org/wiki/ANSI_escape_code#8-bit
23 | 	// Grayscale colors are in the range 232-255
24 | 	// Go's % keeps the sign of the dividend, so normalise the remainder to be
25 | 	// non-negative before offsetting into the grayscale block.
26 | 	shade := ((v % 24) + 24) % 24
27 | 	return RGBPrefix + fmt.Sprint(shade+232) + RGBSuffix + text + Reset
28 | }
29 | 


--------------------------------------------------------------------------------
/.devops/cublas.Dockerfile:
--------------------------------------------------------------------------------
 1 | ARG UBUNTU_VERSION=22.04
 2 | 
 3 | # This needs to generally match the container host's environment.
 4 | ARG CUDA_VERSION=11.7.1
 5 | 
 6 | # Target the CUDA build image
 7 | ARG BASE_CUDA_DEV_CONTAINER=nvidia/cuda:${CUDA_VERSION}-devel-ubuntu${UBUNTU_VERSION}
 8 | 
 9 | FROM ${BASE_CUDA_DEV_CONTAINER} AS build
10 | 
11 | # Unless otherwise specified, we make a fat build.
12 | ARG CUDA_DOCKER_ARCH=all
13 | 
14 | RUN apt-get update && \
15 |     apt-get install -y build-essential git cmake libsdl2-dev wget
16 | 
17 | WORKDIR /app
18 | 
19 | COPY . .
20 | 
21 | # Set nvcc architecture
22 | ENV CUDA_DOCKER_ARCH=${CUDA_DOCKER_ARCH}
23 | # Enable cuBLAS
24 | ENV GGML_CUDA=1
25 | 
26 | RUN make base.en
27 | # NOTE(review): binaries were renamed with a `whisper-` prefix (see examples/deprecation-warning); confirm that the build still produces /app/main.
28 | ENTRYPOINT ["/app/main"]
29 | 


--------------------------------------------------------------------------------
/bindings/javascript/package-tmpl.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "name": "whisper.cpp",
 3 |   "version": "@PROJECT_VERSION@",
 4 |   "description": "Whisper speech recognition",
 5 |   "main": "whisper.js",
 6 |   "scripts": {
 7 |     "test": "echo \"todo: add tests\" && exit 0"
 8 |   },
 9 |   "repository": {
10 |     "type": "git",
11 |     "url": "git+https://github.com/ggerganov/whisper.cpp"
12 |   },
13 |   "keywords": [
14 |     "openai",
15 |     "whisper",
16 |     "speech-to-text",
17 |     "speech-recognition",
18 |     "transformer"
19 |   ],
20 |   "author": "Georgi Gerganov",
21 |   "license": "MIT",
22 |   "bugs": {
23 |     "url": "https://github.com/ggerganov/whisper.cpp/issues"
24 |   },
25 |   "homepage": "https://github.com/ggerganov/whisper.cpp#readme"
26 | }
27 | 


--------------------------------------------------------------------------------
/SDL2/docs/README-git.md:
--------------------------------------------------------------------------------
 1 | git
 2 | =========
 3 | 
 4 | The latest development version of SDL is available via git.
 5 | Git allows you to get up-to-the-minute fixes and enhancements;
 6 | as a developer works on a source tree, you can use "git" to mirror that
 7 | source tree instead of waiting for an official release. Please look
 8 | at the Git website ( https://git-scm.com/ ) for more
 9 | information on using git, where you can also download software for
10 | macOS, Windows, and Unix systems.
11 | 
12 |     git clone https://github.com/libsdl-org/SDL
13 | 
14 | If you are building SDL via configure, you will need to run autogen.sh
15 | before running configure.
16 | 
17 | There is a web interface to the Git repository at:
18 | 	http://github.com/libsdl-org/SDL/
19 | 
20 | 


--------------------------------------------------------------------------------
/bindings/java/src/test/java/io/github/ggerganov/whispercpp/WhisperJnaLibraryTest.java:
--------------------------------------------------------------------------------
 1 | package io.github.ggerganov.whispercpp;
 2 | 
 3 | import static org.junit.jupiter.api.Assertions.*;
 4 | 
 5 | import org.junit.jupiter.api.Test;
 6 | /** Smoke test: checks that {@code whisper_print_system_info()} can be called through {@code WhisperCppJnaLibrary.instance}. */
 7 | class WhisperJnaLibraryTest {
 8 |     // Prints the reported system info and only requires it to be longer than 10 characters.
 9 |     @Test
10 |     void testWhisperPrint_system_info() {
11 |         String systemInfo = WhisperCppJnaLibrary.instance.whisper_print_system_info();
12 |         // eg: "AVX = 1 | AVX2 = 1 | AVX512 = 0 | FMA = 1 | NEON = 0 | ARM_FMA = 0 | F16C = 1 | FP16_VA = 0
13 |         //    | WASM_SIMD = 0 | BLAS = 0 | SSE3 = 1 | VSX = 0 | COREML = 0 | "
14 |         System.out.println("System info: " + systemInfo);
15 |         assertTrue(systemInfo.length() > 10);
16 |     }
17 | }
18 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-sycl/getrows.hpp:
--------------------------------------------------------------------------------
 1 | //
 2 | // MIT license
 3 | // Copyright (C) 2024 Intel Corporation
 4 | // SPDX-License-Identifier: MIT
 5 | //
 6 | 
 7 | //
 8 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 9 | // See https://llvm.org/LICENSE.txt for license information.
10 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
11 | //
12 | 
13 | #ifndef GGML_SYCL_GETROWS_HPP
14 | #define GGML_SYCL_GETROWS_HPP
15 | 
16 | #include "common.hpp"
17 | 
18 | void ggml_sycl_op_get_rows(ggml_backend_sycl_context & ctx, const ggml_tensor *src0,
19 |     const ggml_tensor *src1, ggml_tensor *dst,
20 |     const float *src0_d, const float *src1_d,
21 |     float *dst_d, const queue_ptr &stream);
22 | 
23 | #endif // GGML_SYCL_GETROWS_HPP
24 | 


--------------------------------------------------------------------------------
/examples/wchess/wchess.wasm/chessboardjs-1.0.0/css/chessboard-1.0.0.min.css:
--------------------------------------------------------------------------------
1 | /*! chessboard.js v1.0.0 | (c) 2019 Chris Oakman | MIT License chessboardjs.com/license */
2 | .clearfix-7da63{clear:both}.board-b72b1{border:2px solid #404040;box-sizing:content-box}.square-55d63{float:left;position:relative;-webkit-touch-callout:none;-webkit-user-select:none;-khtml-user-select:none;-moz-user-select:none;-ms-user-select:none;user-select:none}.white-1e1d7{background-color:#f0d9b5;color:#b58863}.black-3c85d{background-color:#b58863;color:#f0d9b5}.highlight1-32417,.highlight2-9c5d2{box-shadow:inset 0 0 3px 3px #ff0}.notation-322f9{cursor:default;font-family:"Helvetica Neue",Helvetica,Arial,sans-serif;font-size:14px;position:absolute}.alpha-d2270{bottom:1px;right:3px}.numeric-fc462{top:2px;left:2px}


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/gelu_quick.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "generic_head.comp"
 4 | #include "types.comp"
 5 | 
 6 | #extension GL_EXT_control_flow_attributes : enable
 7 | 
 8 | layout(local_size_x = 512, local_size_y = 1, local_size_z = 1) in;
 9 | 
10 | layout (binding = 0) readonly buffer X {A_TYPE data_a[];};
11 | layout (binding = 1) writeonly buffer D {D_TYPE data_d[];};
12 | // Quick GELU: data_d[idx] = v / (1 + exp(-1.702 * v)) with v = float(data_a[idx]), for idx below p.KX.
13 | void main() {
14 |     const float GELU_QUICK_COEF = -1.702f;
15 |     const uint idx = gl_GlobalInvocationID.z * 262144 + gl_GlobalInvocationID.y * 512 + gl_GlobalInvocationID.x;
16 | 
17 |     // Invocations past the last element have nothing to do.
18 |     if (idx < p.KX) {
19 |         const float v    = float(data_a[idx]);
20 |         const float gate = 1.0f / (1.0f + exp(GELU_QUICK_COEF * v));
21 |         data_d[idx] = D_TYPE(v * gate);
22 |     }
23 | }
24 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-sycl/im2col.hpp:
--------------------------------------------------------------------------------
 1 | //
 2 | // MIT license
 3 | // Copyright (C) 2024 Intel Corporation
 4 | // SPDX-License-Identifier: MIT
 5 | //
 6 | 
 7 | //
 8 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 9 | // See https://llvm.org/LICENSE.txt for license information.
10 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
11 | //
12 | 
13 | #ifndef GGML_SYCL_IM2COL_HPP
14 | #define GGML_SYCL_IM2COL_HPP
15 | 
16 | #include "common.hpp"
17 | 
18 | void ggml_sycl_op_im2col(
19 |         ggml_backend_sycl_context & ctx, const ggml_tensor *src0, const ggml_tensor *src1,
20 |         ggml_tensor *dst, const float *src0_dd, const float *src1_dd, float *dst_dd,
21 |         const queue_ptr &main_stream);
22 | 
23 | #endif // GGML_SYCL_IM2COL_HPP
24 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-kompute/kompute-shaders/op_mul_mv_q_n_pre.comp:
--------------------------------------------------------------------------------
 1 | layout(local_size_x_id = 0) in; // x size is taken from specialization constant 0
 2 | layout(local_size_y = 8) in;
 3 | layout(local_size_z = 1) in;
 4 | // Storage buffers: two read-only inputs (bytes and floats) and one write-only float output.
 5 | layout (binding = 0) readonly buffer tensorInA { uint8_t inA[]; };
 6 | layout (binding = 1) readonly buffer tensorInB { float inB[]; };
 7 | layout (binding = 2) writeonly buffer tensorOut { float out_[]; };
 8 | // NOTE(review): the field meanings are not visible here; ne*/nb* presumably follow ggml's element-count / byte-stride naming — confirm against the host code.
 9 | layout (push_constant) uniform parameter {
10 |     uint inAOff;
11 |     uint inBOff;
12 |     uint outOff;
13 |     int  ne00;
14 |     int  ne01;
15 |     int  ne02;
16 |     int  ne10;
17 |     int  ne12;
18 |     int  ne0;
19 |     int  ne1;
20 |     uint nb01;
21 |     uint nb02;
22 |     uint nb03;
23 |     uint nb11;
24 |     uint nb12;
25 |     uint nb13;
26 |     uint r2;
27 |     uint r3;
28 | } pcs;
29 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-kompute/kompute-shaders/op_addrow.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "common.comp"
 4 | 
 5 | layout(local_size_x = 1) in;
 6 | 
 7 | layout(binding = 0) buffer restrict readonly tensorInA { float inA[]; };
 8 | layout(binding = 1) buffer restrict readonly tensorInB { float inB[]; };
 9 | layout(binding = 2) buffer restrict writeonly tensorOut { float out_[]; };
10 | 
11 | layout(push_constant) uniform PushConstants {
12 |     uint inAOff;
13 |     uint inBOff;
14 |     uint outOff;
15 |     uint row;
16 | } pcs;
17 | 
// Each workgroup handles four consecutive elements: out_ = inA + inB, where
// the index into inB wraps around every pcs.row elements.
void main() {
    const uint first = gl_WorkGroupID.x * 4;

    for (uint k = 0; k < 4; ++k) {
        const uint elem = first + k;

        const float lhs = inA[elem + pcs.inAOff];
        const float rhs = inB[(elem % pcs.row) + pcs.inBOff];

        out_[elem + pcs.outOff] = lhs + rhs;
    }
}
26 | 


--------------------------------------------------------------------------------
/SDL2/include/SDL_opengles2_gl2platform.h:
--------------------------------------------------------------------------------
 1 | #ifndef __gl2platform_h_
 2 | #define __gl2platform_h_
 3 | 
 4 | /*
 5 | ** Copyright 2017-2020 The Khronos Group Inc.
 6 | ** SPDX-License-Identifier: Apache-2.0
 7 | */
 8 | 
 9 | /* Platform-specific types and definitions for OpenGL ES 2.X  gl2.h
10 |  *
11 |  * Adopters may modify khrplatform.h and this file to suit their platform.
12 |  * Please contribute modifications back to Khronos as pull requests on the
13 |  * public github repository:
14 |  *      https://github.com/KhronosGroup/OpenGL-Registry
15 |  */
16 | 
17 | /*#include <KHR/khrplatform.h>*/
18 | 
19 | #ifndef GL_APICALL
20 | #define GL_APICALL  KHRONOS_APICALL
21 | #endif
22 | 
23 | #ifndef GL_APIENTRY
24 | #define GL_APIENTRY KHRONOS_APIENTRY
25 | #endif
26 | 
27 | #endif /* __gl2platform_h_ */
28 | 


--------------------------------------------------------------------------------
/examples/sycl/build.sh:
--------------------------------------------------------------------------------
 1 | #  MIT license
 2 | #  Copyright (C) 2024 Intel Corporation
 3 | #  SPDX-License-Identifier: MIT
 4 | 
 5 | mkdir -p build
 6 | cd build
 7 | source /opt/intel/oneapi/setvars.sh
 8 | 
 9 | #for FP16
10 | #cmake .. -DGGML_SYCL=ON -DCMAKE_C_COMPILER=icx -DCMAKE_CXX_COMPILER=icpx -DWHISPER_SYCL_F16=ON # faster for long-prompt inference
11 | 
12 | #for FP32
13 | cmake .. -DGGML_SYCL=ON -DCMAKE_C_COMPILER=icx -DCMAKE_CXX_COMPILER=icpx
14 | 
15 | #for other features from the examples, e.g. stream and talk link with SDL2:
16 | #cmake .. -DGGML_SYCL=ON -DWHISPER_SDL2=ON -DCMAKE_C_COMPILER=icx -DCMAKE_CXX_COMPILER=icpx
17 | 
18 | #build example/main only
19 | #cmake --build . --config Release --target main
20 | 
21 | #build all binary
22 | cmake --build . --config Release -v
23 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-cann/kernels/ascendc_kernels.h:
--------------------------------------------------------------------------------
 1 | #ifndef ASCENDC_KERNELS_H
 2 | #define ASCENDC_KERNELS_H
 3 | 
 4 | #include "aclrtlaunch_ascendc_get_row_f32.h"
 5 | #include "aclrtlaunch_ascendc_get_row_f16.h"
 6 | #include "aclrtlaunch_ascendc_get_row_q8_0.h"
 7 | #include "aclrtlaunch_ascendc_get_row_q4_0.h"
 8 | 
 9 | #include "aclrtlaunch_ascendc_quantize_f32_q8_0.h"
10 | #include "aclrtlaunch_ascendc_quantize_f16_q8_0.h"
11 | #include "aclrtlaunch_ascendc_quantize_f16_to_q4_0.h"
12 | #include "aclrtlaunch_ascendc_quantize_f32_to_q4_0.h"
13 | 
14 | #include "aclrtlaunch_ascendc_dup_by_rows_fp16.h"
15 | #include "aclrtlaunch_ascendc_dup_by_rows_fp32.h"
16 | #include "aclrtlaunch_ascendc_dup_by_rows_fp32_to_fp16.h"
17 | #include "aclrtlaunch_ascendc_dup_by_rows_fp16_to_fp32.h"
18 | 
19 | #endif  // ASCENDC_KERNELS_H
20 | 


--------------------------------------------------------------------------------
/src/coreml/whisper-encoder.h:
--------------------------------------------------------------------------------
 1 | // Wrapper of the Core ML Whisper Encoder model
 2 | //
 3 | // Code is derived from the work of Github user @wangchou
 4 | // ref: https://github.com/wangchou/callCoreMLFromCpp
 5 | 
 6 | #include <stdint.h>
 7 | 
 8 | #if __cplusplus
 9 | extern "C" {
10 | #endif
11 | 
12 | struct whisper_coreml_context;
13 | 
14 | struct whisper_coreml_context * whisper_coreml_init(const char * path_model);
15 | void whisper_coreml_free(struct whisper_coreml_context * ctx);
16 | 
// Runs the Core ML encoder held by `ctx`.
//   ctx   - context obtained from whisper_coreml_init()
//   n_ctx - passed through to the encoder (presumably the number of frames -- TODO confirm)
//   n_mel - passed through to the encoder (presumably the number of mel bins -- TODO confirm)
//   mel   - input buffer
//   out   - output buffer
//
// The context type is spelled with its `struct` tag so that this header also
// compiles when included from C; the extern "C" guard around these
// declarations implies C consumers, and a bare tag name is only valid in C++.
void whisper_coreml_encode(
        const struct whisper_coreml_context * ctx,
                                    int64_t   n_ctx,
                                    int64_t   n_mel,
                                      float * mel,
                                      float * out);
23 | 
24 | #if __cplusplus
25 | }
26 | #endif
27 | 


--------------------------------------------------------------------------------
/SDL2/docs/README-pandora.md:
--------------------------------------------------------------------------------
 1 | Pandora
 2 | =====================================================================
 3 | 
 4 | ( http://openpandora.org/ )
 5 | - A pandora specific video driver was written to allow SDL 2.0 with OpenGL ES
 6 | support to work on the pandora under the framebuffer. This driver does not have
 7 | input support for now, so if you use it you will have to add your own control code.
 8 | The video driver name is "pandora", so if you have problems running it from
 9 | the framebuffer, try setting the following variable before starting your application:
10 | "export SDL_VIDEODRIVER=pandora"
11 | 
12 | - OpenGL ES support was added to the x11 driver, so it works like the normal
13 | x11 driver with OpenGLX support, SDL input events, etc.
14 | 
15 | 
16 | David Carré (Cpasjuste)
17 | cpasjuste@gmail.com
18 | 


--------------------------------------------------------------------------------
/cmake/git-vars.cmake:
--------------------------------------------------------------------------------
 1 | find_package(Git)
 2 | 
 3 | # the commit's SHA1
 4 | execute_process(COMMAND
 5 |     "${GIT_EXECUTABLE}" describe --match=NeVeRmAtCh --always --abbrev=8
 6 |     WORKING_DIRECTORY "${CMAKE_SOURCE_DIR}"
 7 |     OUTPUT_VARIABLE GIT_SHA1
 8 |     ERROR_QUIET OUTPUT_STRIP_TRAILING_WHITESPACE)
 9 | 
10 | # the date of the commit
11 | execute_process(COMMAND
12 |     "${GIT_EXECUTABLE}" log -1 --format=%ad --date=local
13 |     WORKING_DIRECTORY "${CMAKE_SOURCE_DIR}"
14 |     OUTPUT_VARIABLE GIT_DATE
15 |     ERROR_QUIET OUTPUT_STRIP_TRAILING_WHITESPACE)
16 | 
17 | # the subject of the commit
18 | execute_process(COMMAND
19 |     "${GIT_EXECUTABLE}" log -1 --format=%s
20 |     WORKING_DIRECTORY "${CMAKE_SOURCE_DIR}"
21 |     OUTPUT_VARIABLE GIT_COMMIT_SUBJECT
22 |     ERROR_QUIET OUTPUT_STRIP_TRAILING_WHITESPACE)
23 | 


--------------------------------------------------------------------------------
/ggml/cmake/GitVars.cmake:
--------------------------------------------------------------------------------
 1 | find_package(Git)
 2 | 
 3 | # the commit's SHA1
 4 | execute_process(COMMAND
 5 |     "${GIT_EXECUTABLE}" describe --match=NeVeRmAtCh --always --abbrev=8
 6 |     WORKING_DIRECTORY "${CMAKE_SOURCE_DIR}"
 7 |     OUTPUT_VARIABLE GIT_SHA1
 8 |     ERROR_QUIET OUTPUT_STRIP_TRAILING_WHITESPACE)
 9 | 
10 | # the date of the commit
11 | execute_process(COMMAND
12 |     "${GIT_EXECUTABLE}" log -1 --format=%ad --date=local
13 |     WORKING_DIRECTORY "${CMAKE_SOURCE_DIR}"
14 |     OUTPUT_VARIABLE GIT_DATE
15 |     ERROR_QUIET OUTPUT_STRIP_TRAILING_WHITESPACE)
16 | 
17 | # the subject of the commit
18 | execute_process(COMMAND
19 |     "${GIT_EXECUTABLE}" log -1 --format=%s
20 |     WORKING_DIRECTORY "${CMAKE_SOURCE_DIR}"
21 |     OUTPUT_VARIABLE GIT_COMMIT_SUBJECT
22 |     ERROR_QUIET OUTPUT_STRIP_TRAILING_WHITESPACE)
23 | 


--------------------------------------------------------------------------------
/bindings/java/src/main/java/io/github/ggerganov/whispercpp/callbacks/WhisperProgressCallback.java:
--------------------------------------------------------------------------------
 1 | package io.github.ggerganov.whispercpp.callbacks;
 2 | 
 3 | import com.sun.jna.Callback;
 4 | import com.sun.jna.Pointer;
 5 | import io.github.ggerganov.whispercpp.WhisperContext;
 6 | import io.github.ggerganov.whispercpp.model.WhisperState;
 7 | 
 8 | /**
 9 |  * Callback for progress updates.
10 |  */
11 | public interface WhisperProgressCallback extends Callback {
12 | 
13 |     /**
14 |      * Callback method for progress updates.
15 |      *
16 |      * @param ctx        The whisper context.
17 |      * @param state      The whisper state.
18 |      * @param progress   The progress value.
19 |      * @param user_data  User data.
20 |      */
21 |     void callback(Pointer ctx, Pointer state, int progress, Pointer user_data);
22 | }
23 | 


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/src/main/AndroidManifest.xml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="utf-8"?>
 2 | <manifest xmlns:android="http://schemas.android.com/apk/res/android"
 3 |   package="com.litongjava.whisper.android.java">
 4 | 
 5 |   <application
 6 |     android:allowBackup="true"
 7 |     android:name=".app.App"
 8 |     android:icon="@mipmap/ic_launcher"
 9 |     android:label="@string/app_name"
10 |     android:roundIcon="@mipmap/ic_launcher_round"
11 |     android:supportsRtl="true"
12 |     android:theme="@style/Theme.Whisperandroidjava">
13 |     <activity android:name=".MainActivity">
14 |       <intent-filter>
15 |         <action android:name="android.intent.action.MAIN" />
16 | 
17 |         <category android:name="android.intent.category.LAUNCHER" />
18 |       </intent-filter>
19 |     </activity>
20 |   </application>
21 | 
22 | </manifest>


--------------------------------------------------------------------------------
/examples/whisper.android/app/src/androidTest/java/com/whispercppdemo/ExampleInstrumentedTest.kt:
--------------------------------------------------------------------------------
 1 | package com.whispercppdemo
 2 | 
 3 | import androidx.test.platform.app.InstrumentationRegistry
 4 | import androidx.test.ext.junit.runners.AndroidJUnit4
 5 | 
 6 | import org.junit.Test
 7 | import org.junit.runner.RunWith
 8 | 
 9 | import org.junit.Assert.*
10 | 
11 | /**
12 |  * Instrumented test, which will execute on an Android device.
13 |  *
14 |  * See [testing documentation](http://d.android.com/tools/testing).
15 |  */
16 | @RunWith(AndroidJUnit4::class)
class ExampleInstrumentedTest {
    /** Verifies that the instrumented target context reports the expected package name. */
    @Test
    fun useAppContext() {
        val targetPackage = InstrumentationRegistry
            .getInstrumentation()
            .targetContext
            .packageName

        assertEquals("com.whispercppdemo", targetPackage)
    }
}


--------------------------------------------------------------------------------
/examples/whisper.android/app/src/main/java/com/whispercppdemo/MainActivity.kt:
--------------------------------------------------------------------------------
 1 | package com.whispercppdemo
 2 | 
 3 | import android.os.Bundle
 4 | import androidx.activity.ComponentActivity
 5 | import androidx.activity.compose.setContent
 6 | import androidx.activity.viewModels
 7 | import com.whispercppdemo.ui.main.MainScreen
 8 | import com.whispercppdemo.ui.main.MainScreenViewModel
 9 | import com.whispercppdemo.ui.theme.WhisperCppDemoTheme
10 | 
/** Activity that sets [MainScreen] as its content, wrapped in [WhisperCppDemoTheme]. */
class MainActivity : ComponentActivity() {
    // View model obtained through the factory exposed by MainScreenViewModel.
    private val viewModel: MainScreenViewModel by viewModels { MainScreenViewModel.factory() }

    override fun onCreate(savedInstanceState: Bundle?) {
        super.onCreate(savedInstanceState)
        setContent { WhisperCppDemoTheme { MainScreen(viewModel) } }
    }
}


--------------------------------------------------------------------------------
/bindings/go/examples/go-model-download/context.go:
--------------------------------------------------------------------------------
 1 | package main
 2 | 
 3 | import (
 4 | 	"context"
 5 | 	"os"
 6 | 	"os/signal"
 7 | )
 8 | 
 9 | // ContextForSignal returns a context object which is cancelled when a signal
10 | // is received. It returns nil if no signal parameter is provided
11 | func ContextForSignal(signals ...os.Signal) context.Context {
12 |     if len(signals) == 0 {
13 |         return nil
14 |     }
15 | 
16 |     ch := make(chan os.Signal, 1) // Buffered channel with space for 1 signal
17 |     ctx, cancel := context.WithCancel(context.Background())
18 | 
19 |     // Send message on channel when signal received
20 |     signal.Notify(ch, signals...)
21 | 
22 |     // When any signal is received, call cancel
23 |     go func() {
24 |         <-ch
25 |         cancel()
26 |     }()
27 | 
28 |     // Return success
29 |     return ctx
30 | }
31 | 
32 | 


--------------------------------------------------------------------------------
/bindings/ruby/ext/ruby_whisper.h:
--------------------------------------------------------------------------------
 1 | #ifndef RUBY_WHISPER_H
 2 | #define RUBY_WHISPER_H
 3 | 
 4 | #include "whisper.h"
 5 | 
 6 | typedef struct {
 7 |   VALUE *context;
 8 |   VALUE user_data;
 9 |   VALUE callback;
10 |   VALUE callbacks;
11 | } ruby_whisper_callback_container;
12 | 
13 | typedef struct {
14 |   struct whisper_context *context;
15 | } ruby_whisper;
16 | 
17 | typedef struct {
18 |   struct whisper_full_params params;
19 |   bool diarize;
20 |   ruby_whisper_callback_container *new_segment_callback_container;
21 |   ruby_whisper_callback_container *progress_callback_container;
22 |   ruby_whisper_callback_container *abort_callback_container;
23 | } ruby_whisper_params;
24 | 
25 | typedef struct {
26 |   VALUE context;
27 |   int index;
28 | } ruby_whisper_segment;
29 | 
30 | typedef struct {
31 |   VALUE context;
32 | } ruby_whisper_model;
33 | 
34 | #endif
35 | 


--------------------------------------------------------------------------------
/examples/whisper.android/app/proguard-rules.pro:
--------------------------------------------------------------------------------
 1 | # Add project specific ProGuard rules here.
 2 | # You can control the set of applied configuration files using the
 3 | # proguardFiles setting in build.gradle.
 4 | #
 5 | # For more details, see
 6 | #   http://developer.android.com/guide/developing/tools/proguard.html
 7 | 
 8 | # If your project uses WebView with JS, uncomment the following
 9 | # and specify the fully qualified class name to the JavaScript interface
10 | # class:
11 | #-keepclassmembers class fqcn.of.javascript.interface.for.webview {
12 | #   public *;
13 | #}
14 | 
15 | # Uncomment this to preserve the line number information for
16 | # debugging stack traces.
17 | #-keepattributes SourceFile,LineNumberTable
18 | 
19 | # If you keep the line number information, uncomment this to
20 | # hide the original source file name.
21 | #-renamesourcefileattribute SourceFile


--------------------------------------------------------------------------------
/scripts/build-info.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/sh
 2 | 
 3 | CC=$1
 4 | 
 5 | build_number="0"
 6 | build_commit="unknown"
 7 | build_compiler="unknown"
 8 | build_target="unknown"
 9 | 
10 | if out=$(git rev-list --count HEAD); then
11 |     # git is broken on WSL so we need to strip extra newlines
12 |     build_number=$(printf '%s' "$out" | tr -d '\n')
13 | fi
14 | 
15 | if out=$(git rev-parse --short HEAD); then
16 |     build_commit=$(printf '%s' "$out" | tr -d '\n')
17 | fi
18 | 
19 | if out=$($CC --version | head -1); then
20 |     build_compiler=$out
21 | fi
22 | 
23 | if out=$($CC -dumpmachine); then
24 |     build_target=$out
25 | fi
26 | 
27 | echo "int WHISPER_BUILD_NUMBER = ${build_number};"
28 | echo "char const *WHISPER_COMMIT = \"${build_commit}\";"
29 | echo "char const *WHISPER_COMPILER = \"${build_compiler}\";"
30 | echo "char const *WHISPER_BUILD_TARGET = \"${build_target}\";"
31 | 


--------------------------------------------------------------------------------
/bindings/java/src/main/java/io/github/ggerganov/whispercpp/params/CBool.java:
--------------------------------------------------------------------------------
 1 | package io.github.ggerganov.whispercpp.params;
 2 | 
 3 | import com.sun.jna.IntegerType;
 4 | 
 5 | import java.util.function.BooleanSupplier;
 6 | 
 7 | public class CBool extends IntegerType implements BooleanSupplier {
 8 |     public static final int SIZE = 1;
 9 |     public static final CBool FALSE = new CBool(0);
10 |     public static final CBool TRUE = new CBool(1);
11 | 
12 | 
13 |     public CBool() {
14 |         this(0);
15 |     }
16 | 
17 |     public CBool(long value) {
18 |         super(SIZE, value, true);
19 |     }
20 | 
21 |     @Override
22 |     public boolean getAsBoolean() {
23 |         return intValue() == 1;
24 |     }
25 | 
26 |     @Override
27 |     public String toString() {
28 |         return intValue() == 1 ? "true" : "false";
29 |     }
30 | }
31 | 


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/proguard-rules.pro:
--------------------------------------------------------------------------------
 1 | # Add project specific ProGuard rules here.
 2 | # You can control the set of applied configuration files using the
 3 | # proguardFiles setting in build.gradle.
 4 | #
 5 | # For more details, see
 6 | #   http://developer.android.com/guide/developing/tools/proguard.html
 7 | 
 8 | # If your project uses WebView with JS, uncomment the following
 9 | # and specify the fully qualified class name to the JavaScript interface
10 | # class:
11 | #-keepclassmembers class fqcn.of.javascript.interface.for.webview {
12 | #   public *;
13 | #}
14 | 
15 | # Uncomment this to preserve the line number information for
16 | # debugging stack traces.
17 | #-keepattributes SourceFile,LineNumberTable
18 | 
19 | # If you keep the line number information, uncomment this to
20 | # hide the original source file name.
21 | #-renamesourcefileattribute SourceFile


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/src/main/res/values/themes.xml:
--------------------------------------------------------------------------------
 1 | <resources xmlns:tools="http://schemas.android.com/tools">
 2 |   <!-- Base application theme. -->
 3 |   <style name="Theme.Whisperandroidjava" parent="Theme.MaterialComponents.DayNight.DarkActionBar">
 4 |     <!-- Primary brand color. -->
 5 |     <item name="colorPrimary">@color/purple_500</item>
 6 |     <item name="colorPrimaryVariant">@color/purple_700</item>
 7 |     <item name="colorOnPrimary">@color/white</item>
 8 |     <!-- Secondary brand color. -->
 9 |     <item name="colorSecondary">@color/teal_200</item>
10 |     <item name="colorSecondaryVariant">@color/teal_700</item>
11 |     <item name="colorOnSecondary">@color/black</item>
12 |     <!-- Status bar color. -->
13 |     <item name="android:statusBarColor" tools:targetApi="l">?attr/colorPrimaryVariant</item>
14 |     <!-- Customize your theme here. -->
15 |   </style>
16 | </resources>


--------------------------------------------------------------------------------
/ggml/src/ggml-kompute/kompute-shaders/op_diagmask.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "common.comp"
 4 | 
 5 | layout(local_size_x = 1) in;
 6 | 
 7 | layout(binding = 0) buffer restrict readonly tensorIn { float in_[]; };
 8 | layout(binding = 1) buffer restrict writeonly tensorOut { float out_[]; };
 9 | 
10 | layout(push_constant) uniform PushConstants {
11 |     uint inOff;
12 |     uint outOff;
13 |     uint n_past;
14 |     int ne00;
15 |     int ne01;
16 | } pcs;
17 | 
// One workgroup per element: copies in_ to out_, except that elements whose
// x index exceeds pcs.n_past plus their y index are replaced by -infinity.
void main() {
    const uint col   = gl_WorkGroupID.x;
    const uint row   = gl_WorkGroupID.y;
    const uint plane = gl_WorkGroupID.z;

    const uint index = plane*pcs.ne01*pcs.ne00 + row*pcs.ne00 + col;

    if (col > pcs.n_past + row) {
        // 0xFF800000 is the IEEE-754 single-precision bit pattern of -infinity.
        out_[index + pcs.outOff] = uintBitsToFloat(0xFF800000);
        return;
    }

    out_[index + pcs.outOff] = in_[index + pcs.inOff];
}
31 | 


--------------------------------------------------------------------------------
/examples/whisper.android.java/app/src/main/res/values-night/themes.xml:
--------------------------------------------------------------------------------
 1 | <resources xmlns:tools="http://schemas.android.com/tools">
 2 |   <!-- Base application theme. -->
 3 |   <style name="Theme.Whisperandroidjava" parent="Theme.MaterialComponents.DayNight.DarkActionBar">
 4 |     <!-- Primary brand color. -->
 5 |     <item name="colorPrimary">@color/purple_200</item>
 6 |     <item name="colorPrimaryVariant">@color/purple_700</item>
 7 |     <item name="colorOnPrimary">@color/black</item>
 8 |     <!-- Secondary brand color. -->
 9 |     <item name="colorSecondary">@color/teal_200</item>
10 |     <item name="colorSecondaryVariant">@color/teal_200</item>
11 |     <item name="colorOnSecondary">@color/black</item>
12 |     <!-- Status bar color. -->
13 |     <item name="android:statusBarColor" tools:targetApi="l">?attr/colorPrimaryVariant</item>
14 |     <!-- Customize your theme here. -->
15 |   </style>
16 | </resources>


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/gelu.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "generic_head.comp"
 4 | #include "types.comp"
 5 | 
 6 | #extension GL_EXT_control_flow_attributes : enable
 7 | 
 8 | layout(local_size_x = 512, local_size_y = 1, local_size_z = 1) in;
 9 | 
10 | layout (binding = 0) readonly buffer X {A_TYPE data_a[];};
11 | layout (binding = 1) writeonly buffer D {D_TYPE data_d[];};
12 | 
// Element-wise GELU (tanh approximation); one invocation per element.
void main() {
    // Flatten the 3D invocation id (512 invocations per row, 512*512 per slice).
    const uint i = gl_GlobalInvocationID.z * 262144 + gl_GlobalInvocationID.y * 512 + gl_GlobalInvocationID.x;

    // Invocations past the end of the input have nothing to do.
    if (i >= p.KX) {
        return;
    }

    const float SQRT_2_OVER_PI = 0.79788456080286535587989211986876f;
    const float GELU_COEF_A    = 0.044715f;

    const float x     = float(data_a[i]);
    const float inner = SQRT_2_OVER_PI*x*(1.0f + GELU_COEF_A*x*x);

    // 2 - 2/(exp(2u) + 1) equals 1 + tanh(u), so this is 0.5*x*(1 + tanh(inner)).
    data_d[i] = D_TYPE(0.5f*x*(2.0f - 2.0f / (exp(2 * inner) + 1)));
}
26 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/silu_back.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "generic_head.comp"
 4 | #include "types.comp"
 5 | 
 6 | #extension GL_EXT_control_flow_attributes : enable
 7 | 
 8 | layout(local_size_x = 512, local_size_y = 1, local_size_z = 1) in;
 9 | 
10 | layout (binding = 0) readonly buffer G {A_TYPE data_g[];};
11 | layout (binding = 1) readonly buffer X {B_TYPE data_x[];};
12 | layout (binding = 2) writeonly buffer D {D_TYPE data_d[];};
13 | 
// Backward pass of SiLU: multiplies the incoming gradient data_g by the
// derivative of SiLU evaluated at data_x; one invocation per element.
void main() {
    const uint i = gl_GlobalInvocationID.z * 262144 + gl_GlobalInvocationID.y * 512 + gl_GlobalInvocationID.x;

    if (i >= p.KX) {
        return;
    }

    // Derivative of SiLU(x) = x*s(x), with s(x) = 1/(1+exp(-x)):
    //   s + x*s*(1-s) = 1/(1+exp(-x)) + x*exp(-x)/(1+exp(-x))^2
    // (the second term is added, since s*(1-s) = exp(-x)/(1+exp(-x))^2)

    const float xi = float(data_x[i]);
    const float s = 1.0f / (1.0f + exp(-xi));
    data_d[i] = D_TYPE(data_g[i] * (s + xi * s * (1 - s)));
}
27 | 


--------------------------------------------------------------------------------
/examples/addon.node/__test__/whisper.spec.js:
--------------------------------------------------------------------------------
 1 | const path = require("path");
 2 | const { whisper } = require(path.join(
 3 |   __dirname,
 4 |   "../../../build/Release/addon.node"
 5 | ));
 6 | const { promisify } = require("util");
 7 | 
 8 | const whisperAsync = promisify(whisper);
 9 | 
10 | const whisperParamsMock = {
11 |   language: "en",
12 |   model: path.join(__dirname, "../../../models/ggml-base.en.bin"),
13 |   fname_inp: path.join(__dirname, "../../../samples/jfk.wav"),
14 |   use_gpu: true,
15 |   flash_attn: false,
16 |   no_prints: true,
17 |   comma_in_time: false,
18 |   translate: true,
19 |   no_timestamps: false,
20 |   audio_ctx: 0,
21 | };
22 | 
// Smoke test: the promisified addon call must resolve to a non-empty result
// within the 10 second timeout.
describe("Run whisper.node", () => {
    test("it should receive a non-empty value", async () => {
        const transcription = await whisperAsync(whisperParamsMock);
        const itemCount = transcription.length;

        expect(itemCount).toBeGreaterThan(0);
    }, 10000);
});
30 | 
31 | 


--------------------------------------------------------------------------------
/examples/talk-llama/llama-sampling.h:
--------------------------------------------------------------------------------
 1 | #pragma once
 2 | 
 3 | // TODO: rename llama-sampling.h/.cpp to llama-sampler.h/.cpp ?
 4 | 
 5 | #include "llama.h"
 6 | 
 7 | #include <vector>
 8 | 
 9 | struct llama_vocab;
10 | struct llama_grammar;
11 | 
12 | // sampler chain
13 | 
14 | struct llama_sampler_chain {
15 |     llama_sampler_chain_params params;
16 | 
17 |     std::vector<struct llama_sampler *> samplers;
18 | 
19 |     // timing
20 | 
21 |     mutable int64_t t_sample_us;
22 | 
23 |     mutable int32_t n_sample;
24 | };
25 | 
26 | struct llama_sampler * llama_sampler_init_dry_testing(
27 |                          int32_t   context_size,
28 |                            float   dry_multiplier,
29 |                            float   dry_base,
30 |                          int32_t   dry_allowed_length,
31 |                          int32_t   dry_penalty_last_n,
32 |   const std::vector<std::vector<llama_token>>& seq_breakers);
33 | 


--------------------------------------------------------------------------------
/examples/whisper.android/.idea/gradle.xml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="UTF-8"?>
 2 | <project version="4">
 3 |   <component name="GradleMigrationSettings" migrationVersion="1" />
 4 |   <component name="GradleSettings">
 5 |     <option name="linkedExternalProjectsSettings">
 6 |       <GradleProjectSettings>
 7 |         <option name="testRunner" value="GRADLE" />
 8 |         <option name="externalProjectPath" value="$PROJECT_DIR$" />
 9 |         <option name="gradleJvm" value="#GRADLE_LOCAL_JAVA_HOME" />
10 |         <option name="modules">
11 |           <set>
12 |             <option value="$PROJECT_DIR$" />
13 |             <option value="$PROJECT_DIR$/app" />
14 |           </set>
15 |         </option>
16 |         <option name="resolveExternalAnnotations" value="false" />
17 |         <option name="resolveModulePerSourceSet" value="false" />
18 |       </GradleProjectSettings>
19 |     </option>
20 |   </component>
21 | </project>


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/div.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "types.comp"
 4 | #include "generic_binary_head.comp"
 5 | 
 6 | const uint num_threads = 256;
 7 | 
 8 | layout(local_size_x = num_threads, local_size_y = 1, local_size_z = 1) in;
 9 | 
// Element-wise division dst = src0 / src1. Each invocation handles up to
// num_iter elements spaced num_threads apart, starting at get_idx().
void main() {
    // num_threads * num_iter must equal 512, to match the wg_denoms and get_idx calculation
    const uint num_iter = 2;

    uint idx = get_idx();

    [[unroll]] for (uint iter = 0; iter < num_iter; ++iter) {
        // Out-of-range elements are skipped; idx is only advanced after a
        // processed element.
        if (idx < p.ne) {
            uint i00, i01, i02, i03;
            get_indices(idx, i00, i01, i02, i03);

            const FLOAT_TYPE numerator   = FLOAT_TYPE(data_a[get_aoffset() + src0_idx(i00, i01, i02, i03)]);
            const FLOAT_TYPE denominator = FLOAT_TYPE(data_b[get_boffset() + src1_idx(i00, i01, i02, i03)]);

            data_d[get_doffset() + dst_idx(i00, i01, i02, i03)] = D_TYPE(numerator / denominator);

            idx += num_threads;
        }
    }
}
28 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/mul.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "types.comp"
 4 | #include "generic_binary_head.comp"
 5 | 
 6 | const uint num_threads = 256;
 7 | 
 8 | layout(local_size_x = num_threads, local_size_y = 1, local_size_z = 1) in;
 9 | 
// Element-wise multiplication dst = src0 * src1. Each invocation handles up
// to num_iter elements spaced num_threads apart, starting at get_idx().
void main() {
    // num_threads * num_iter must equal 512, to match the wg_denoms and get_idx calculation
    const uint num_iter = 2;

    uint idx = get_idx();

    [[unroll]] for (uint iter = 0; iter < num_iter; ++iter) {
        // Out-of-range elements are skipped; idx is only advanced after a
        // processed element.
        if (idx < p.ne) {
            uint i00, i01, i02, i03;
            get_indices(idx, i00, i01, i02, i03);

            const FLOAT_TYPE lhs = FLOAT_TYPE(data_a[get_aoffset() + src0_idx(i00, i01, i02, i03)]);
            const FLOAT_TYPE rhs = FLOAT_TYPE(data_b[get_boffset() + src1_idx(i00, i01, i02, i03)]);

            data_d[get_doffset() + dst_idx(i00, i01, i02, i03)] = D_TYPE(lhs * rhs);

            idx += num_threads;
        }
    }
}
28 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-sycl/mmvq.hpp:
--------------------------------------------------------------------------------
 1 | //
 2 | // MIT license
 3 | // Copyright (C) 2024 Intel Corporation
 4 | // SPDX-License-Identifier: MIT
 5 | //
 6 | 
 7 | //
 8 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 9 | // See https://llvm.org/LICENSE.txt for license information.
10 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
11 | //
12 | 
13 | #ifndef GGML_SYCL_MMVQ_HPP
14 | #define GGML_SYCL_MMVQ_HPP
15 | 
16 | #include "common.hpp"
17 | 
18 | 
19 | void ggml_sycl_op_mul_mat_vec_q(
20 |     ggml_backend_sycl_context & ctx,
21 |     const ggml_tensor *src0, const ggml_tensor *src1, ggml_tensor *dst,
22 |     const char *src0_dd_i, const float *src1_ddf_i, const char *src1_ddq_i,
23 |     float *dst_dd_i, const int64_t row_low, const int64_t row_high,
24 |     const int64_t src1_ncols, const int64_t src1_padded_row_size,
25 |     const dpct::queue_ptr &stream);
26 | 
27 | #endif // GGML_SYCL_MMVQ_HPP
28 | 


--------------------------------------------------------------------------------
/bindings/go/pkg/whisper/consts.go:
--------------------------------------------------------------------------------
 1 | package whisper
 2 | 
 3 | import (
 4 | 	"errors"
 5 | 
 6 | 	// Bindings
 7 | 	whisper "github.com/ggerganov/whisper.cpp/bindings/go"
 8 | )
 9 | 
10 | ///////////////////////////////////////////////////////////////////////////////
11 | // ERRORS
12 | 
13 | var (
14 | 	ErrUnableToLoadModel    = errors.New("unable to load model")
15 | 	ErrInternalAppError     = errors.New("internal application error")
16 | 	ErrProcessingFailed     = errors.New("processing failed")
17 | 	ErrUnsupportedLanguage  = errors.New("unsupported language")
18 | 	ErrModelNotMultilingual = errors.New("model is not multilingual")
19 | )
20 | 
21 | ///////////////////////////////////////////////////////////////////////////////
22 | // CONSTANTS
23 | 
24 | // SampleRate is the sample rate of the audio data.
25 | const SampleRate = whisper.SampleRate
26 | 
27 | // SampleBits is the number of bits per sample.
28 | const SampleBits = whisper.SampleBits
29 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-sycl/dmmv.hpp:
--------------------------------------------------------------------------------
 1 | //
 2 | // MIT license
 3 | // Copyright (C) 2024 Intel Corporation
 4 | // SPDX-License-Identifier: MIT
 5 | //
 6 | 
 7 | //
 8 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 9 | // See https://llvm.org/LICENSE.txt for license information.
10 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
11 | //
12 | 
13 | #ifndef GGML_SYCL_DMMV_HPP
14 | #define GGML_SYCL_DMMV_HPP
15 | 
16 | #include "common.hpp"
17 | 
18 | 
19 | void ggml_sycl_op_dequantize_mul_mat_vec( // declaration only; the definition is not part of this header
20 |     ggml_backend_sycl_context & ctx, // backend context, taken by non-const reference
21 |     const ggml_tensor *src0, const ggml_tensor *src1, ggml_tensor *dst, // src0/src1 are read-only tensors, dst is writable
22 |     const char *src0_dd_i, const float *src1_ddf_i, const char *src1_ddq_i, // read-only raw buffers; NOTE(review): presumably src0 data plus float and quantized views of src1 - confirm in the definition
23 |     float *dst_dd_i, const int64_t row_low, const int64_t row_high, // writable float output; NOTE(review): row_low/row_high presumably bound the rows processed - confirm
24 |     const int64_t src1_ncols, const int64_t src1_padded_row_size, // NOTE(review): units of src1_padded_row_size are not visible here - confirm
25 |     const dpct::queue_ptr &stream); // queue handle, taken by const reference
26 | 
27 | #endif // GGML_SYCL_DMMV_HPP
28 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-kompute/kompute-shaders/op_getrows_f32.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "common.comp"
 4 | 
 5 | layout(local_size_x = 1) in; // a single invocation per workgroup
 6 | 
 7 | layout (binding = 0) readonly buffer tensorInA { float inA[]; }; // float source data the rows are copied from
 8 | layout (binding = 1) readonly buffer tensorInB { int inB[]; }; // main() reads one int per workgroup from here and uses it as the source row
 9 | layout (binding = 2) writeonly buffer tensorOut { float out_[]; }; // float destination
10 | 
11 | layout (push_constant) uniform parameter {
12 |     uint inAOff; // added to the computed inA element index
13 |     uint inBOff; // added to the workgroup id when indexing inB
14 |     uint outOff; // added to the computed out_ element index
15 |     int ne00; // number of elements copied per row
16 |     int nb01; // main() divides this by 4 to get an inA element offset; presumably the source row stride in bytes - confirm with the host code
17 |     int nb1; // main() divides this by 4 to get an out_ element offset; presumably the destination row stride in bytes - confirm with the host code
18 | } pcs;
19 | 
20 | void dequantize_row_f32(uint x /*Based from inA unaligned*/, uint y /*Based from out_*/, int k) {
21 |     // Copies k floats, in ascending order, from inA starting at x to out_ starting at y.
22 |     for (int elem = 0; elem < k; ++elem)
23 |         out_[y + elem] = inA[x + elem];
24 | }
25 | 
26 | void main() {
27 |     const uint row = gl_WorkGroupID.x;                         // each workgroup handles one output row
28 |     const int srcRow = inB[row + pcs.inBOff];                  // source row looked up in inB
29 |     const uint srcBase = srcRow*pcs.nb01/4 + pcs.inAOff;       // nb01 is divided by 4 to index floats in inA
30 |     dequantize_row_f32(srcBase, row*pcs.nb1/4 + pcs.outOff, pcs.ne00);
31 | }
32 | 


--------------------------------------------------------------------------------
/tests/en-2-ref.txt:
--------------------------------------------------------------------------------
1 |  This is the Micro Machine Man presenting the most midget miniature motorcade of Micro Machines. Each one has dramatic details, terrific trim, precision paint jobs, plus incredible Micro Machine Pocket Playsets. There's a police station, fire station, restaurant, service station, and more. Perfect pocket portables to take anyplace. And there are many miniature playsets to play with, and each one comes with its own special edition Micro Machine vehicle and fun, fantastic features that miraculously move. Raise the boat lift at the airport marina, man the gun turret at the army base, clean your car at the car wash, raise the toll bridge. And these playsets fit together to form a Micro Machine world. Micro Machine Pocket Playsets, so tremendously tiny, so perfectly precise, so dazzlingly detailed, you'll want to pocket them all. Micro Machines are Micro Machine Pocket Playsets sold separately from Galoob. The smaller they are, the better they are.


--------------------------------------------------------------------------------
/examples/whisper.objc/whisper.objc/Info.plist:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="UTF-8"?>
 2 | <!DOCTYPE plist PUBLIC "-//Apple//DTD PLIST 1.0//EN" "http://www.apple.com/DTDs/PropertyList-1.0.dtd">
 3 | <plist version="1.0">
 4 | <dict>
 5 | 	<key>NSMicrophoneUsageDescription</key>
 6 | 	<string>This app requires microphone access in order to transcribe speech</string>
 7 | 	<key>UIApplicationSceneManifest</key>
 8 | 	<dict>
 9 | 		<key>UIApplicationSupportsMultipleScenes</key>
10 | 		<false/>
11 | 		<key>UISceneConfigurations</key>
12 | 		<dict>
13 | 			<key>UIWindowSceneSessionRoleApplication</key>
14 | 			<array>
15 | 				<dict>
16 | 					<key>UISceneConfigurationName</key>
17 | 					<string>Default Configuration</string>
18 | 					<key>UISceneDelegateClassName</key>
19 | 					<string>SceneDelegate</string>
20 | 					<key>UISceneStoryboardFile</key>
21 | 					<string>Main</string>
22 | 				</dict>
23 | 			</array>
24 | 		</dict>
25 | 	</dict>
26 | </dict>
27 | </plist>
28 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-sycl/convert.hpp:
--------------------------------------------------------------------------------
 1 | //
 2 | // MIT license
 3 | // Copyright (C) 2024 Intel Corporation
 4 | // SPDX-License-Identifier: MIT
 5 | //
 6 | 
 7 | //
 8 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 9 | // See https://llvm.org/LICENSE.txt for license information.
10 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
11 | //
12 | 
13 | #ifndef GGML_SYCL_CONVERT_HPP
14 | #define GGML_SYCL_CONVERT_HPP
15 | 
16 | #include "common.hpp"
17 | 
18 | // Function-pointer type: untyped read-only source x, destination y of element type T, an int64_t k, and a queue handle.
19 | template <typename T> using to_t_sycl_t =
20 |     void (*)(const void *__restrict__ x, T *__restrict__ y, int64_t k, dpct::queue_ptr stream);
21 | using to_fp32_sycl_t = to_t_sycl_t<float>;      // destination elements are float
22 | using to_fp16_sycl_t = to_t_sycl_t<sycl::half>; // destination elements are sycl::half
23 | 
24 | to_fp16_sycl_t ggml_get_to_fp16_sycl(ggml_type type, ggml_tensor *dst); // returns a to-half function pointer for type; NOTE(review): the role of dst is not visible here
25 | to_fp32_sycl_t ggml_get_to_fp32_sycl(ggml_type type, ggml_tensor *dst); // returns a to-float function pointer for type; NOTE(review): the role of dst is not visible here
26 | 
27 | #endif // GGML_SYCL_CONVERT_HPP
28 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/repeat.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "types.comp"
 4 | #include "generic_unary_head.comp"
 5 | 
 6 | layout(local_size_x = 512, local_size_y = 1, local_size_z = 1) in;
 7 | 
 8 | uint src0_idx_mod(uint idx) { // splits the flat index idx into four coordinates and returns the matching src0 offset, wrapping each coordinate
 9 |     const uint i13 = idx / (p.ne12*p.ne11*p.ne10); // outermost coordinate
10 |     const uint i13_offset = i13 * p.ne12*p.ne11*p.ne10; // flat elements accounted for by i13
11 |     const uint i12 = (idx - i13_offset) / (p.ne11*p.ne10);
12 |     const uint i12_offset = i12*p.ne11*p.ne10; // flat elements accounted for by i12
13 |     const uint i11 = (idx - i13_offset - i12_offset) / p.ne10;
14 |     const uint i10 = idx - i13_offset - i12_offset - i11*p.ne10; // innermost coordinate: what is left after removing the outer three
15 |     return (i13 % p.ne03)*p.nb03 + (i12 % p.ne02)*p.nb02 + (i11 % p.ne01)*p.nb01 + (i10 % p.ne00)*p.nb00; // each coordinate is reduced modulo the matching ne0x, then scaled by nb0x
16 | }
17 | 
18 | void main() {
19 |     const uint elem = get_idx();
20 | 
21 |     // Invocations whose index is not below p.ne write nothing.
22 |     if (elem < p.ne) {
23 |         // One destination element per invocation, read from the wrapped source offset.
24 |         data_d[get_doffset() + dst_idx(elem)] = D_TYPE(data_a[get_aoffset() + src0_idx_mod(elem)]);
25 |     }
26 | }
27 | 


--------------------------------------------------------------------------------
/examples/talk-llama/llama-memory.h:
--------------------------------------------------------------------------------
 1 | #pragma once
 2 | 
 3 | #include "llama.h"
 4 | 
 5 | // general concept of LLM memory
 6 | // the KV cache is a type of LLM memory, but there can be other types
 7 | class llama_memory_i {
 8 | public:
 9 |     // Implementations may be destroyed through a llama_memory_i pointer;
10 |     // that is only well-defined when the base destructor is virtual.
11 |     virtual ~llama_memory_i() = default;
12 | 
13 |     virtual void clear() = 0;
14 |     virtual void defrag() = 0;
15 | 
16 |     // Per-sequence operations. p0/p1 delimit a range of positions.
17 |     // NOTE(review): the exact range convention is not visible in this header - confirm in the implementations.
18 |     virtual bool seq_rm  (llama_seq_id seq_id,                              llama_pos p0, llama_pos p1) = 0;
19 |     virtual void seq_cp  (llama_seq_id seq_id_src, llama_seq_id seq_id_dst, llama_pos p0, llama_pos p1) = 0;
20 |     virtual void seq_keep(llama_seq_id seq_id) = 0;
21 |     virtual void seq_add (llama_seq_id seq_id,                              llama_pos p0, llama_pos p1, llama_pos delta) = 0;
22 |     virtual void seq_div (llama_seq_id seq_id,                              llama_pos p0, llama_pos p1, int d) = 0;
23 | 
24 |     virtual llama_pos seq_pos_max(llama_seq_id seq_id) = 0;
25 | 
26 |     virtual bool get_can_edit() const = 0;
27 | };
28 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-sycl/backend.hpp:
--------------------------------------------------------------------------------
 1 | //
 2 | // MIT license
 3 | // Copyright (C) 2024 Intel Corporation
 4 | // SPDX-License-Identifier: MIT
 5 | //
 6 | 
 7 | //
 8 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 9 | // See https://llvm.org/LICENSE.txt for license information.
10 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
11 | //
12 | 
13 | #ifndef GGML_SYCL_BACKEND_HPP
14 | #define GGML_SYCL_BACKEND_HPP
15 | 
16 | #include "concat.hpp"
17 | #include "common.hpp"
18 | #include "conv.hpp"
19 | #include "convert.hpp"
20 | #include "dequantize.hpp"
21 | #include "dmmv.hpp"
22 | #include "mmq.hpp"
23 | #include "mmvq.hpp"
24 | #include "rope.hpp"
25 | #include "norm.hpp"
26 | #include "softmax.hpp"
27 | #include "tsembd.hpp"
28 | #include "im2col.hpp"
29 | #include "wkv.hpp"
30 | #include "outprod.hpp"
31 | #include "element_wise.hpp"
32 | #include "cpy.hpp"
33 | #include "gla.hpp"
34 | 
35 | #endif // GGML_SYCL_BACKEND_HPP
36 | 


--------------------------------------------------------------------------------
/examples/talk-llama/llama-io.h:
--------------------------------------------------------------------------------
 1 | #pragma once
 2 | 
 3 | #include <cstddef>
 4 | #include <cstdint>
 5 | #include <string>
 6 | 
 7 | struct ggml_tensor;
 8 | 
 9 | class llama_io_write_i { // abstract writer: write(), write_tensor() and n_bytes() must be overridden
10 | public:
11 |     llama_io_write_i() = default;
12 |     virtual ~llama_io_write_i() = default; // virtual, so implementations can be destroyed through this interface
13 | 
14 |     virtual void write(const void * src, size_t size) = 0; // NOTE(review): presumably writes size bytes starting at src - confirm in the implementations
15 |     virtual void write_tensor(const ggml_tensor * tensor, size_t offset, size_t size) = 0; // NOTE(review): presumably writes size bytes of tensor data starting at offset - confirm
16 | 
17 |     // bytes written so far
18 |     virtual size_t n_bytes() = 0;
19 | 
20 |     void write_string(const std::string & str); // non-virtual; only declared here, the definition is not in this header
21 | };
22 | 
23 | class llama_io_read_i { // abstract reader: read(), read_to() and n_bytes() must be overridden
24 | public:
25 |     llama_io_read_i() = default;
26 |     virtual ~llama_io_read_i() = default; // virtual, so implementations can be destroyed through this interface
27 | 
28 |     virtual const uint8_t * read(size_t size) = 0; // returns a pointer to read-only bytes; NOTE(review): lifetime of the returned buffer is not visible here - confirm
29 |     virtual void read_to(void * dst, size_t size) = 0; // NOTE(review): presumably copies size bytes into dst - confirm in the implementations
30 | 
31 |     // bytes read so far
32 |     virtual size_t n_bytes() = 0;
33 | 
34 |     void read_string(std::string & str); // non-virtual; str is a non-const reference, so it can be modified by the call; defined elsewhere
35 | };
36 | 


--------------------------------------------------------------------------------
/ggml/include/ggml-rpc.h:
--------------------------------------------------------------------------------
 1 | #pragma once
 2 | 
 3 | #include "ggml.h"
 4 | #include "ggml-backend.h"
 5 | 
 6 | #ifdef  __cplusplus
 7 | extern "C" {
 8 | #endif
 9 | 
10 | #define GGML_RPC_MAX_SERVERS       16
11 | 
12 | // backend API
13 | GGML_BACKEND_API ggml_backend_t ggml_backend_rpc_init(const char * endpoint); // returns a backend handle for endpoint; NOTE(review): the endpoint string format is not shown in this header
14 | GGML_BACKEND_API bool ggml_backend_is_rpc(ggml_backend_t backend); // predicate on a backend handle
15 | 
16 | GGML_BACKEND_API ggml_backend_buffer_type_t ggml_backend_rpc_buffer_type(const char * endpoint); // returns a buffer type handle for endpoint
17 | 
18 | GGML_BACKEND_API void ggml_backend_rpc_get_device_memory(const char * endpoint, size_t * free, size_t * total); // free/total are non-const pointers, presumably outputs - confirm in the implementation
19 | 
20 | GGML_BACKEND_API void ggml_backend_rpc_start_server(ggml_backend_t backend, const char * endpoint, size_t free_mem, size_t total_mem); // NOTE(review): whether this call blocks is not visible here - confirm
21 | 
22 | GGML_BACKEND_API ggml_backend_reg_t ggml_backend_rpc_reg(void); // takes no arguments, returns a backend registry handle
23 | 
24 | GGML_BACKEND_API ggml_backend_dev_t ggml_backend_rpc_add_device(const char * endpoint); // returns a device handle for endpoint
25 | 
26 | #ifdef  __cplusplus
27 | }
28 | #endif
29 | 


--------------------------------------------------------------------------------
/examples/wchess/wchess.wasm/chessboardjs-1.0.0/js/chessboard-1.0.0/package.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "author": "Chris Oakman <chris@oakmac.com> (http://chrisoakman.com/)",
 3 |   "name": "@chrisoakman/chessboardjs",
 4 |   "description": "JavaScript chessboard widget",
 5 |   "homepage": "https://chessboardjs.com",
 6 |   "license": "MIT",
 7 |   "version": "1.0.0",
 8 |   "repository": {
 9 |     "type": "git",
10 |     "url": "git://github.com/oakmac/chessboardjs.git"
11 |   },
12 |   "files": ["dist/"],
13 |   "dependencies": {
14 |     "jquery": ">=3.4.1"
15 |   },
16 |   "devDependencies": {
17 |     "csso": "3.5.1",
18 |     "fs-plus": "3.1.1",
19 |     "kidif": "1.1.0",
20 |     "mustache": "2.3.0",
21 |     "standard": "10.0.2",
22 |     "uglify-js": "3.6.0"
23 |   },
24 |   "scripts": {
25 |     "build": "standard lib/chessboard.js && node scripts/build.js",
26 |     "standard": "standard --fix lib/*.js website/js/*.js",
27 |     "website": "node scripts/website.js"
28 |   }
29 | }
30 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-kompute/kompute-shaders/op_getrows_f16.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #include "common.comp"
 4 | 
 5 | layout(local_size_x = 1) in; // a single invocation per workgroup
 6 | 
 7 | layout (binding = 0) readonly buffer tensorInA { float16_t inA[]; }; // half-precision source data the rows are read from
 8 | layout (binding = 1) readonly buffer tensorInB { int inB[]; }; // main() reads one int per workgroup from here and uses it as the source row
 9 | layout (binding = 2) writeonly buffer tensorOut { float out_[]; }; // float destination
10 | 
11 | layout (push_constant) uniform parameter {
12 |     uint inAOff; // added to the computed inA element index
13 |     uint inBOff; // added to the workgroup id when indexing inB
14 |     uint outOff; // added to the computed out_ element index
15 |     int ne00; // number of elements converted per row
16 |     int nb01; // main() divides this by 2 to get an inA element offset; presumably the source row stride in bytes - confirm with the host code
17 |     int nb1; // main() divides this by 4 to get an out_ element offset; presumably the destination row stride in bytes - confirm with the host code
18 | } pcs;
19 | 
20 | void dequantize_row_f16(uint x /*Based from inA unaligned*/, uint y /*Based from out_*/, int k) {
21 |     // Stores k values, in ascending order, from the float16_t array inA (starting at x) into the float array out_ (starting at y).
22 |     for (int elem = 0; elem < k; ++elem)
23 |         out_[y + elem] = inA[x + elem];
24 | }
25 | 
26 | void main() {
27 |     const uint row = gl_WorkGroupID.x;                                             // each workgroup handles one output row
28 |     const int srcRow = inB[row + pcs.inBOff];                                      // source row looked up in inB
29 |     const uint srcBase = srcRow*pcs.nb01/2/*bytes for float16*/ + pcs.inAOff;      // nb01 is divided by 2 to index float16_t elements in inA
30 |     dequantize_row_f16(srcBase, row*pcs.nb1/4 + pcs.outOff, pcs.ne00);
31 | }
32 | 


--------------------------------------------------------------------------------
/ggml/src/ggml-vulkan/vulkan-shaders/count_equal.comp:
--------------------------------------------------------------------------------
 1 | #version 450
 2 | 
 3 | #extension GL_EXT_control_flow_attributes : enable
 4 | 
 5 | #include "types.comp"
 6 | #include "generic_head.comp"
 7 | 
 8 | layout(local_size_x_id = 0, local_size_y = 1, local_size_z = 1) in; // workgroup x-size is taken from specialization constant 0
 9 | 
10 | layout (binding = 0) readonly buffer X {A_TYPE data_a[];}; // first input, compared element by element with data_b
11 | layout (binding = 1) readonly buffer Y {B_TYPE data_b[];}; // second input
12 | layout (binding = 2) buffer D {D_TYPE data_d[];}; // data_d[0] receives the per-invocation counts through atomicAdd
13 | 
14 | const uint CHUNK_SIZE = 512; // number of consecutive elements covered by one workgroup
15 | 
16 | void main() {
17 |     // First element this invocation inspects: start of the workgroup's chunk plus the local invocation id.
18 |     const uint first = gl_WorkGroupID.x * CHUNK_SIZE + gl_LocalInvocationID.x;
19 | 
20 |     uint matches = 0;
21 |     [[unroll]]
22 |     for (uint step = 0; step < CHUNK_SIZE; step += gl_WorkGroupSize.x) {
23 |         const uint pos = first + step;
24 |         if (pos >= p.KX) {
25 |             break; // stop at the first position that is not below p.KX
26 |         }
27 |         matches += (data_a[pos] == data_b[pos]) ? 1u : 0u;
28 |     }
29 | 
30 |     atomicAdd(data_d[0], D_TYPE(matches)); // every invocation adds its own tally to the shared counter
31 | }
32 | 


--------------------------------------------------------------------------------