├── .github
    ├── ISSUE_TEMPLATE
    │   ├── 1_bug-report.yml
    │   ├── 2_feature_request.yml
    │   ├── 3_question.yml
    │   └── config.yml
    ├── PULL_REQUEST_TEMPLATE.md
    └── workflows
    │   ├── changelog.yml
    │   ├── docs.yml
    │   └── release.yml
├── .gitignore
├── CHANGELOG.md
├── LICENSE
├── README.md
├── VERSION
├── bin
    └── transformers
├── composer.json
├── docs
    ├── .gitignore
    ├── .vitepress
    │   └── config.mts
    ├── README.md
    ├── audio-classification.md
    ├── automatic-speech-recognition.md
    ├── basic-usage.md
    ├── bun.lockb
    ├── configuration.md
    ├── feature-extraction.md
    ├── fill-mask.md
    ├── getting-started.md
    ├── image-classification.md
    ├── image-feature-extraction.md
    ├── image-to-image.md
    ├── image-to-text.md
    ├── images
    │   └── detection-example.jpg
    ├── index.md
    ├── introduction.md
    ├── models.md
    ├── object-detection.md
    ├── package.json
    ├── pipelines.md
    ├── question-answering.md
    ├── summarization.md
    ├── text-classification.md
    ├── text-generation.md
    ├── text-to-text-generation.md
    ├── token-classification.md
    ├── tokenizers.md
    ├── translation.md
    ├── utils
    │   ├── generation.md
    │   ├── image.md
    │   └── tensor.md
    ├── zero-shot-classification.md
    ├── zero-shot-image-classification.md
    └── zero-shot-object-detection.md
├── examples
    ├── .gitignore
    ├── bootstrap.php
    ├── composer.json
    ├── misc
    │   ├── background-removal.php
    │   ├── custom-object-detection.php
    │   ├── general-test.php
    │   └── image-test.php
    ├── pipelines
    │   ├── asr.php
    │   ├── audio-classification.php
    │   ├── feature-extraction.php
    │   ├── fill-mask.php
    │   ├── image-classification.php
    │   ├── image-feature-extraction.php
    │   ├── image-to-image.php
    │   ├── image-to-text.php
    │   ├── object-detection.php
    │   ├── question-answering.php
    │   ├── sentiment-analysis.php
    │   ├── summarization.php
    │   ├── text-classification.php
    │   ├── text-generation.php
    │   ├── text2text-generation.php
    │   ├── token-classification.php
    │   ├── translation.php
    │   ├── zero-shot-classification.php
    │   ├── zero-shot-image-classification.php
    │   └── zero-shot-object-detection.php
    └── tokenizers
    │   └── apply-chat-template.php
├── libs
    └── .gitignore
├── phpunit.xml
├── scripts
    ├── convert.py
    ├── convert_upload_hf.ipynb
    └── requirements.txt
├── src
    ├── Commands
    │   ├── DownloadModelCommand.php
    │   └── InstallCommand.php
    ├── DataStructures
    │   ├── CharTrie.php
    │   ├── CharTrieNode.php
    │   ├── TokenLattice.php
    │   └── TokenLatticeNode.php
    ├── Decoders
    │   ├── BPEDecoder.php
    │   ├── ByteFallback.php
    │   ├── ByteLevelDecoder.php
    │   ├── CTCDecoder.php
    │   ├── Decoder.php
    │   ├── DecoderSequence.php
    │   ├── FuseDecoder.php
    │   ├── MetaspaceDecoder.php
    │   ├── ReplaceDecoder.php
    │   ├── StripDecoder.php
    │   ├── VitsDecoder.php
    │   └── WordPieceDecoder.php
    ├── Exceptions
    │   ├── HubException.php
    │   ├── MissingModelInputException.php
    │   ├── ModelExecutionException.php
    │   ├── TemplateParseException.php
    │   ├── TransformersException.php
    │   ├── UnsupportedModelTypeException.php
    │   └── UnsupportedTaskException.php
    ├── FFI
    │   ├── Libc.php
    │   ├── OnnxRuntime.php
    │   ├── Samplerate.php
    │   ├── Sndfile.php
    │   └── TransformersUtils.php
    ├── FeatureExtractors
    │   ├── ASTFeatureExtractor.php
    │   ├── DetrFeatureExtractor.php
    │   ├── FeatureExtractor.php
    │   ├── ImageFeatureExtractor.php
    │   ├── OwlViTFeatureExtractor.php
    │   ├── Owlv2ImageProcessor.php
    │   ├── Swin2SRImageProcessor.php
    │   ├── ViTFeatureExtractor.php
    │   ├── Wav2Vec2FeatureExtractor.php
    │   └── WhisperFeatureExtractor.php
    ├── Generation
    │   ├── AggregationStrategy.php
    │   ├── LogitsProcessors
    │   │   ├── BadWordsLogitsProcessor.php
    │   │   ├── ForceTokensLogitsProcessor.php
    │   │   ├── ForcedBOSTokenLogitsProcessor.php
    │   │   ├── ForcedEOSTokenLogitsProcessor.php
    │   │   ├── LogitsProcessor.php
    │   │   ├── LogitsProcessorList.php
    │   │   ├── MinLengthLogitsProcessor.php
    │   │   ├── MinNewTokensLengthLogitsProcessor.php
    │   │   ├── NoRepeatNGramLogitsProcessor.php
    │   │   ├── RepetitionPenaltyLogitsProcessor.php
    │   │   ├── SuppressTokensAtBeginLogitsProcessor.php
    │   │   └── WhisperTimeStampLogitsProcessor.php
    │   ├── Samplers
    │   │   ├── BeamSearchSampler.php
    │   │   ├── GreedySampler.php
    │   │   ├── MultinomialSampler.php
    │   │   └── Sampler.php
    │   └── Streamers
    │   │   ├── StdOutStreamer.php
    │   │   ├── StreamMode.php
    │   │   ├── Streamer.php
    │   │   ├── TextStreamer.php
    │   │   └── WhisperTextStreamer.php
    ├── Models
    │   ├── Auto
    │   │   ├── AutoModel.php
    │   │   ├── AutoModelForAudioClassification.php
    │   │   ├── AutoModelForCTC.php
    │   │   ├── AutoModelForCausalLM.php
    │   │   ├── AutoModelForImageClassification.php
    │   │   ├── AutoModelForImageFeatureExtraction.php
    │   │   ├── AutoModelForImageToImage.php
    │   │   ├── AutoModelForMaskedLM.php
    │   │   ├── AutoModelForObjectDetection.php
    │   │   ├── AutoModelForQuestionAnswering.php
    │   │   ├── AutoModelForSeq2SeqLM.php
    │   │   ├── AutoModelForSequenceClassification.php
    │   │   ├── AutoModelForSpeechSeq2Seq.php
    │   │   ├── AutoModelForTokenClassification.php
    │   │   ├── AutoModelForVision2Seq.php
    │   │   ├── AutoModelForZeroShotObjectDetection.php
    │   │   └── PretrainedMixin.php
    │   ├── ModelArchitecture.php
    │   ├── Output
    │   │   ├── BaseModelOutput.php
    │   │   ├── CasualLMOutput.php
    │   │   ├── DetrSegmentationOutput.php
    │   │   ├── MaskedLMOutput.php
    │   │   ├── ModelOutput.php
    │   │   ├── ObjectDetectionOutput.php
    │   │   ├── QuestionAnsweringModelOutput.php
    │   │   ├── SequenceClassifierOutput.php
    │   │   └── TokenClassifierOutput.php
    │   └── Pretrained
    │   │   ├── ASTForAudioClassification.php
    │   │   ├── ASTModel.php
    │   │   ├── ASTPretrainedModel.php
    │   │   ├── AlbertForMaskedLM.php
    │   │   ├── AlbertForQuestionAnswering.php
    │   │   ├── AlbertForSequenceClassification.php
    │   │   ├── AlbertModel.php
    │   │   ├── AlbertPretrainedModel.php
    │   │   ├── BartForConditionalGeneration.php
    │   │   ├── BartForSequenceClassification.php
    │   │   ├── BartModel.php
    │   │   ├── BartPretrainedModel.php
    │   │   ├── BertForMaskedLM.php
    │   │   ├── BertForQuestionAnswering.php
    │   │   ├── BertForSequenceClassification.php
    │   │   ├── BertForTokenClassification.php
    │   │   ├── BertModel.php
    │   │   ├── BertPretrainedModel.php
    │   │   ├── CLIPModel.php
    │   │   ├── CLIPPretrainedModel.php
    │   │   ├── CLIPVisionModelWithProjection.php
    │   │   ├── CodeGenForCausalLM.php
    │   │   ├── CodeGenModel.php
    │   │   ├── CodeGenPretrainedModel.php
    │   │   ├── DebertaForMaskedLM.php
    │   │   ├── DebertaForQuestionAnswering.php
    │   │   ├── DebertaForSequenceClassification.php
    │   │   ├── DebertaForTokenClassification.php
    │   │   ├── DebertaModel.php
    │   │   ├── DebertaPretrainedModel.php
    │   │   ├── DebertaV2ForMaskedLM.php
    │   │   ├── DebertaV2ForQuestionAnswering.php
    │   │   ├── DebertaV2ForSequenceClassification.php
    │   │   ├── DebertaV2ForTokenClassification.php
    │   │   ├── DebertaV2Model.php
    │   │   ├── DebertaV2PretrainedModel.php
    │   │   ├── DeiTForImageClassification.php
    │   │   ├── DeiTModel.php
    │   │   ├── DeiTPretrainedModel.php
    │   │   ├── DetrForObjectDetection.php
    │   │   ├── DetrForSegmentation.php
    │   │   ├── DetrModel.php
    │   │   ├── DetrPretrainedModel.php
    │   │   ├── DistilBertForMaskedLM.php
    │   │   ├── DistilBertForQuestionAnswering.php
    │   │   ├── DistilBertForSequenceClassification.php
    │   │   ├── DistilBertModel.php
    │   │   ├── GPT2LMHeadModel.php
    │   │   ├── GPT2Model.php
    │   │   ├── GPT2PretrainedModel.php
    │   │   ├── GPTBigCodeForCausalLM.php
    │   │   ├── GPTBigCodeModel.php
    │   │   ├── GPTBigCodePretrainedModel.php
    │   │   ├── GPTJForCausalLM.php
    │   │   ├── GPTJModel.php
    │   │   ├── GPTJPretrainedModel.php
    │   │   ├── LlamaForCausalLM.php
    │   │   ├── LlamaModel.php
    │   │   ├── LlamaPretrainedModel.php
    │   │   ├── M2M100ForConditionalGeneration.php
    │   │   ├── M2M100Model.php
    │   │   ├── M2M100PretrainedModel.php
    │   │   ├── MobileBertForMaskedLM.php
    │   │   ├── MobileBertForQuestionAnswering.php
    │   │   ├── MobileBertForSequenceClassification.php
    │   │   ├── MobileBertModel.php
    │   │   ├── MobileBertPretrainedModel.php
    │   │   ├── OwlViTForObjectDetection.php
    │   │   ├── OwlViTModel.php
    │   │   ├── OwlViTPretrainedModel.php
    │   │   ├── Owlv2ForObjectDetection.php
    │   │   ├── Owlv2Model.php
    │   │   ├── Owlv2PretrainedModel.php
    │   │   ├── PretrainedModel.php
    │   │   ├── Qwen2ForCausalLM.php
    │   │   ├── Qwen2Model.php
    │   │   ├── Qwen2PreTrainedModel.php
    │   │   ├── RoFormerForMaskedLM.php
    │   │   ├── RoFormerForQuestionAnswering.php
    │   │   ├── RoFormerForSequenceClassification.php
    │   │   ├── RoFormerForTokenClassification.php
    │   │   ├── RoFormerModel.php
    │   │   ├── RoFormerPretrainedModel.php
    │   │   ├── RobertaForMaskedLM.php
    │   │   ├── RobertaForQuestionAnswering.php
    │   │   ├── RobertaForSequenceClassification.php
    │   │   ├── RobertaForTokenClassification.php
    │   │   ├── RobertaModel.php
    │   │   ├── RobertaPretrainedModel.php
    │   │   ├── SiglipModel.php
    │   │   ├── SiglipPretrainedModel.php
    │   │   ├── SiglipTextModel.php
    │   │   ├── SiglipVisionModel.php
    │   │   ├── Swin2SRForImageSuperResolution.php
    │   │   ├── Swin2SRModel.php
    │   │   ├── Swin2SRPretrainedModel.php
    │   │   ├── T5ForConditionalGeneration.php
    │   │   ├── T5Model.php
    │   │   ├── T5PretrainedModel.php
    │   │   ├── TrOCRForCausalLM.php
    │   │   ├── TrOCRPretrainedModel.php
    │   │   ├── ViTForImageClassification.php
    │   │   ├── ViTModel.php
    │   │   ├── ViTPretrainedModel.php
    │   │   ├── VisionEncoderDecoderModel.php
    │   │   ├── Wav2Vec2ForAudioFrameClassification.php
    │   │   ├── Wav2Vec2ForCTC.php
    │   │   ├── Wav2Vec2ForSequenceClassification.php
    │   │   ├── Wav2Vec2Model.php
    │   │   ├── Wav2Vec2PretrainedModel.php
    │   │   ├── WhisperForConditionalGeneration.php
    │   │   ├── WhisperModel.php
    │   │   ├── WhisperPretrainedModel.php
    │   │   ├── YolosForObjectDetection.php
    │   │   ├── YolosModel.php
    │   │   └── YolosPretrainedModel.php
    ├── Normalizers
    │   ├── BertNormalizer.php
    │   ├── Lowercase.php
    │   ├── NFC.php
    │   ├── NFKC.php
    │   ├── NFKD.php
    │   ├── Normalizer.php
    │   ├── NormalizerSequence.php
    │   ├── Precompiled.php
    │   ├── Prepend.php
    │   ├── Replace.php
    │   ├── StripAccents.php
    │   └── StripNormalizer.php
    ├── Pipelines
    │   ├── AudioClassificationPipeline.php
    │   ├── AutomaticSpeechRecognitionPipeline.php
    │   ├── FeatureExtractionPipeline.php
    │   ├── FillMaskPipeline.php
    │   ├── ImageClassificationPipeline.php
    │   ├── ImageFeatureExtractionPipeline.php
    │   ├── ImageToImagePipeline.php
    │   ├── ImageToTextPipeline.php
    │   ├── ObjectDetectionPipeline.php
    │   ├── Pipeline.php
    │   ├── QuestionAnsweringPipeline.php
    │   ├── SummarizationPipeline.php
    │   ├── Task.php
    │   ├── Text2TextGenerationPipeline.php
    │   ├── TextClassificationPipeline.php
    │   ├── TextGenerationPipeline.php
    │   ├── TokenClassificationPipeline.php
    │   ├── TranslationPipeline.php
    │   ├── ZeroShotClassificationPipeline.php
    │   ├── ZeroShotImageClassificationPipeline.php
    │   └── ZeroShotObjectDetectionPipeline.php
    ├── PostProcessors
    │   ├── BertProcessing.php
    │   ├── ByteLevelPostProcessor.php
    │   ├── PostProcessedOutput.php
    │   ├── PostProcessor.php
    │   ├── PostProcessorSequence.php
    │   ├── RobertaProcessing.php
    │   └── TemplateProcessing.php
    ├── PreTokenizers
    │   ├── BertPreTokenizer.php
    │   ├── ByteLevelPreTokenizer.php
    │   ├── DigitsPreTokenizer.php
    │   ├── MetaspacePreTokenizer.php
    │   ├── PreTokenizer.php
    │   ├── PreTokenizerSequence.php
    │   ├── PunctuationPreTokenizer.php
    │   ├── ReplacePreTokenizer.php
    │   ├── SplitPreTokenizer.php
    │   ├── WhitespacePreTokenizer.php
    │   └── WhitespaceSplit.php
    ├── PreTrainedTokenizers
    │   ├── AlbertTokenizer.php
    │   ├── AutoTokenizer.php
    │   ├── BartTokenizer.php
    │   ├── BertTokenizer.php
    │   ├── BlenderbotSmallTokenizer.php
    │   ├── BlenderbotTokenizer.php
    │   ├── BloomTokenizer.php
    │   ├── CLIPTokenizer.php
    │   ├── CamembertTokenizer.php
    │   ├── CodeGenTokenizer.php
    │   ├── CodeLlamaTokenizer.php
    │   ├── CohereTokenizer.php
    │   ├── ConvBertTokenizer.php
    │   ├── DebertaTokenizer.php
    │   ├── DebertaV2Tokenizer.php
    │   ├── DistilBertTokenizer.php
    │   ├── ElectraTokenizer.php
    │   ├── EsmTokenizer.php
    │   ├── FalconTokenizer.php
    │   ├── GPT2Tokenizer.php
    │   ├── GPTNeoXTokenizer.php
    │   ├── GemmaTokenizer.php
    │   ├── Grok1Tokenizer.php
    │   ├── HerbertTokenizer.php
    │   ├── LlamaTokenizer.php
    │   ├── M2M100Tokenizer.php
    │   ├── MBart50Tokenizer.php
    │   ├── MBartTokenizer.php
    │   ├── MPNetTokenizer.php
    │   ├── MobileBertTokenizer.php
    │   ├── NllbTokenizer.php
    │   ├── NougatTokenizer.php
    │   ├── PreTrainedTokenizer.php
    │   ├── Qwen2Tokenizer.php
    │   ├── RoFormerTokenizer.php
    │   ├── RobertaTokenizer.php
    │   ├── SiglipTokenizer.php
    │   ├── SpeechT5Tokenizer.php
    │   ├── SqueezeBertTokenizer.php
    │   ├── T5Tokenizer.php
    │   ├── VitsTokenizer.php
    │   ├── Wav2Vec2CTCTokenizer.php
    │   ├── WhisperTokenizer.php
    │   ├── XLMRobertaTokenizer.php
    │   └── XLMTokenizer.php
    ├── Processors
    │   ├── AutoProcessor.php
    │   ├── OwlViTProcessor.php
    │   ├── Processor.php
    │   ├── Wav2Vec2ProcessorWithLM.php
    │   └── WhisperProcessor.php
    ├── Tensor
    │   ├── MatrixOperator.php
    │   ├── OpenBLASFactory.php
    │   ├── Tensor.php
    │   ├── TensorBuffer.php
    │   ├── TensorBufferFactory.php
    │   └── TensorService.php
    ├── Tokenizers
    │   ├── AddedToken.php
    │   ├── BPEModel.php
    │   ├── BPENode.php
    │   ├── LegacyModel.php
    │   ├── TokenizerModel.php
    │   ├── UnigramModel.php
    │   └── WordPieceModel.php
    ├── Transformers.php
    └── Utils
    │   ├── Audio.php
    │   ├── AutoConfig.php
    │   ├── Downloader.php
    │   ├── GenerationConfig.php
    │   ├── Helpers.php
    │   ├── Hub.php
    │   ├── Image.php
    │   ├── ImageDriver.php
    │   ├── InferenceSession.php
    │   ├── LibsChecker.php
    │   ├── Math.php
    │   ├── Resample.php
    │   └── StreamLogger.php
└── tests
    ├── Expectations.php
    ├── Pest.php
    ├── PipelineTest.php
    ├── Utils
        ├── HubTest.php
        └── StreamLoggerTest.php
    ├── tensors
        ├── TensorBufferTest.php
        └── TensorTest.php
    └── tokenizers
        ├── Datasets.php
        ├── TokenizersTest.php
        ├── dataset-regular.json
        └── dataset-templates.json


/.github/ISSUE_TEMPLATE/2_feature_request.yml:
--------------------------------------------------------------------------------
 1 | name: "🚀 Feature request"
 2 | description: Submit a proposal/request for a new Transformers PHP feature
 3 | labels: [ "enhancement" ]
 4 | body:
 5 |   - type: dropdown
 6 |     id: feature-type
 7 |     attributes:
 8 |       label: Type of feature request
 9 |       description: "What kind of feature are you requesting?"
10 |       options:
11 |         - "🌟New Model"
12 |         - "🔧New Pipeline"
13 |         - "🚀Enhancement"
14 |         - "📦Other (please specify)"
15 |     validations:
16 |       required: true
17 | 
18 |   - type: textarea
19 |     id: feature-description
20 |     validations:
21 |       required: true
22 |     attributes:
23 |       label: Feature description
24 |       description: |
25 |         Please provide a clear and concise description of the feature you are requesting. If the feature is related to a new model or pipeline, include details like its functionality and purpose. 
26 |         For enhancements, describe the desired change and its benefits.
27 | 
28 |   - type: textarea
29 |     id: motivation
30 |     validations:
31 |       required: true
32 |     attributes:
33 |       label: Motivation
34 |       description: |
35 |         Please outline the motivation for the proposal. Why is it important that we add this feature? What is your intended use case?
36 | 
37 |   - type: textarea
38 |     id: contribution
39 |     validations:
40 |       required: true
41 |     attributes:
42 |       label: Your contribution
43 |       description: |
44 |         Is there any way that you could help, e.g. by submitting a PR?


--------------------------------------------------------------------------------
/.github/ISSUE_TEMPLATE/3_question.yml:
--------------------------------------------------------------------------------
 1 | name: "❓ Question about Transformers PHP"
 2 | description: Ask your questions about using Transformers PHP
 3 | labels: [ "question" ]
 4 | body:
 5 |   - type: textarea
 6 |     id: question
 7 |     validations:
 8 |       required: true
 9 |     attributes:
10 |       label: Your question
11 |       description: Please clearly state your question about using Transformers PHP. The more details you provide, the better we can assist you.
12 |       placeholder: "For example, I'm having trouble understanding how to use the [Model Name] model for sentiment analysis. Can you please provide some guidance?"
13 | 
14 |   - type: textarea
15 |     id: context
16 |     validations:
17 |       required: false  # Optional field
18 |     attributes:
19 |       label: Context (optional)
20 |       description: If necessary, provide additional context about your question. This could include the specific functionality you're trying to achieve, any code snippets you're working with, or error messages you're encountering (if applicable).
21 | 
22 |   - type: input
23 |     id: reference
24 |     validations:
25 |       required: false  # Optional field
26 |     attributes:
27 |       label: Reference (optional)
28 |       description: If your question relates to specific documentation or code examples, please provide a link here.
29 | 


--------------------------------------------------------------------------------
/.github/ISSUE_TEMPLATE/config.yml:
--------------------------------------------------------------------------------
1 | blank_issues_enabled: true
2 | version: 2.1
3 | contact_links:
4 |   - name: Documentation
5 |     url: https://codewithkyrian.github.io/transformers-php
6 |     about: Read the Transformers PHP documentation


--------------------------------------------------------------------------------
/.github/PULL_REQUEST_TEMPLATE.md:
--------------------------------------------------------------------------------
 1 | <!--
 2 | - Fill in the form below correctly. This will help the TransformersPHP team to understand the PR and also work on it.
 3 | -->
 4 | 
 5 | ### What:
 6 | 
 7 | - [ ] Bug Fix
 8 | - [ ] New Feature
 9 | 
10 | ### Description:
11 | 
12 | <!-- describe what your PR is solving -->
13 | 
14 | ### Related:
15 | 
16 | <!-- link to the issue(s) your PR is solving. If it doesn't exist, remove the "Related" section. -->
17 | 


--------------------------------------------------------------------------------
/.github/workflows/changelog.yml:
--------------------------------------------------------------------------------
 1 | name: "Update Changelog"
 2 | 
 3 | on:
 4 |   release:
 5 |     types: [prereleased, released]
 6 | 
 7 | permissions:
 8 |   contents: write
 9 | 
10 | jobs:
11 |   update:
12 |     runs-on: ubuntu-latest
13 | 
14 |     steps:
15 |       - name: Checkout code
16 |         uses: actions/checkout@v4
17 |         with:
18 |           ref: main
19 | 
20 |       - name: Update Changelog
21 |         uses: stefanzweifel/changelog-updater-action@v1
22 |         with:
23 |           latest-version: ${{ github.event.release.name }}
24 |           release-notes: ${{ github.event.release.body }}
25 | 
26 |       - name: Commit updated CHANGELOG
27 |         uses: stefanzweifel/git-auto-commit-action@v5
28 |         with:
29 |           branch: main
30 |           commit_message: Update CHANGELOG
31 |           file_pattern: CHANGELOG.md


--------------------------------------------------------------------------------
/.github/workflows/docs.yml:
--------------------------------------------------------------------------------
 1 | name: Deploy Docs site to Pages
 2 | 
 3 | on:
 4 |   push:
 5 |     branches: [main]
 6 | 
 7 |   workflow_dispatch:
 8 | 
 9 | permissions:
10 |   contents: read
11 |   pages: write
12 |   id-token: write
13 | 
14 | concurrency:
15 |   group: pages
16 |   cancel-in-progress: false
17 | 
18 | jobs:
19 | 
20 |   build:
21 |     runs-on: ubuntu-latest
22 |     steps:
23 |       - name: Checkout
24 |         uses: actions/checkout@v4
25 |         with:
26 |           fetch-depth: 0 # Not needed if lastUpdated is not enabled
27 | 
28 |       - name: Setup Bun
29 |         uses: oven-sh/setup-bun@v1 # Bun installs the dependencies and runs the VitePress build in the steps below
30 | 
31 |       - name: Setup Pages
32 |         uses: actions/configure-pages@v4
33 | 
34 |       - name: Install dependencies
35 |         working-directory: docs
36 |         run: bun install
37 | 
38 |       - name: Build with VitePress
39 |         working-directory: docs
40 |         run: bun run docs:build
41 | 
42 |       - name: Upload artifact
43 |         uses: actions/upload-pages-artifact@v3
44 |         with:
45 |           path: docs/.vitepress/dist
46 | 
47 |   deploy:
48 |     environment:
49 |       name: github-pages
50 |       url: ${{ steps.deployment.outputs.page_url }}
51 |     needs: build
52 |     runs-on: ubuntu-latest
53 |     name: Deploy
54 |     steps:
55 |       - name: Deploy to GitHub Pages
56 |         id: deployment
57 |         uses: actions/deploy-pages@v4


--------------------------------------------------------------------------------
/.github/workflows/release.yml:
--------------------------------------------------------------------------------
 1 | name: Build and Release Libraries
 2 | 
 3 | permissions:
 4 |   contents: write
 5 |   packages: read
 6 | 
 7 | on:
 8 |   release:
 9 |     types:
10 |       - published
11 | 
12 |   workflow_dispatch:
13 |     inputs:
14 |       tag:
15 |         description: 'Release Tag'
16 |         required: true
17 | 
18 | 
19 | jobs:
20 |   add-libs:
21 |     runs-on: ubuntu-latest
22 | 
23 |     steps:
24 |       - name: Log in to GHCR
25 |         uses: docker/login-action@v3
26 |         with:
27 |           registry: ghcr.io
28 |           username: ${{ github.actor }}
29 |           password: ${{ secrets.GITHUB_TOKEN }}
30 | 
31 |       - name: Build Libraries
32 |         env:
33 |           # Resolved once here and read as $TAG below, so the tag text is never pasted into the shell script itself.
34 |           TAG: ${{ startsWith(github.ref, 'refs/tags/') && github.ref_name || github.event.inputs.tag }}
35 |         run: |
36 |           docker run --rm -v ./libs:/libs -e TAG="$TAG" ghcr.io/codewithkyrian/transformers-php:latest
37 |           ls libs
38 | 
39 |       - name: Add Libraries to Release
40 |         uses: softprops/action-gh-release@v2
41 |         with:
42 |           # On workflow_dispatch github.ref is a branch, so the release has to be addressed by its tag explicitly.
43 |           tag_name: ${{ startsWith(github.ref, 'refs/tags/') && github.ref_name || github.event.inputs.tag }}
44 |           files: |
45 |             libs/*


--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
 1 | .phpunit.cache
 2 | .phpunit.result.cache
 3 | .php-cs-fixer.cache
 4 | .php-cs-fixer.php
 5 | 
 6 | composer.lock
 7 | /vendor/
 8 | 
 9 | .DS_Store
10 | Thumbs.db
11 | 
12 | *.swp
13 | *.swo
14 | playground/*
15 | 
16 | .idea
17 | .fleet
18 | .vscode
19 | 
20 | .transformers-cache/*
21 | tests/models/*
22 | dist


--------------------------------------------------------------------------------
/VERSION:
--------------------------------------------------------------------------------
1 | 0.5.3


--------------------------------------------------------------------------------
/bin/transformers:
--------------------------------------------------------------------------------
 1 | #!/usr/bin/env php
 2 | <?php declare(strict_types=1);
 3 | 
 4 | use Symfony\Component\Console\Application;
 5 | 
 6 | require_once $_composer_autoload_path ?? __DIR__ . '/../vendor/autoload.php';
 7 | 
 8 | $application = new Application();
 9 | 
10 | try {
11 |     $application->setName('Transformers PHP CLI');
12 | 
13 |     // Register the CLI commands shipped with the package.
14 |     $application->add(new Codewithkyrian\Transformers\Commands\InstallCommand());
15 |     $application->add(new Codewithkyrian\Transformers\Commands\DownloadModelCommand());
16 | 
17 |     $application->run();
18 | } catch (Exception $e) {
19 |     // Report failures on STDERR, newline-terminated, so they never mix with command output on STDOUT.
20 |     fwrite(STDERR, $e->getMessage() . PHP_EOL);
21 |     exit(1);
22 | }


--------------------------------------------------------------------------------
/docs/.gitignore:
--------------------------------------------------------------------------------
 1 | ### OSX ###
 2 | # General
 3 | .DS_Store
 4 | .AppleDouble
 5 | .LSOverride
 6 | 
 7 | # Thumbnails
 8 | ._*
 9 | 
10 | 
11 | # Files that might appear in the root of a volume
12 | .DocumentRevisions-V100
13 | .fseventsd
14 | .Spotlight-V100
15 | .TemporaryItems
16 | .Trashes
17 | .VolumeIcon.icns
18 | .com.apple.timemachine.donotpresent
19 | .idea
20 | 
21 | # Directories potentially created on remote AFP share
22 | .AppleDB
23 | .AppleDesktop
24 | Network Trash Folder
25 | Temporary Items
26 | .apdisk
27 | 
28 | ### Node ###
29 | # Logs
30 | logs
31 | *.log
32 | npm-debug.log*
33 | yarn-debug.log*
34 | yarn-error.log*
35 | lerna-debug.log*
36 | 
37 | # Dependency directories
38 | node_modules/
39 | jspm_packages/
40 | 
41 | # dotenv environment variables file
42 | .env
43 | .env.test
44 | 
45 | # vitepress build output
46 | .vitepress/dist
47 | .vitepress/cache


--------------------------------------------------------------------------------
/docs/README.md:
--------------------------------------------------------------------------------
1 | # TransformersPHP Documentation
2 | 
3 | Welcome to the official documentation for TransformersPHP. You can find the online version of this documentation
4 | at [https://codewithkyrian.github.io/transformers-php/](https://codewithkyrian.github.io/transformers-php/).
5 | 
6 | ## Contributing
7 | 
8 | If you would like to contribute to the documentation, create a pull request with your changes. The documentation is
9 | written in Markdown, so it should be easy to understand and contribute to.


--------------------------------------------------------------------------------
/docs/bun.lockb:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/CodeWithKyrian/transformers-php/6609377bb44275d8a2c8936ec30d62e430f836de/docs/bun.lockb


--------------------------------------------------------------------------------
/docs/images/detection-example.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/CodeWithKyrian/transformers-php/6609377bb44275d8a2c8936ec30d62e430f836de/docs/images/detection-example.jpg


--------------------------------------------------------------------------------
/docs/package.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "devDependencies": {
 3 |     "vitepress": "^1.0.0-rc.45"
 4 |   },
 5 |   "scripts": {
 6 |     "docs:dev": "vitepress dev",
 7 |     "docs:build": "vitepress build",
 8 |     "docs:preview": "vitepress preview"
 9 |   }
10 | }


--------------------------------------------------------------------------------
/examples/.gitignore:
--------------------------------------------------------------------------------
1 | vendor
2 | .transformers-cache/*
3 | composer.lock
4 | paddleocr


--------------------------------------------------------------------------------
/examples/bootstrap.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | use Codewithkyrian\Transformers\Transformers;
 6 | use Codewithkyrian\Transformers\Utils\ImageDriver;
 7 | use Codewithkyrian\Transformers\Utils\StreamLogger;
 8 | 
 9 | // Resolve the autoloader relative to this file so the bootstrap works from any working directory.
10 | require_once __DIR__ . '/vendor/autoload.php';
11 | 
12 | // Shared setup for the example scripts. The cache directory can be overridden with the
13 | // TRANSFORMERS_CACHE_DIR environment variable; otherwise a folder next to this file is used
14 | // instead of an absolute path that only exists on one developer's machine.
15 | $cacheDir = getenv('TRANSFORMERS_CACHE_DIR') ?: __DIR__ . '/.transformers-cache';
16 | 
17 | Transformers::setup()
18 |     ->setCacheDir($cacheDir)
19 |     ->setImageDriver(ImageDriver::VIPS)
20 |     ->setLogger(new StreamLogger(STDOUT));
21 | 


--------------------------------------------------------------------------------
/examples/composer.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "name": "kyrian/examples",
 3 |   "autoload": {
 4 |     "psr-4": {
 5 |       "Kyrian\\Examples\\": "/"
 6 |     }
 7 |   },
 8 |   "authors": [
 9 |     {
10 |       "name": "Kyrian Obikwelu",
11 |       "email": "koshnawaza@gmail.com"
12 |     }
13 |   ],
14 |   "require": {
15 |     "php": "^8.1",
16 |     "symfony/console": "^7.0",
17 |     "codewithkyrian/transformers": "*"
18 |   },
19 |   "require-dev": {
20 |     "symfony/var-dumper": "^7.0"
21 |   },
22 |   "minimum-stability": "dev",
23 |   "repositories": [
24 |     {
25 |       "type": "path",
26 |       "url": "../"
27 |     }
28 |   ],
29 |   "config": {
30 |     "allow-plugins": {
31 |       "codewithkyrian/transformers-libraries-downloader": true,
32 |       "codewithkyrian/transformers-libsloader": true
33 |     }
34 |   }
35 | }
36 | 


--------------------------------------------------------------------------------
/examples/misc/background-removal.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | use Codewithkyrian\Transformers\Models\Auto\AutoModel;
 6 | use Codewithkyrian\Transformers\Processors\AutoProcessor;
 7 | use Codewithkyrian\Transformers\Utils\Image;
 8 | use function Codewithkyrian\Transformers\Utils\{memoryPeak, memoryUsage, timeUsage};
 9 | 
10 | require_once './bootstrap.php';
11 | 
12 | // The model and its processor are loaded from the same checkpoint name.
13 | $model = AutoModel::fromPretrained(modelNameOrPath: 'briaai/RMBG-1.4');
14 | $processor = AutoProcessor::fromPretrained(modelNameOrPath: 'briaai/RMBG-1.4');
15 | 
16 | $sourcePath = __DIR__ . '/../images/woman-w-bag.jpeg';
17 | $image = Image::read($sourcePath);
18 | 
19 | // Base name (without extension) used to build the output file names.
20 | $baseName = pathinfo($sourcePath, PATHINFO_FILENAME);
21 | 
22 | // Run the processor on the image, then feed its pixel values to the model as 'input'.
23 | $inputs = $processor($image);
24 | $outputs = $model(['input' => $inputs['pixel_values']]);
25 | 
26 | // Multiply the first output tensor by 255, turn it into an image and resize it to the source dimensions.
27 | $maskTensor = $outputs['output'][0]->multiply(255);
28 | $mask = Image::fromTensor($maskTensor)->resize($image->width(), $image->height());
29 | $mask->save($baseName . '-mask.png');
30 | 
31 | $maskedImage = $image->applyMask($mask);
32 | 
33 | // To also write the masked image to disk, uncomment:
34 | // $maskedImage->save($baseName . '-masked.png');


--------------------------------------------------------------------------------
/examples/misc/general-test.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | use Codewithkyrian\Transformers\FFI\TransformersUtils;
 4 | use Codewithkyrian\Transformers\FFI\Libc;
 5 | use Codewithkyrian\Transformers\FFI\OnnxRuntime;
 6 | use Codewithkyrian\Transformers\FFI\Samplerate;
 7 | use Codewithkyrian\Transformers\FFI\Sndfile;
 8 | 
 9 | include __DIR__.'/../vendor/autoload.php';
10 | 
11 | dd(
12 |     Libc::version(),
13 |     Sndfile::version(),
14 |     Samplerate::version(),
15 |     OnnxRuntime::version(),
16 |     TransformersUtils::version()
17 | );
18 | 


--------------------------------------------------------------------------------
/examples/misc/image-test.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | use Codewithkyrian\Transformers\Tensor\Tensor;
 6 | use Codewithkyrian\Transformers\Transformers;
 7 | use Codewithkyrian\Transformers\Utils\Image;
 8 | use Codewithkyrian\Transformers\Utils\ImageDriver;
 9 | use function Codewithkyrian\Transformers\Utils\timeUsage;
10 | 
// Resolve the bootstrap relative to this file so the script runs from any working directory.
require_once __DIR__ . '/../bootstrap.php';

ini_set('memory_limit', '2048M');
14 | 
/**
 * Configures the given image driver, converts the sample image to a tensor
 * and dumps the value reported by timeUsage(true) for that driver.
 *
 * @param ImageDriver $imageDriver The driver to configure before reading the image.
 * @return Tensor The tensor produced from the 101x101 RGB thumbnail.
 */
function toTensorTest(ImageDriver $imageDriver): Tensor
{
    timeUsage();

    Transformers::setup()->setImageDriver($imageDriver)->apply();

    $path = __DIR__.'/../images/kyrian-cartoon.jpeg';

    $source = Image::read($path);
    $result = $source->rgb()->thumbnail(101, 101)->toTensor();

    dump($imageDriver->name.' (toTensor) : '.timeUsage(true));

    return $result;
}
33 | 
/**
 * Configures the given image driver, builds an image from the tensor
 * and dumps the value reported by timeUsage(true) for that driver.
 *
 * @param ImageDriver $imageDriver The driver to configure before the conversion.
 * @param Tensor $tensor The tensor to convert into an image.
 * @return Image The image created from the tensor.
 */
function fromTensorTest(ImageDriver $imageDriver, Tensor $tensor): Image
{
    Transformers::setup()->setImageDriver($imageDriver)->apply();

    $converted = Image::fromTensor($tensor);

    dump($imageDriver->name.' (fromTensor) : '.timeUsage(true));

    return $converted;
}
46 | 
47 | 
// Run the test: each driver is exercised in the same order, and the tensor from the
// last toTensor run is the one fed into the fromTensor runs.
dump("------------ toTensor ------------");
foreach ([ImageDriver::IMAGICK, ImageDriver::GD, ImageDriver::VIPS] as $driver) {
    $tensor = toTensorTest($driver);
}


dump("------------ fromTensor ------------");
foreach ([ImageDriver::IMAGICK, ImageDriver::GD, ImageDriver::VIPS] as $driver) {
    $image = fromTensorTest($driver, $tensor);
}

// Save the image
//$image->save('images/images/kyrian-cartoon-converted.jpeg');
62 | 


--------------------------------------------------------------------------------
/examples/pipelines/asr.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | use Codewithkyrian\Transformers\Generation\Streamers\TextStreamer;
 6 | use Codewithkyrian\Transformers\Generation\Streamers\WhisperTextStreamer;
 7 | use function Codewithkyrian\Transformers\Pipelines\pipeline;
 8 | use function Codewithkyrian\Transformers\Utils\{memoryUsage, timeUsage};
 9 | 
// Resolve the bootstrap relative to this file so the example runs from any working directory.
require_once __DIR__ . '/../bootstrap.php';

ini_set('memory_limit', '-1');

$transcriber = pipeline('asr', 'Xenova/whisper-tiny.en');
//$transcriber = pipeline('automatic-speech-recognition', 'Xenova/whisper-tiny');
//$transcriber = pipeline('automatic-speech-recognition', 'Xenova/whisper-base');
//$transcriber = pipeline('automatic-speech-recognition', 'Xenova/wav2vec2-large-xlsr-53-english');

//$audioUrl = __DIR__ . '/../sounds/kyrian-dev.wav';
//$audioUrl = __DIR__ . '/../sounds/jfk.wav';
//$audioUrl = __DIR__ . '/../sounds/preamble.wav';
//$audioUrl = __DIR__ . '/../sounds/taunt.wav';
//$audioUrl = __DIR__ . '/../sounds/gettysburg.wav';
//$audioUrl = __DIR__ . '/../sounds/kyrian-speaking.wav';
$audioUrl = __DIR__ . '/../sounds/ted_60.wav';
//$audioUrl = __DIR__ . '/../sounds/sample-1.mp3';

// Print each piece of text as soon as the streamer hands it over.
$streamer = WhisperTextStreamer::make()
    ->onStream(fn($text) => print($text));


$output = $transcriber($audioUrl,
    maxNewTokens: 256,
    chunkLengthSecs: 24,
    streamer: $streamer,
);

dd($output, timeUsage(), memoryUsage());
39 | 


--------------------------------------------------------------------------------
/examples/pipelines/audio-classification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | use function Codewithkyrian\Transformers\Pipelines\pipeline;
 6 | use function Codewithkyrian\Transformers\Utils\memoryUsage;
 7 | use function Codewithkyrian\Transformers\Utils\timeUsage;
 8 | 
 9 | require_once './bootstrap.php';
10 | 
11 | $classifier = pipeline('audio-classification', 'Xenova/ast-finetuned-audioset-10-10-0.4593');
12 | 
13 | //$audioUrl = __DIR__ . '/../sounds/dog_barking.wav';
14 | $audioUrl = __DIR__ . '/../sounds/cat_meow.wav';
15 | 
16 | $output = $classifier($audioUrl, topK: 4);
17 | 
18 | dd($output, timeUsage(), memoryUsage());
19 | 


--------------------------------------------------------------------------------
/examples/pipelines/feature-extraction.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | use function Codewithkyrian\Transformers\Pipelines\pipeline;
 6 | use function Codewithkyrian\Transformers\Utils\{memoryUsage, timeUsage};
 7 | 
 8 | require_once './bootstrap.php';
 9 | 
10 | 
11 | //$extractor = pipeline('feature-extraction', 'Xenova/bert-base-uncased');
12 | $extractor = pipeline('embeddings', 'Xenova/all-MiniLM-L6-v2');
13 | //$extractor = pipeline('embeddings', 'Xenova/paraphrase-albert-small-v2');
14 | 
15 | $embeddings = $extractor('The quick brown fox jumps over the lazy dog.', normalize: true, pooling: 'mean');
16 | 
17 | dd(memoryUsage(), timeUsage(milliseconds: true), count($embeddings[0]));
18 | 


--------------------------------------------------------------------------------
/examples/pipelines/fill-mask.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | use function Codewithkyrian\Transformers\Pipelines\pipeline;
 6 | 
 7 | require_once './bootstrap.php';
 8 | 
 9 | 
10 | //$pipeline = pipeline('fill-mask', 'Xenova/bert-base-uncased');
11 | //$result = $pipeline('My name is Kyrian and I am a [MASK] developer.');
12 | 
13 | 
14 | $pipeline = pipeline('fill-mask', 'Xenova/roberta-base');
15 | $result = $pipeline('My name is Kyrian and I am a <mask> developer.');
16 | 
17 | 
18 | dd($result);
19 | 
20 | 


--------------------------------------------------------------------------------
/examples/pipelines/image-classification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | use function Codewithkyrian\Transformers\Pipelines\pipeline;
 6 | use function Codewithkyrian\Transformers\Utils\memoryUsage;
 7 | use function Codewithkyrian\Transformers\Utils\timeUsage;
 8 | 
 9 | require_once './bootstrap.php';
10 | 
11 | $classifier = pipeline('image-classification', 'Xenova/vit-base-patch16-224');
12 | 
13 | $urls = [
14 |     __DIR__ . '/../images/tiger.jpg',
15 |     __DIR__ . '/../images/corgi.jpg',
16 |     __DIR__ . '/../images/cats.jpg',
17 | ];
18 | 
19 | $output = $classifier(__DIR__ . '/../images/tiger.jpg');
20 | 
21 | dd($output, timeUsage(), memoryUsage());
22 | 


--------------------------------------------------------------------------------
/examples/pipelines/image-feature-extraction.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | use function Codewithkyrian\Transformers\Pipelines\pipeline;
 7 | use function Codewithkyrian\Transformers\Utils\memoryUsage;
 8 | use function Codewithkyrian\Transformers\Utils\timeUsage;
 9 | 
// Resolve the bootstrap relative to this file so the example runs from any working directory.
require_once __DIR__ . '/../bootstrap.php';

$imageFeatureExtractor = pipeline('image-feature-extraction', 'Xenova/vit-base-patch16-224-in21k');

$url = __DIR__ . '/../images/cats.jpg';

$features = $imageFeatureExtractor($url);

dd($features[0], timeUsage(), memoryUsage());
19 | 


--------------------------------------------------------------------------------
/examples/pipelines/image-to-image.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | use function Codewithkyrian\Transformers\Pipelines\pipeline;
 6 | use function Codewithkyrian\Transformers\Utils\memoryUsage;
 7 | use function Codewithkyrian\Transformers\Utils\timeUsage;
 8 | 
 9 | require_once './bootstrap.php';
10 | 
11 | ini_set('memory_limit', '2048M');
12 | 
13 | $upscaler = pipeline('image-to-image', 'Xenova/swin2SR-classical-sr-x2-64');
14 | 
15 | $url = __DIR__ . '/../images/butterfly.jpg';
16 | 
17 | $savePath = __DIR__ . '/../images/butterfly-x4.jpeg';
18 | 
19 | $output = $upscaler($url, saveTo: $savePath);
20 | 
21 | dd($output, timeUsage(), memoryUsage());
22 | 


--------------------------------------------------------------------------------
/examples/pipelines/image-to-text.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | use function Codewithkyrian\Transformers\Pipelines\pipeline;
 6 | use function Codewithkyrian\Transformers\Utils\memoryUsage;
 7 | use function Codewithkyrian\Transformers\Utils\timeUsage;
 8 | 
 9 | require_once './bootstrap.php';
10 | 
11 | ini_set('memory_limit', -1);
12 | $captioner = pipeline('image-to-text', 'Xenova/vit-gpt2-image-captioning');
13 | //$captioner = pipeline('image-to-text', 'Xenova/trocr-small-handwritten');
14 | 
15 | //$streamer = StdOutStreamer::make($captioner->tokenizer);
16 | 
17 | $url = __DIR__ . '/../images/beach.png';
18 | //$url = __DIR__. '/../images/handwriting.jpg';
19 | //$url = __DIR__. '/../images/handwriting3.png';
20 | //$url = __DIR__ . '/../images/handwriting4.jpeg';
21 | 
22 | $output = $captioner($url);
23 | 
24 | dd($output, timeUsage(), memoryUsage());


--------------------------------------------------------------------------------
/examples/pipelines/object-detection.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\Pipelines;
 6 | 
 7 | use function Codewithkyrian\Transformers\Utils\memoryUsage;
 8 | use function Codewithkyrian\Transformers\Utils\timeUsage;
 9 | 
// Resolve the bootstrap relative to this file so the example runs from any working directory.
require_once __DIR__ . '/../bootstrap.php';

ini_set('memory_limit', '-1');

$detector = pipeline('object-detection', 'Xenova/detr-resnet-50');

$img = __DIR__.'/../images/cats.jpg';

$output = $detector($img, threshold: 0.9);

dd($output, timeUsage(), memoryUsage());

//$image = Image::read($img);
//
//foreach ($output as $item) {
//    $box = $item['box'];
//    $image = $image->drawRectangle($box['xmin'], $box['ymin'], $box['xmax'], $box['ymax'], '0099FF', thickness: 2);
//    $image = $image->drawText($item['label'], $box['xmin'], max($box['ymin'] - 5, 0), '/Users/Kyrian/Library/Fonts/JosefinSans-Bold.ttf', 14, '0099FF');
//}
//
//$image->save(__DIR__ . '/../images/cats-detection.jpg');
31 | 
32 | 
33 | 


--------------------------------------------------------------------------------
/examples/pipelines/question-answering.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | use function Codewithkyrian\Transformers\Pipelines\pipeline;
 6 | 
 7 | require_once './bootstrap.php';
 8 | 
 9 | 
10 | //$question = "What is a good example of a question answering dataset?";
11 | //
12 | //$context = "Extractive Question Answering is the task of extracting an answer from a text given a question. An example
13 | //of a question answering dataset is the SQuAD dataset, which is entirely based on that task. If you would like to
14 | //fine-tune a model on a SQuAD task, you may leverage the examples/pytorch/question-answering/run_squad.py script.";
15 | //
16 | //$pipeline = pipeline('question-answering', 'Xenova/distilbert-base-cased-distilled-squad');
17 | 
18 | $question = "Who is known as the father of computers?";
19 | 
20 | $context = "The history of computing is longer than the history of computing hardware and modern computing technology 
21 | and includes the history of methods intended for pen and paper or for chalk and slate, with or without the aid of tables. 
22 | Charles Babbage is often regarded as one of the fathers of computing because of his contributions to the basic design of 
23 | the computer through his analytical engine.";
24 | 
25 | $pipeline = pipeline('question-answering', 'Xenova/distilbert-base-cased-distilled-squad');
26 | 
27 | $result = $pipeline($question, $context, topK: 3);
28 | 
29 | dd($result);
30 | 
31 | 
32 | 


--------------------------------------------------------------------------------
/examples/pipelines/sentiment-analysis.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | use function Codewithkyrian\Transformers\Pipelines\pipeline;
 6 | 
 7 | require_once './bootstrap.php';
 8 | 
 9 | 
10 | $classifier = pipeline('sentiment-analysis', 'Xenova/distilbert-base-uncased-finetuned-sst-2-english');
11 | 
12 | $result1 = $classifier(['I love transformers!', 'I hate transformers!']);
13 | //$result2 = $classifier("I hate him, he's very terrible.");
14 | 
15 | dd($result1);
16 | 
17 | 


--------------------------------------------------------------------------------
/examples/pipelines/text-classification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | use function Codewithkyrian\Transformers\Pipelines\pipeline;
 6 | 
 7 | require_once './bootstrap.php';
 8 | 
 9 | 
10 | $classifier = pipeline('text-classification', 'Xenova/toxic-bert');
11 | //
12 | //$result = $classifier("I hate you! You gave me life but in misery", topK: -1);
13 | 
14 | 
15 | // $classifier = pipeline('text-classification', 'Xenova/distilbert-base-uncased-mnli');
16 | 
17 | $result = $classifier('I want to beat him to pulp', topK: -1);
18 | 
19 | dd($result);
20 | 


--------------------------------------------------------------------------------
/examples/pipelines/text-generation.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | require_once './bootstrap.php';
 6 | 
 7 | use Codewithkyrian\Transformers\Generation\Streamers\StdOutStreamer;
 8 | use Codewithkyrian\Transformers\Generation\Streamers\TextStreamer;
 9 | use function Codewithkyrian\Transformers\Pipelines\pipeline;
10 | use function Codewithkyrian\Transformers\Utils\memoryUsage;
11 | use function Codewithkyrian\Transformers\Utils\timeUsage;
12 | 
13 | ini_set('memory_limit', -1);
14 | 
15 | //$generator = pipeline('text-generation', 'Xenova/gpt2');
16 | //$generator = pipeline('text-generation', 'Xenova/Qwen1.5-0.5B-Chat');
17 | //$generator = pipeline('text-generation', 'Xenova/TinyLlama-1.1B-Chat-v1.0');
18 | $generator = pipeline('text-generation', 'onnx-community/Llama-3.2-1B-Instruct', modelFilename: 'model_q4');
19 | 
20 | $streamer = TextStreamer::make()->shouldSkipPrompt();
21 | 
22 | $messages = [
23 |     ['role' => 'system', 'content' => 'You are a helpful assistant.'],
24 |     ['role' => 'user', 'content' => 'What is diffusion?'],
25 | ];
26 | 
27 | $input = $generator->tokenizer->applyChatTemplate($messages, addGenerationPrompt: true, tokenize: false);
28 | 
29 | $output = $generator($input,
30 |     streamer: $streamer,
31 |     maxNewTokens: 256,
32 |     doSample: true,
33 |     returnFullText: false,
34 | //    temperature: 0.7,
35 | //    repetitionPenalty: 1.3,
36 | //    earlyStopping: true
37 | );
38 | 
39 | //$generator = pipeline('text-generation', 'Xenova/codegen-350M-mono');
40 | //$streamer = TextStreamer::make();
41 | 
42 | //$output = $generator(
43 | //    'def fib(n):',
44 | //    streamer: $streamer,
45 | //    maxNewTokens: 100,
46 | //    doSample: true,
47 | //    returnFullText: true,
48 | //);
49 | 
50 | dd($output[0]['generated_text'], timeUsage(), memoryUsage());
51 | 


--------------------------------------------------------------------------------
/examples/pipelines/text2text-generation.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | require_once './bootstrap.php';
 6 | 
 7 | use Codewithkyrian\Transformers\Generation\Streamers\TextStreamer;
 8 | use function Codewithkyrian\Transformers\{Pipelines\pipeline, Utils\memoryUsage, Utils\timeUsage};
 9 | 
10 | ini_set('memory_limit', -1);
11 | 
12 | //$generator = pipeline('text2text-generation', 'Xenova/LaMini-Flan-T5-783M');
13 | $generator = pipeline('text2text-generation', 'Xenova/flan-t5-small', quantized: true);
14 | 
15 | $streamer = TextStreamer::make();
16 | 
17 | //$query = 'Please let me know your thoughts on the given place and why you think it deserves to be visited: \n" Barcelona, Spain"';
18 | //$query = 'How many continents are in the world? List them out';
19 | //$query = 'What is the capital of Nigeria? When was it changed from Lagos?';
20 | $query = 'In 5 steps, give me a guide on how to make a simple cake.';
21 | 
22 | $output = $generator($query, streamer: $streamer, maxNewTokens: 256, doSample: true, repetitionPenalty: 1.1, temperature: 0.7);
23 | 
24 | //dd($output);
25 | dd('Done', timeUsage(), memoryUsage());
26 | 


--------------------------------------------------------------------------------
/examples/pipelines/token-classification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | require_once './bootstrap.php';
 6 | 
 7 | use Codewithkyrian\Transformers\Generation\AggregationStrategy;
 8 | use function Codewithkyrian\Transformers\Pipelines\pipeline;
 9 | use function Codewithkyrian\Transformers\Utils\memoryUsage;
10 | use function Codewithkyrian\Transformers\Utils\timeUsage;
11 | 
12 | ini_set('memory_limit', -1);
13 | 
14 |  $classifier = pipeline('token-classification', 'Xenova/bert-base-NER');
15 | //$classifier = pipeline('token-classification', 'codewithkyrian/bert-english-uncased-finetuned-pos');
16 | 
17 | $output = $classifier(
18 |     'My name is Kyrian and I live in Nigeria',
19 |     aggregationStrategy: AggregationStrategy::FIRST
20 | );
21 | 
22 | dd($output, timeUsage(), memoryUsage());
23 | 


--------------------------------------------------------------------------------
/examples/pipelines/translation.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | require_once './bootstrap.php';
 6 | 
 7 | use Codewithkyrian\Transformers\Generation\Streamers\TextStreamer;
 8 | use function Codewithkyrian\Transformers\Pipelines\pipeline;
 9 | use function Codewithkyrian\Transformers\Utils\memoryUsage;
10 | use function Codewithkyrian\Transformers\Utils\timeUsage;
11 | 
12 | ini_set('memory_limit', -1);
13 | 
14 | //$translator = pipeline('translation', 'Xenova/m2m100_418M');
15 | $translator = pipeline('translation', 'Xenova/nllb-200-distilled-600M');
16 | 
17 | $streamer = TextStreamer::make();
18 | 
19 | //$output = $translator('生活就像一盒巧克力。', streamer: $streamer, tgtLang: 'en');
20 | $output = $translator('जीवन एक चॉकलेट बॉक्स की तरह है।', streamer: $streamer, tgtLang: 'fra_Latn');
21 | //$output = $translator('जीवन एक चॉकलेट बॉक्स की तरह है।', streamer: $streamer, tgtLang: 'fr');
22 | //$output = $translator('संयुक्त राष्ट्र के प्रमुख का कहना है कि सीरिया में कोई सैन्य समाधान नहीं है', streamer: $streamer, tgtLang: 'fr', maxNewTokens: 256);
23 | 
24 | dd("done", timeUsage(), memoryUsage());
25 | 


--------------------------------------------------------------------------------
/examples/pipelines/zero-shot-image-classification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | use function Codewithkyrian\Transformers\Pipelines\pipeline;
 6 | use function Codewithkyrian\Transformers\Utils\memoryUsage;
 7 | use function Codewithkyrian\Transformers\Utils\timeUsage;
 8 | 
 9 | require_once './bootstrap.php';
10 | 
11 | $classifier = pipeline('zero-shot-image-classification', 'Xenova/clip-vit-base-patch32');
12 | 
13 | $url = __DIR__. '/../images/tiger.jpg';
14 | 
15 | $output = $classifier($url, ['tiger', 'horse', 'dog']);
16 | 
17 | dd($output, timeUsage(), memoryUsage());
18 | 


--------------------------------------------------------------------------------
/examples/pipelines/zero-shot-object-detection.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\Pipelines;
 6 | 
 7 | use function Codewithkyrian\Transformers\Utils\memoryUsage;
 8 | use function Codewithkyrian\Transformers\Utils\timeUsage;
 9 | 
// Resolve the bootstrap relative to this file so the example runs from any working directory.
require_once __DIR__ . '/../bootstrap.php';

ini_set('memory_limit', '-1');

$detector = pipeline('zero-shot-object-detection', 'Xenova/owlvit-base-patch32');

$url = __DIR__ . '/../images/astronaut.png';
$candidateLabels = ['human face', 'rocket', 'helmet', 'american flag'];

//$url = __DIR__. '/../images/beach.png';
//$candidateLabels = ['hat', 'book', 'sunglasses', 'camera'];

$output = $detector($url, $candidateLabels, topK: 4, threshold: 0.05);

dd($output, timeUsage(), memoryUsage());


--------------------------------------------------------------------------------
/examples/tokenizers/apply-chat-template.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | use Codewithkyrian\Transformers\PreTrainedTokenizers\AutoTokenizer;
 6 | 
 7 | require_once './bootstrap.php';
 8 | 
 9 | $tokenizer = AutoTokenizer::fromPretrained('mistralai/Mistral-7B-Instruct-v0.1');
10 | //$tokenizer = AutoTokenizer::fromPretrained('facebook/blenderbot-400M-distill');
11 | $messages = [
12 |     ['role' => 'user', 'content' => 'Hello!'],
13 |     ['role' => 'assistant', 'content' => 'Hi! How are you?'],
14 |     ['role' => 'user', 'content' => 'I am doing great.'],
15 |     ['role' => 'assistant', 'content' => 'That is great to hear.'],
16 | ];
17 | 
18 | $text = $tokenizer->applyChatTemplate($messages, addGenerationPrompt: true, tokenize: false);
19 | 
20 | dd($text);
21 | 


--------------------------------------------------------------------------------
/libs/.gitignore:
--------------------------------------------------------------------------------
1 | /*
2 | !VERSIONS


--------------------------------------------------------------------------------
/phpunit.xml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="UTF-8"?>
 2 | <phpunit xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
 3 |          xsi:noNamespaceSchemaLocation="https://schema.phpunit.de/10.3/phpunit.xsd"
 4 |          bootstrap="vendor/autoload.php"
 5 |          colors="true"
 6 | >
 7 |     <testsuites>
 8 |         <testsuite name="Test Suite">
 9 |             <directory suffix="Test.php">./tests</directory>
10 |         </testsuite>
11 |     </testsuites>
12 |     <source>
13 |         <include>
14 |             <directory suffix=".php">./app</directory>
15 |             <directory suffix=".php">./src</directory>
16 |         </include>
17 |     </source>
18 | </phpunit>
19 | 


--------------------------------------------------------------------------------
/scripts/requirements.txt:
--------------------------------------------------------------------------------
1 | onnxruntime<1.16.0
2 | transformers[torch]==4.33.2
3 | optimum==1.13.2
4 | tqdm
5 | onnx==1.13
6 | 


--------------------------------------------------------------------------------
/src/DataStructures/CharTrieNode.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\DataStructures;
 7 | 
 8 | class CharTrieNode
 9 | {
10 | 
11 |     /**
12 |      * Create a new CharTrieNode.
13 |      * @param bool $isLeaf Whether the node is a leaf node or not.
14 |      * @param CharTrieNode[] $children A map containing the node's children, where the key is a character and the value is a `CharTrieNode`.
15 |      */
16 |     public function __construct(public bool $isLeaf, public array $children)
17 |     {
18 |     }
19 | 
20 |     /**
21 |      * Returns a new `CharTrieNode` instance with default values.
22 |      * @return CharTrieNode A new `CharTrieNode` instance with `isLeaf` set to `false` and an empty `children` map.
23 |      */
24 |     public static function default(): CharTrieNode
25 |     {
26 |         return new CharTrieNode(false, []);
27 |     }
28 | 
29 |     public function getChild(string $ch): CharTrieNode
30 |     {
31 |         $this->children[$ch] ??= CharTrieNode::default();
32 | 
33 |         return $this->children[$ch];
34 |     }
35 | }


--------------------------------------------------------------------------------
/src/DataStructures/TokenLatticeNode.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\DataStructures;
 7 | 
 8 | class TokenLatticeNode
 9 | {
10 |     /** @var TokenLatticeNode|null A reference to the previous node. */
11 |     public ?TokenLatticeNode $prev = null;
12 | 
13 |     /** @var float The backtrace score. */
14 |     public float $backtraceScore = 0.0;
15 | 
16 |     /**
17 |      * Represents a node in a token lattice for a given sentence.
18 |      * @param int $tokenId The ID of the token associated with this node.
19 |      * @param int $nodeId The ID of this node.
20 |      * @param int $pos The starting position of the token in the sentence.
21 |      * @param int $length The length of the token.
22 |      * @param float $score The score associated with the token.
23 |      */
24 |     public function __construct(
25 |         public ?int   $tokenId,
26 |         public int   $nodeId,
27 |         public int   $pos,
28 |         public int   $length,
29 |         public float $score)
30 |     {
31 |     }
32 | 
33 |     /**
34 |      * Returns a clone of this node.
35 |      * @return TokenLatticeNode A clone of this node.
36 |      */
37 |     public function clone(): TokenLatticeNode
38 |     {
39 |         $n = new TokenLatticeNode($this->tokenId, $this->nodeId, $this->pos, $this->length, $this->score);
40 |         $n->prev = $this->prev;
41 |         $n->backtraceScore = $this->backtraceScore;
42 |         return $n;
43 |     }
44 | }
45 | 


--------------------------------------------------------------------------------
/src/Decoders/BPEDecoder.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Decoders;
 7 | 
 8 | class BPEDecoder extends Decoder
 9 | {
10 |     protected string $suffix;
11 | 
12 |     /**
13 |      * @param array $config
14 |      */
15 |     public function __construct(array $config)
16 |     {
17 |         parent::__construct($config);
18 | 
19 |         $this->suffix = $config['suffix'];
20 |     }
21 | 
22 |     protected function decodeChain(array $tokens): array
23 |     {
24 |         return array_map(function (string $token, int $i) use ($tokens) {
25 |             return str_replace($this->suffix, ($i === count($tokens) - 1) ? '' : ' ', $token);
26 |         }, $tokens, array_keys($tokens));
27 |     }
28 | }


--------------------------------------------------------------------------------
/src/Decoders/DecoderSequence.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Decoders;
 7 | 
 8 | class DecoderSequence extends Decoder
 9 | {
10 |     /**
11 |      * @var array Decoder[]
12 |      */
13 |     protected array $decoders;
14 | 
15 |     /**
16 |      * @param array $config
17 |      */
18 |     public function __construct(array $config)
19 |     {
20 |         parent::__construct($config);
21 | 
22 |         $this->decoders = array_map(
23 |             fn(array $decoderConfig) => Decoder::fromConfig($decoderConfig),
24 |             $config['decoders']
25 |         );
26 |     }
27 | 
28 |     protected function decodeChain(array $tokens): array
29 |     {
30 |         return array_reduce(
31 |             $this->decoders,
32 |             fn(array $tokens, Decoder $decoder) => $decoder->decodeChain($tokens),
33 |             $tokens
34 |         );
35 |     }
36 | }


--------------------------------------------------------------------------------
/src/Decoders/FuseDecoder.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Decoders;
 7 | 
 8 | class FuseDecoder extends Decoder
 9 | {
10 | 
11 |     /**
12 |      * @param array $config
13 |      */
14 |     public function __construct(array $config)
15 |     {
16 |         parent::__construct($config);
17 |     }
18 | 
19 |     protected function decodeChain(array $tokens): array
20 |     {
21 |         return [implode('', $tokens)];
22 |     }
23 | }


--------------------------------------------------------------------------------
/src/Decoders/MetaspaceDecoder.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Decoders;
 7 | 
 8 | /**
 9 |  * MetaspaceDecoder class extends the Decoder class and decodes Metaspace tokenization.
10 |  */
11 | class MetaspaceDecoder extends Decoder
12 | {
13 |     /**
14 |      * Whether to add a prefix space to the decoded string.
15 |      */
16 |     protected bool $addPrefixSpace;
17 | 
18 |     /**
19 |      * The string to replace spaces with.
20 |      */
21 |     protected string $replacement;
22 | 
23 |     /**
24 |      * @param array $config
25 |      */
26 |     public function __construct(array $config)
27 |     {
28 |         parent::__construct($config);
29 | 
30 |         $this->addPrefixSpace = $config['add_prefix_space'] ?? false;
31 |         $this->replacement = $config['replacement'] ?? '';
32 |     }
33 | 
34 |     protected function decodeChain(array $tokens): array
35 |     {
36 |         $result = [];
37 | 
38 |         foreach ($tokens as $i => $token) {
39 |             $normalized = str_replace($this->replacement, ' ', $token);
40 | 
41 |             if ($this->addPrefixSpace && $i == 0 && str_starts_with($normalized, ' ')) {
42 |                 $normalized = substr($normalized, 1);
43 |             }
44 | 
45 |             $result[] = $normalized;
46 |         }
47 | 
48 |         return $result;
49 |     }
50 | }


--------------------------------------------------------------------------------
/src/Decoders/ReplaceDecoder.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\Decoders;
 6 | 
 7 | class ReplaceDecoder extends Decoder
 8 | {
 9 | 
10 |     /**
11 |      * @param array $config
12 |      */
13 |     public function __construct(array $config)
14 |     {
15 |         parent::__construct($config);
16 |     }
17 | 
18 |     protected function decodeChain(array $tokens): array
19 |     {
20 |         $pattern = $this->config['pattern'] ?? null;
21 | 
22 |         if ($pattern === null) {
23 |             return $tokens;
24 |         }
25 | 
26 |         $regex = $pattern['Regex'] ?? null;
27 |         $string = $pattern['String'] ?? null;
28 |         $replacement = $this->config['content'] ?? '';
29 | 
30 |         return array_map(function ($token) use ($regex, $string, $replacement) {
31 |             if ($regex !== null) {
32 |                 return preg_replace("/{$regex}/u", $replacement, (string)$token);
33 |             }
34 |             if ($string !== null) {
35 |                 return str_replace($string, $replacement, (string)$token);
36 |             }
37 |             return $token;
38 |         }, $tokens);
39 |     }
40 | }
41 | 


--------------------------------------------------------------------------------
/src/Decoders/StripDecoder.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Decoders;
 7 | 
 8 | class StripDecoder extends Decoder
 9 | {
10 |     protected string $content;
11 |     protected int $start;
12 |     protected int $stop;
13 | 
14 |     /**
15 |      * @param array $config
16 |      */
17 |     public function __construct(array $config)
18 |     {
19 |         parent::__construct($config);
20 | 
21 |         $this->content = $config['content'];
22 |         $this->start = $config['start'];
23 |         $this->stop = $config['stop'];
24 |     }
25 | 
26 |     protected function decodeChain(array $tokens): array
27 |     {
28 |         return array_map(function ($token) {
29 |             $startCut = 0;
30 |             for ($i = 0; $i < $this->start; ++$i) {
31 |                 $char = mb_substr($token, $i, 1);
32 |                 if ($char === $this->content) {
33 |                     $startCut = $i + 1;
34 |                     continue;
35 |                 } else {
36 |                     break;
37 |                 }
38 |             }
39 | 
40 |             $stopCut = mb_strlen($token);
41 |             for ($i = 0; $i < $this->stop; ++$i) {
42 |                 $index = mb_strlen($token) - $i - 1;
43 |                 if ($token[$index] ?? null === $this->content) {
44 |                     $stopCut = $index;
45 |                     continue;
46 |                 } else {
47 |                     break;
48 |                 }
49 |             }
50 | 
51 |             return mb_substr($token, $startCut, $stopCut - $startCut);
52 |         }, $tokens);
53 |     }
54 | }
55 | 


--------------------------------------------------------------------------------
/src/Decoders/VitsDecoder.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\Decoders;
 6 | 
 7 | class VitsDecoder extends Decoder
 8 | {
 9 | 
10 |     protected function decodeChain(array $tokens): array
11 |     {
12 |         $decoded = '';
13 | 
14 |         for ($i = 1; $i < count($tokens); $i += 2) {
15 |             $decoded .= $tokens[$i];
16 |         }
17 | 
18 |         return [$decoded];
19 |     }
20 | }
21 | 


--------------------------------------------------------------------------------
/src/Decoders/WordPieceDecoder.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Decoders;
 7 | 
 8 | use Codewithkyrian\Transformers\Tokenizers\TokenizerModel;
 9 | 
/**
 * Decoder for WordPiece tokens: continuation pieces lose their prefix and are
 * glued to the previous piece, all other pieces are separated by a space.
 */
class WordPieceDecoder extends Decoder
{

    /** Whether each decoded piece is passed through TokenizerModel::cleanUpTokenization(). */
    protected bool $cleanup;

    /**
     * @param array $config Decoder configuration; must provide `cleanup`. The `prefix`
     *                      entry is read while decoding.
     */
    public function __construct(array $config)
    {
        parent::__construct($config);
        $this->cleanup = $config['cleanup'];
    }

    /**
     * Decodes the WordPiece tokens.
     *
     * @param array $tokens The tokens to decode.
     * @return array The decoded pieces, re-indexed from 0.
     */
    protected function decodeChain(array $tokens): array
    {
        $decodedTokens = [];

        foreach ($tokens as $i => $token) {
            // The token at key 0 is emitted as-is: no prefix handling, no leading space.
            if ($i !== 0) {
                $prefix = $this->config['prefix'];

                if (str_starts_with((string)$token, $prefix)) {
                    // Remove only the leading prefix; later occurrences inside the
                    // token are part of its text and must be preserved.
                    $token = substr((string)$token, strlen($prefix));
                } else {
                    $token = ' ' . $token;
                }
            }

            if ($this->cleanup) {
                $token = TokenizerModel::cleanUpTokenization($token);
            }

            $decodedTokens[] = $token;
        }

        return $decodedTokens;
    }
}
43 | 


--------------------------------------------------------------------------------
/src/Exceptions/HubException.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Exceptions;
 7 | 
/**
 * Exception carrying a caller-supplied message; part of the library's
 * TransformersException family.
 *
 * NOTE(review): the name suggests it is raised for model-hub failures — confirm at the throw sites.
 */
class HubException extends \Exception implements TransformersException
{
    /**
     * Named constructor.
     *
     * @param string $message The exception message, used verbatim.
     * @return self
     */
    public static function make(string $message): self
    {
        return new self($message);
    }

}


--------------------------------------------------------------------------------
/src/Exceptions/MissingModelInputException.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Exceptions;
 7 | 
 8 | class MissingModelInputException extends \Exception implements TransformersException
 9 | {
10 |     public static function make(array $missingInputs): self
11 |     {
12 |         $inputs = implode("\n", $missingInputs);
13 |         return new self("The following model inputs are missing:\n$inputs");
14 |     }
15 | 
16 | }


--------------------------------------------------------------------------------
/src/Exceptions/ModelExecutionException.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Exceptions;
 7 | 
 8 | class ModelExecutionException extends \Exception implements TransformersException
 9 | {
10 | public static function make(string $message): self
11 |     {
12 |         return new self("An error occurred during model execution: $message");
13 |     }
14 | }


--------------------------------------------------------------------------------
/src/Exceptions/TemplateParseException.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Exceptions;
 7 | 
 8 | class TemplateParseException extends \Exception implements TransformersException
 9 | {
10 |     public static function undefinedVariable($variableName): TemplateParseException
11 |     {
12 |         return new self("Undefined variable:  $variableName");
13 |     }
14 | }


--------------------------------------------------------------------------------
/src/Exceptions/TransformersException.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\Exceptions;
 6 | 
/**
 * Marker interface implemented by the library's exception classes, which lets
 * callers catch all of them through a single type. It declares no methods.
 */
interface TransformersException
{

}


--------------------------------------------------------------------------------
/src/Exceptions/UnsupportedModelTypeException.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Exceptions;
 7 | 
 8 | class UnsupportedModelTypeException extends \Exception implements TransformersException
 9 | {
10 |     public static function make(string $modelType): self
11 |     {
12 |         return new self("The model type `$modelType` is not supported for this task. Please check for typos or refer to the documentation for the list of supported model types.");
13 |     }
14 | }


--------------------------------------------------------------------------------
/src/Exceptions/UnsupportedTaskException.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Exceptions;
 7 | 
 8 | class UnsupportedTaskException extends \Exception implements TransformersException
 9 | {
10 |     public static function make(string $task): self
11 |     {
12 |         return new self("The task `$task` is not supported. Please check for typos or refer to the documentation for the list of supported tasks.");
13 |     }
14 | }


--------------------------------------------------------------------------------
/src/FFI/Libc.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\FFI;
 6 | 
 7 | use FFI;
 8 | use FFI\CData;
 9 | use RuntimeException;
10 | 
/**
 * Small static wrapper around a lazily created FFI instance, offering helpers
 * for allocating C data and converting PHP strings to C strings.
 */
class Libc
{
    /** Shared FFI instance; left uninitialized until ffi() is first called. */
    protected static FFI $ffi;

    /**
     * Returns the hard-coded version string of this wrapper.
     */
    public static function version(): string
    {
        return '1.0.0';
    }


    /**
     * Returns the shared FFI instance, creating it on first use.
     *
     * On Windows the instance declares `mbstowcs` and binds it to `msvcrt.dll`.
     * On every other OS family an FFI instance with no declarations is created,
     * so only type allocation is available there.
     *
     * @return FFI The FFI instance.
     */
    protected static function ffi(): FFI
    {
        if (!isset(self::$ffi)) {
            self::$ffi = match (PHP_OS_FAMILY) {
                'Windows' => FFI::cdef(
                    "\nsize_t mbstowcs(void *wcstr, const char *mbstr, size_t count);",
                    'msvcrt.dll'
                ),
                default => FFI::cdef()
            };
        }

        return self::$ffi;
    }

    /**
     * Allocates a C data structure through the shared FFI instance.
     *
     * @param mixed $type       The C type to allocate; forwarded unchanged to FFI::new().
     * @param bool  $owned      Forwarded to FFI::new(); per the FFI docs, unowned data must be freed manually.
     * @param bool  $persistent Forwarded to FFI::new().
     * @return CData|null The allocated data.
     */
    public static function new($type, bool $owned = true, bool $persistent = false): ?CData
    {
        return self::ffi()->new($type, $owned, $persistent);
    }

    /**
     * Converts a multibyte string into the given wide-character buffer via `mbstowcs`.
     *
     * NOTE(review): `mbstowcs` is only declared on Windows (see ffi()), so this
     * presumably cannot be called on other platforms — confirm with the callers.
     * NOTE(review): the check compares the returned character count with the byte
     * length of the input, which may differ for multibyte input — confirm.
     *
     * @param CData  $wcStr Destination buffer.
     * @param string $mbStr Source string.
     * @param int    $count Value passed as the `count` argument of `mbstowcs`.
     * @return CData The destination buffer that was passed in.
     * @throws RuntimeException When `mbstowcs` does not return strlen($mbStr).
     */
    public static function mbStringToWcString(CData $wcStr, string $mbStr, int $count): CData
    {
        $length = self::ffi()->mbstowcs($wcStr, $mbStr, $count);

        if ($length != strlen($mbStr)) {
            throw new RuntimeException('Expected mbstowcs to return '.strlen($mbStr).", got $length");
        }

        return $wcStr;
    }

    /**
     * Copies a PHP string into a newly allocated, NUL-terminated C char array.
     *
     * @param mixed $str The string to copy.
     * @return CData A `char[strlen($str) + 1]` holding the bytes of $str followed by "\0".
     */
    public static function cstring($str): CData
    {
        // One extra byte for the terminating NUL.
        $bytes = strlen($str) + 1;
        // TODO fix? The array is allocated unowned and nothing in this method frees it,
        // so releasing it is left to the caller.
        $ptr = self::new("char[$bytes]", owned: false);
        FFI::memcpy($ptr, $str, $bytes - 1);
        $ptr[$bytes - 1] = "\0";

        return $ptr;
    }
}


--------------------------------------------------------------------------------
/src/FeatureExtractors/FeatureExtractor.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\FeatureExtractors;
 7 | 
 8 | /**
 9 |  * Base class for feature extractors.
10 |  */
11 | class FeatureExtractor
12 | {
13 |     public function __construct(public array $config)
14 |     {
15 |     }
16 | }


--------------------------------------------------------------------------------
/src/FeatureExtractors/OwlViTFeatureExtractor.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\FeatureExtractors;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\ObjectDetectionOutput;
 9 | use Codewithkyrian\Transformers\Processors\Processor;
10 | 
/**
 * Image feature extractor that adds an object-detection post-processing entry
 * point, delegating the work to Processor::postProcessObjectDetection().
 */
class OwlViTFeatureExtractor extends ImageFeatureExtractor
{
    /**
     * Post-processes the outputs of the model (for object detection).
     *
     * All arguments are forwarded unchanged to Processor::postProcessObjectDetection().
     *
     * @param ObjectDetectionOutput $outputs The outputs of the model that must be post-processed
     * @param float $threshold The threshold to use for the scores.
     * @param array|null $targetSizes The sizes of the original images.
     * @param bool $isZeroShot Whether zero-shot object detection was performed.
     * @return array An array of objects containing the post-processed outputs.
     */
    public function postProcessObjectDetection(ObjectDetectionOutput $outputs, float $threshold = 0.5, ?array $targetSizes = null, bool $isZeroShot = false): array
    {
        return Processor::postProcessObjectDetection($outputs, $threshold, $targetSizes, $isZeroShot);
    }
}


--------------------------------------------------------------------------------
/src/FeatureExtractors/Owlv2ImageProcessor.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\FeatureExtractors;
 7 | 
/**
 * Image processor that adds nothing of its own; all behaviour is inherited
 * from OwlViTFeatureExtractor.
 */
class Owlv2ImageProcessor extends OwlViTFeatureExtractor
{

}


--------------------------------------------------------------------------------
/src/FeatureExtractors/Swin2SRImageProcessor.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\FeatureExtractors;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | 
/**
 * Image processor whose padding step grows an image so that its width and
 * height become multiples of a window size.
 */
class Swin2SRImageProcessor extends ImageFeatureExtractor
{
    /**
     * Pads the image so that both spatial dimensions are multiples of `$padSize`.
     *
     * Here `$padSize` is the size of the sliding window used for local attention,
     * not a target size. The `$mode`, `$center` and `$constantValues` arguments are
     * accepted for signature compatibility but not used: the parent is always
     * called with symmetric, non-centred padding and a constant value of -1.
     *
     * NOTE(review): the arithmetic below only works for an integer `$padSize`,
     * although the signature also admits an array — confirm callers pass an int.
     *
     * @param Tensor    $imageTensor    The image to pad.
     * @param int|array $padSize        The window size the dimensions are rounded up to.
     * @param string    $tensorFormat   Axis layout of the tensor: 'CHW' or 'HWC'.
     * @param string    $mode           Unused.
     * @param bool      $center         Unused.
     * @param int       $constantValues Unused.
     * @return Tensor The padded image as returned by the parent implementation.
     */
    public function padImage(
        Tensor    $imageTensor,
        int|array $padSize,
        string    $tensorFormat = 'CHW', // 'HWC' or 'CHW'
        string    $mode = 'constant',
        bool      $center = false,
        int       $constantValues = 0
    ): Tensor
    {
        // Height and width sit at offsets 1 and 2 for 'CHW', and 0 and 1 otherwise.
        $shape = $imageTensor->shape();
        $heightAxis = $tensorFormat === 'CHW' ? 1 : 0;
        $imageHeight = $shape[$heightAxis];
        $imageWidth = $shape[$heightAxis + 1];

        // NOTE: The original python implementation of Swin2SR adds padding even when a dimension is
        // already a multiple of `pad_size`, which is most likely a bug
        // (PR: https://github.com/mv-lab/swin2sr/pull/19). Padding is therefore only added when the
        // dimension is not already a multiple: the outer modulo turns a full window into zero.
        $roundUpToWindow = static fn ($length) => $length + ($padSize - $length % $padSize) % $padSize;

        $paddedSize = [
            'width' => $roundUpToWindow($imageWidth),
            'height' => $roundUpToWindow($imageHeight),
        ];

        return parent::padImage($imageTensor, $paddedSize, $tensorFormat, 'symmetric', false, -1);
    }
}


--------------------------------------------------------------------------------
/src/FeatureExtractors/ViTFeatureExtractor.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\FeatureExtractors;
 7 | 
/**
 * Feature extractor that adds nothing of its own; all behaviour is inherited
 * from ImageFeatureExtractor.
 */
class ViTFeatureExtractor extends ImageFeatureExtractor
{

}


--------------------------------------------------------------------------------
/src/FeatureExtractors/Wav2Vec2FeatureExtractor.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\FeatureExtractors;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | use function Codewithkyrian\Transformers\Utils\timeUsage;
10 | 
/**
 * Feature extractor that optionally normalizes a waveform and packages it as
 * model inputs.
 */
class Wav2Vec2FeatureExtractor extends FeatureExtractor
{
    /**
     * Turns a waveform into the `input_values` / `attention_mask` pair.
     *
     * When the `do_normalize` config entry is truthy, the waveform is shifted to
     * zero mean and scaled to unit variance first.
     *
     * @param Tensor $waveform The audio tensor to extract features from; it is indexed
     *                         with a single integer, so it is presumably one-dimensional.
     * @return Tensor[] `input_values` (the waveform reshaped to [1, size]) and
     *                  `attention_mask` (int64 ones of the same shape).
     */
    public function __invoke(Tensor $waveform): array
    {
        if ($this->config['do_normalize']) {
            $mean = $waveform->mean();
            $sampleCount = $waveform->size();

            // Population variance: the mean of the squared deviations from the mean.
            $variance = 0;
            for ($sample = 0; $sample < $sampleCount; $sample++) {
                $deviation = $waveform[$sample] - $mean;
                $variance += $deviation ** 2;
            }
            $variance /= $sampleCount;

            // The small epsilon keeps the division finite for a constant signal.
            $scale = 1.0 / sqrt($variance + 1e-7);
            $waveform = $waveform->add(-$mean)->multiply($scale);
        }

        $batchedShape = [1, $waveform->size()];

        return [
            'input_values' => $waveform->reshape($batchedShape),
            'attention_mask' => Tensor::ones($batchedShape, dtype: Tensor::int64)
        ];
    }
}


--------------------------------------------------------------------------------
/src/Generation/AggregationStrategy.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Generation;
 7 | 
/**
 * String-backed enum naming the available aggregation strategies.
 *
 * NOTE(review): presumably selects how sub-token predictions are merged in
 * token classification — confirm at the usage sites.
 */
enum AggregationStrategy: string
{
    case NONE = 'none';
    case FIRST = 'first';
    case AVERAGE = 'average';
    case MAX = 'max';
}
15 | 


--------------------------------------------------------------------------------
/src/Generation/LogitsProcessors/BadWordsLogitsProcessor.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Generation\LogitsProcessors;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | 
/**
 * Logits processor that prevents configured token sequences ("bad words") from
 * being completed.
 */
class BadWordsLogitsProcessor extends LogitsProcessor
{

    /** The banned token-id sequences, one array of ids per bad word. */
    protected array $badWordsIds;

    /** End-of-sequence token ids, always stored as an array. */
    protected int|array $eosTokenId;

    /**
     * @param array     $badWordsIds The banned token-id sequences.
     * @param int|array $eosTokenId  The ID/IDs of the end-of-sequence token.
     */
    public function __construct(array $badWordsIds, $eosTokenId)
    {
        $this->badWordsIds = $badWordsIds;
        $this->eosTokenId = is_array($eosTokenId) ? $eosTokenId : [$eosTokenId];
    }

    /**
     * Sets the logit of a bad word's final token to -INF whenever the sequence
     * generated so far ends with all the tokens that precede it.
     *
     * A single-token bad word has no preceding tokens and is therefore always banned.
     *
     * @param array  $inputIds The token IDs generated so far.
     * @param Tensor $logits   The logits to process (modified in place).
     * @return Tensor The processed logits.
     */
    public function __invoke(array $inputIds, Tensor $logits): Tensor
    {
        $inputLength = count($inputIds);

        foreach ($this->badWordsIds as $badWordIds) {
            // An empty sequence has no final token to ban.
            if (count($badWordIds) === 0) {
                continue;
            }

            $bannedTokenId = array_pop($badWordIds);
            $prefix = array_values($badWordIds);
            $prefixLength = count($prefix);

            // The input is too short to end with this prefix, so the bad word
            // cannot be completed by the next token.
            if ($prefixLength > $inputLength) {
                continue;
            }

            // array_slice() with a zero offset would return the whole input, so the
            // empty prefix is handled explicitly.
            if ($prefixLength === 0 || array_slice($inputIds, -$prefixLength) === $prefix) {
                $logits->buffer()[$bannedTokenId] = -INF;
            }
        }

        return $logits;
    }
}


--------------------------------------------------------------------------------
/src/Generation/LogitsProcessors/ForceTokensLogitsProcessor.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Generation\LogitsProcessors;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | use function Codewithkyrian\Transformers\Utils\timeUsage;
10 | 
/**
 * Logits processor that forces specific tokens at specific sequence lengths.
 */
class ForceTokensLogitsProcessor extends LogitsProcessor
{

    /** @var array Mapping of input lengths to forced token IDs */
    protected array $forceTokenMap;

    /**
     * @param array $forcedDecoderIds A list of [length, tokenId] pairs.
     */
    public function __construct(array $forcedDecoderIds)
    {
        // Index the token ids (column 1) by the sequence length (column 0).
        $this->forceTokenMap = array_column($forcedDecoderIds, 1, 0);
    }

    /**
     * Apply the processor to the input logits.
     *
     * If a token is registered for the current sequence length, every logit is
     * set to -INF except that token's, which is set to 0.
     *
     * @param array  $inputIds The token IDs generated so far.
     * @param Tensor $logits   The logits to process (modified in place).
     * @return Tensor The processed logits.
     */
    public function __invoke(array $inputIds, Tensor $logits): Tensor
    {
        $forcedTokenId = $this->forceTokenMap[count($inputIds)] ?? null;

        // Compare against null explicitly: token id 0 is a valid id and must still be forced.
        if ($forcedTokenId !== null) {
            Tensor::mo()->la()->fill(-INF, $logits);

            $logits->buffer()[$forcedTokenId] = 0;
        }

        return $logits;
    }
}


--------------------------------------------------------------------------------
/src/Generation/LogitsProcessors/ForcedBOSTokenLogitsProcessor.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Generation\LogitsProcessors;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | 
/**
 * Logits processor that makes the beginning-of-sequence token the only possible
 * choice for the first generated token.
 */
class ForcedBOSTokenLogitsProcessor extends LogitsProcessor
{
    /** The token id that is forced. */
    protected int $bosTokenId;

    /**
     * @param int $bosTokenId The ID of the beginning-of-sequence token.
     */
    public function __construct(int $bosTokenId)
    {
        $this->bosTokenId = $bosTokenId;
    }

    /**
     * When exactly one input id is present, sets every logit to -INF except the
     * BOS token's, which is set to 0. Otherwise the logits are returned untouched.
     *
     * @param array  $inputIds The token IDs generated so far.
     * @param Tensor $logits   The logits to process (modified in place).
     * @return Tensor The processed logits.
     */
    public function __invoke(array $inputIds, Tensor $logits): Tensor
    {
        if (count($inputIds) !== 1) {
            return $logits;
        }

        Tensor::mo()->la()->fill(-INF, $logits);
        $logits->buffer()[$this->bosTokenId] = 0;

        return $logits;
    }
}


--------------------------------------------------------------------------------
/src/Generation/LogitsProcessors/ForcedEOSTokenLogitsProcessor.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Generation\LogitsProcessors;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | 
/**
 * Logits processor that makes the end-of-sequence token the only possible
 * choice once the sequence has reached the maximum length.
 */
class ForcedEOSTokenLogitsProcessor extends LogitsProcessor
{
    /**
     * @param int $maxLength        The sequence length from which the EOS token is forced.
     * @param int $forcedEosTokenId The ID of the token to force.
     */
    public function __construct(
        protected int $maxLength,
        protected int $forcedEosTokenId
    )
    {
    }

    /**
     * When the number of input ids is at least `maxLength`, sets every logit to
     * -INF except the forced EOS token's, which is set to 0.
     *
     * @param array  $inputIds The token IDs generated so far.
     * @param Tensor $logits   The logits to process (modified in place).
     * @return Tensor The processed logits.
     */
    public function __invoke(array $inputIds, Tensor $logits): Tensor
    {
        $belowLimit = count($inputIds) < $this->maxLength;
        if ($belowLimit) {
            return $logits;
        }

        Tensor::mo()->la()->fill(-INF, $logits);
        $logits->buffer()[$this->forcedEosTokenId] = 0;

        return $logits;
    }
}


--------------------------------------------------------------------------------
/src/Generation/LogitsProcessors/LogitsProcessor.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Generation\LogitsProcessors;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | 
/**
 * Base class for logits processors: invokable objects that receive the ids of
 * the sequence so far together with the logits and return the processed logits.
 */
abstract class LogitsProcessor
{
    /**
     * Abstract method to apply the processor to input logits.
     *
     * @param array $inputIds The input IDs. NOTE(review): implementations count this array
     *                        and use its elements as token ids — confirm the element type with the caller.
     * @param Tensor $logits The logits to process.
     * @return Tensor The processed logits.
     */
    abstract public function __invoke(array $inputIds, Tensor $logits): Tensor;
}


--------------------------------------------------------------------------------
/src/Generation/LogitsProcessors/MinLengthLogitsProcessor.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Generation\LogitsProcessors;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | 
/**
 * Logits processor that blocks the end-of-sequence token until the sequence
 * has reached a minimum length.
 */
class MinLengthLogitsProcessor extends LogitsProcessor
{

    /**
     * @param int $minLength The minimum length below which the score of `eos_token_id` is set to negative infinity.
     * @param int|array $eosTokenId The ID/IDs of the end-of-sequence token; a single id is wrapped in an array.
     */
    public function __construct(
        protected int $minLength,
        protected int|array $eosTokenId,
    )
    {
        $this->eosTokenId = is_array($eosTokenId) ? $eosTokenId : [$eosTokenId];
    }

    /**
     * Sets the logit of every EOS token to -INF while fewer than `minLength`
     * input ids are present.
     *
     * @param array  $inputIds The token IDs generated so far.
     * @param Tensor $logits   The logits to process (modified in place).
     * @return Tensor The processed logits.
     */
    public function __invoke(array $inputIds, Tensor $logits): Tensor
    {
        if (count($inputIds) >= $this->minLength) {
            return $logits;
        }

        foreach ($this->eosTokenId as $eosId) {
            $logits->buffer()[$eosId] = -INF;
        }

        return $logits;
    }
}


--------------------------------------------------------------------------------
/src/Generation/LogitsProcessors/MinNewTokensLengthLogitsProcessor.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Generation\LogitsProcessors;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | 
/**
 * Logits processor that blocks the end-of-sequence token until a minimum number
 * of new tokens (not counting the prompt) has been produced.
 */
class MinNewTokensLengthLogitsProcessor extends LogitsProcessor
{

    /**
     * @param int       $promptLengthToSkip Number of leading input ids that do not count as new tokens.
     * @param int       $minNewTokens       Minimum number of new tokens before EOS is allowed.
     * @param int|array $eosTokenId         The ID/IDs of the end-of-sequence token; a single id is wrapped in an array.
     */
    public function __construct(
        protected int $promptLengthToSkip,
        protected int $minNewTokens,
        protected int|array $eosTokenId,
    )
    {
        if (!is_array($eosTokenId)) {
            $this->eosTokenId = [$eosTokenId];
        }
    }

    /**
     * Sets the logit of every EOS token to -INF while the number of new tokens is
     * below `minNewTokens`.
     *
     * @param array  $inputIds The token IDs generated so far.
     * @param Tensor $logits   The logits to process (modified in place).
     * @return Tensor The processed logits.
     */
    public function __invoke(array $inputIds, Tensor $logits): Tensor
    {
        $generatedCount = count($inputIds) - $this->promptLengthToSkip;

        if ($generatedCount >= $this->minNewTokens) {
            return $logits;
        }

        foreach ($this->eosTokenId as $eosId) {
            $logits->buffer()[$eosId] = -INF;
        }

        return $logits;
    }
}


--------------------------------------------------------------------------------
/src/Generation/LogitsProcessors/RepetitionPenaltyLogitsProcessor.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Generation\LogitsProcessors;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | 
/**
 * Logits processor that lowers the score of tokens already present in the sequence.
 */
class RepetitionPenaltyLogitsProcessor extends LogitsProcessor
{
    /**
     * @param float $penalty The factor applied to the logit of each already-seen token.
     */
    public function __construct(protected float $penalty)
    {
    }

    /**
     * Applies the penalty once per occurrence of each input id, so tokens that
     * appear many times are penalised more.
     *
     * Negative logits are multiplied by the penalty and non-negative logits are
     * divided by it.
     *
     * @param array  $inputIds The token IDs generated so far.
     * @param Tensor $logits   The logits to process (modified in place).
     * @return Tensor The processed logits.
     */
    public function __invoke(array $inputIds, Tensor $logits): Tensor
    {
        foreach ($inputIds as $tokenId) {
            $current = $logits->buffer()[$tokenId];

            $logits->buffer()[$tokenId] = $current < 0
                ? $current * $this->penalty
                : $current / $this->penalty;
        }

        return $logits;
    }
}


--------------------------------------------------------------------------------
/src/Generation/LogitsProcessors/SuppressTokensAtBeginLogitsProcessor.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Generation\LogitsProcessors;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | 
/**
 * A LogitsProcessor that suppresses a list of tokens at the moment generation
 * starts, i.e. when the sequence holds exactly `begin_index` tokens. This ensures
 * that the tokens in `begin_suppress_tokens` are not sampled at the beginning of
 * the generation process.
 */
class SuppressTokensAtBeginLogitsProcessor extends LogitsProcessor
{
    /**
     * @param array $beginSuppressTokens The token ids to suppress.
     * @param int   $beginIndex          The sequence length at which the suppression applies.
     */
    public function __construct(
        protected array $beginSuppressTokens,
        protected int   $beginIndex = 0
    )
    {
    }

    /**
     * Sets the logit of every suppressed token to -INF when the number of input
     * ids equals `beginIndex`; otherwise leaves the logits untouched.
     *
     * @param array  $inputIds The token IDs generated so far.
     * @param Tensor $logits   The logits to process (modified in place).
     * @return Tensor The processed logits.
     */
    public function __invoke(array $inputIds, Tensor $logits): Tensor
    {
        if (count($inputIds) !== $this->beginIndex) {
            return $logits;
        }

        foreach ($this->beginSuppressTokens as $suppressedId) {
            $logits->buffer()[$suppressedId] = -INF;
        }

        return $logits;
    }
}


--------------------------------------------------------------------------------
/src/Generation/Samplers/BeamSearchSampler.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Generation\Samplers;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | 
/**
 * Sampler that returns the highest-scoring candidates for beam search.
 */
class BeamSearchSampler extends Sampler
{

    /**
     * Picks `num_beams` candidates from the top-k logits of the requested position.
     *
     * The candidate pool size is `top_k` capped at the vocabulary size, or the
     * whole vocabulary when `top_k` is not positive. Scores are log-probabilities
     * of a softmax taken over that pool only.
     *
     * @param Tensor $logits The logits to sample from.
     * @param int $index The position whose logits are used.
     * @return array A list of [token id, score] pairs, one per beam.
     */
    public function sample(Tensor $logits, int $index): array
    {
        $vocabSize = $logits->shape()[$logits->ndim() - 1];

        // A non-positive top_k means "consider the whole vocabulary".
        $topK = $this->generationConfig->top_k;
        if ($topK > 0) {
            $poolSize = min($topK, $vocabSize);
        } else {
            $poolSize = $vocabSize;
        }

        $positionLogits = $this->getLogits($logits, $index);
        [$topLogits, $topIndices] = $positionLogits->topk($poolSize);

        $probabilities = $topLogits->softmax()->toArray();

        $beamCount = $this->generationConfig->num_beams;
        $candidates = [];
        for ($beam = 0; $beam < $beamCount; $beam++) {
            $tokenId = $topIndices[$beam];
            $score = log($probabilities[$beam]);

            $candidates[] = [$tokenId, $score];
        }

        return $candidates;
    }
}


--------------------------------------------------------------------------------
/src/Generation/Samplers/GreedySampler.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Generation\Samplers;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | 
10 | /**
11 |  * Sampler that always picks the arg-max of the selected logits.
12 |  */
13 | class GreedySampler extends Sampler
14 | {
15 |     /**
16 |      * Pick the arg-max of the logits selected for $index.
17 |      *
18 |      * No log-softmax is applied, because only the position of the maximum matters.
19 |      *
20 |      * @param Tensor $logits
21 |      * @param int $index Passed to getLogits() to select the logits to inspect.
22 |      * @return array A list with one [argMax result, 0] pair. The score is a placeholder:
23 |      *               greedy search treats the choice as p = 1, so log(p) = 0.
24 |      */
25 |     public function sample(Tensor $logits, int $index): array
26 |     {
27 |         $bestToken = $this->getLogits($logits, $index)->argMax();
28 | 
29 |         return [[$bestToken, 0]];
30 |     }
31 | }


--------------------------------------------------------------------------------
/src/Generation/Samplers/MultinomialSampler.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Generation\Samplers;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | 
10 | /**
11 |  * Sampler that draws tokens at random from the top-k distribution.
12 |  */
13 | class MultinomialSampler extends Sampler
14 | {
15 |     /**
16 |      * Draw num_beams tokens from the softmax over the top-k logits.
17 |      *
18 |      * top_k comes from the generation config, capped at the vocabulary size; the
19 |      * whole vocabulary is used when top_k is not positive. Every draw calls
20 |      * randomSelect() on the same, unmodified probabilities.
21 |      *
22 |      * @param Tensor $logits Logits; the size of the last dimension is used as the vocabulary size.
23 |      * @param int $index Passed to getLogits() to select the logits to sample from.
24 |      * @return array List of num_beams [token id, log-probability] pairs.
25 |      */
26 |     public function sample(Tensor $logits, int $index): array
27 |     {
28 |         $vocabSize = $logits->shape()[$logits->ndim() - 1];
29 |         $topK = $this->generationConfig->top_k;
30 |         $k = $topK > 0 ? min($topK, $vocabSize) : $vocabSize;
31 | 
32 |         [$topLogits, $topIndices] = $this->getLogits($logits, $index)->topk($k);
33 |         $probabilities = $topLogits->softmax()->toArray();
34 | 
35 |         $sampledResults = [];
36 |         for ($draw = 0; $draw < $this->generationConfig->num_beams; $draw++) {
37 |             $picked = $this->randomSelect($probabilities);
38 |             $sampledResults[] = [$topIndices[$picked], log($probabilities[$picked])];
39 |         }
40 | 
41 |         return $sampledResults;
42 |     }
43 | }


--------------------------------------------------------------------------------
/src/Generation/Streamers/StdOutStreamer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Generation\Streamers;
 7 | 
 8 | /**
 9 |  * TextStreamer subclass that declares no members of its own.
10 |  */
11 | class StdOutStreamer extends TextStreamer {}


--------------------------------------------------------------------------------
/src/Generation/Streamers/StreamMode.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Generation\Streamers;
 7 | 
 8 | /**
 9 |  * Streaming modes: a pure (non-backed) enum with two cases.
10 |  *
11 |  * NOTE(review): presumably selects between emitting the whole text so far and
12 |  * only the newly produced part — confirm against the streamer classes.
13 |  */
14 | enum StreamMode
15 | {
16 |     case FULL;
17 |     case PARTIAL;
18 | }
19 | 


--------------------------------------------------------------------------------
/src/Models/Auto/AutoModelForAudioClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Auto;
 7 | 
 8 | /**
 9 |  * Class-name lookup tables for AutoModelForAudioClassification.
10 |  */
11 | class AutoModelForAudioClassification extends PretrainedMixin
12 | {
13 |     /** String key => audio classification model class name. */
14 |     public const MODEL_CLASS_MAPPING = [
15 |         'audio-spectrogram-transformer' => \Codewithkyrian\Transformers\Models\Pretrained\ASTForAudioClassification::class,
16 |         'wav2vec2' => \Codewithkyrian\Transformers\Models\Pretrained\Wav2Vec2ForSequenceClassification::class,
17 |     ];
18 | 
19 |     /** Every mapping table of this class, in listed order. */
20 |     public const MODEL_CLASS_MAPPINGS = [self::MODEL_CLASS_MAPPING];
21 | }


--------------------------------------------------------------------------------
/src/Models/Auto/AutoModelForCTC.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Auto;
 7 | 
 8 | /**
 9 |  * Class-name lookup tables for AutoModelForCTC.
10 |  */
11 | class AutoModelForCTC extends PretrainedMixin
12 | {
13 |     /** String key => CTC model class name. */
14 |     public const MODEL_CLASS_MAPPING = [
15 |         'wav2vec2' => \Codewithkyrian\Transformers\Models\Pretrained\Wav2Vec2ForCTC::class,
16 |     ];
17 | 
18 |     /** Every mapping table of this class, in listed order. */
19 |     public const MODEL_CLASS_MAPPINGS = [self::MODEL_CLASS_MAPPING];
20 | }


--------------------------------------------------------------------------------
/src/Models/Auto/AutoModelForCausalLM.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Auto;
 7 | 
 8 | /**
 9 |  * Class-name lookup tables for AutoModelForCausalLM.
10 |  */
11 | class AutoModelForCausalLM extends PretrainedMixin
12 | {
13 |     /** String key => causal language model class name. */
14 |     public const MODEL_CLASS_MAPPING = [
15 |         'gpt2' => \Codewithkyrian\Transformers\Models\Pretrained\GPT2LMHeadModel::class,
16 |         'gptj' => \Codewithkyrian\Transformers\Models\Pretrained\GPTJForCausalLM::class,
17 |         'gpt_bigcode' => \Codewithkyrian\Transformers\Models\Pretrained\GPTBigCodeForCausalLM::class,
18 |         'codegen' => \Codewithkyrian\Transformers\Models\Pretrained\CodeGenForCausalLM::class,
19 |         'llama' => \Codewithkyrian\Transformers\Models\Pretrained\LlamaForCausalLM::class,
20 |         'trocr' => \Codewithkyrian\Transformers\Models\Pretrained\TrOCRForCausalLM::class,
21 |         'qwen2' => \Codewithkyrian\Transformers\Models\Pretrained\Qwen2ForCausalLM::class,
22 |     ];
23 | 
24 |     /** Every mapping table of this class, in listed order. */
25 |     public const MODEL_CLASS_MAPPINGS = [self::MODEL_CLASS_MAPPING];
26 | }


--------------------------------------------------------------------------------
/src/Models/Auto/AutoModelForImageClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Auto;
 7 | 
 8 | /**
 9 |  * Class-name lookup tables for AutoModelForImageClassification.
10 |  */
11 | class AutoModelForImageClassification extends PretrainedMixin
12 | {
13 |     /** String key => image classification model class name. */
14 |     public const MODEL_CLASS_MAPPING = [
15 |         'vit' => \Codewithkyrian\Transformers\Models\Pretrained\ViTForImageClassification::class,
16 |         'deit' => \Codewithkyrian\Transformers\Models\Pretrained\DeiTForImageClassification::class,
17 |     ];
18 | 
19 |     /** Every mapping table of this class, in listed order. */
20 |     public const MODEL_CLASS_MAPPINGS = [self::MODEL_CLASS_MAPPING];
21 | }


--------------------------------------------------------------------------------
/src/Models/Auto/AutoModelForImageFeatureExtraction.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Auto;
 7 | 
 8 | /**
 9 |  * Class-name lookup tables for AutoModelForImageFeatureExtraction.
10 |  */
11 | class AutoModelForImageFeatureExtraction extends PretrainedMixin
12 | {
13 |     /** String key => image feature extraction model class name. */
14 |     public const MODEL_CLASS_MAPPING = [
15 |         'clip' => \Codewithkyrian\Transformers\Models\Pretrained\CLIPVisionModelWithProjection::class,
16 |         'siglip' => \Codewithkyrian\Transformers\Models\Pretrained\SiglipVisionModel::class,
17 |     ];
18 | 
19 |     /**
20 |      * This class's own table first, then AutoModel's encoder-only and
21 |      * decoder-only tables, in that order.
22 |      */
23 |     public const MODEL_CLASS_MAPPINGS = [
24 |         self::MODEL_CLASS_MAPPING,
25 |         AutoModel::ENCODER_ONLY_MODEL_MAPPING,
26 |         AutoModel::DECODER_ONLY_MODEL_MAPPING,
27 |     ];
28 | }


--------------------------------------------------------------------------------
/src/Models/Auto/AutoModelForImageToImage.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Auto;
 7 | 
 8 | /**
 9 |  * Class-name lookup tables for AutoModelForImageToImage.
10 |  */
11 | class AutoModelForImageToImage extends PretrainedMixin
12 | {
13 |     /** String key => image-to-image model class name. */
14 |     public const MODEL_CLASS_MAPPING = [
15 |         'swin2sr' => \Codewithkyrian\Transformers\Models\Pretrained\Swin2SRForImageSuperResolution::class,
16 |     ];
17 | 
18 |     /** Every mapping table of this class, in listed order. */
19 |     public const MODEL_CLASS_MAPPINGS = [self::MODEL_CLASS_MAPPING];
20 | }


--------------------------------------------------------------------------------
/src/Models/Auto/AutoModelForMaskedLM.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Auto;
 7 | 
 8 | /**
 9 |  * Class-name lookup tables for AutoModelForMaskedLM.
10 |  */
11 | class AutoModelForMaskedLM extends PretrainedMixin
12 | {
13 |     /** String key => masked language model class name. */
14 |     public const MODEL_CLASS_MAPPING = [
15 |         'albert' => \Codewithkyrian\Transformers\Models\Pretrained\AlbertForMaskedLM::class,
16 |         'bert' => \Codewithkyrian\Transformers\Models\Pretrained\BertForMaskedLM::class,
17 |         'deberta' => \Codewithkyrian\Transformers\Models\Pretrained\DebertaForMaskedLM::class,
18 |         'deberta-v2' => \Codewithkyrian\Transformers\Models\Pretrained\DebertaV2ForMaskedLM::class,
19 |         'distilbert' => \Codewithkyrian\Transformers\Models\Pretrained\DistilBertForMaskedLM::class,
20 |         'mobilebert' => \Codewithkyrian\Transformers\Models\Pretrained\MobileBertForMaskedLM::class,
21 |         'roberta' => \Codewithkyrian\Transformers\Models\Pretrained\RobertaForMaskedLM::class,
22 |         'roformer' => \Codewithkyrian\Transformers\Models\Pretrained\RoFormerForMaskedLM::class,
23 |     ];
24 | 
25 |     /** Every mapping table of this class, in listed order. */
26 |     public const MODEL_CLASS_MAPPINGS = [self::MODEL_CLASS_MAPPING];
27 | }


--------------------------------------------------------------------------------
/src/Models/Auto/AutoModelForObjectDetection.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Auto;
 7 | 
 8 | /**
 9 |  * Class-name lookup tables for AutoModelForObjectDetection.
10 |  */
11 | class AutoModelForObjectDetection extends PretrainedMixin
12 | {
13 |     /** String key => object detection model class name. */
14 |     public const MODEL_CLASS_MAPPING = [
15 |         'detr' => \Codewithkyrian\Transformers\Models\Pretrained\DetrForObjectDetection::class,
16 |         'yolos' => \Codewithkyrian\Transformers\Models\Pretrained\YolosForObjectDetection::class,
17 |     ];
18 | 
19 |     /** Every mapping table of this class, in listed order. */
20 |     public const MODEL_CLASS_MAPPINGS = [self::MODEL_CLASS_MAPPING];
21 | }


--------------------------------------------------------------------------------
/src/Models/Auto/AutoModelForQuestionAnswering.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Auto;
 7 | 
 8 | /**
 9 |  * Class-name lookup tables for AutoModelForQuestionAnswering.
10 |  */
11 | class AutoModelForQuestionAnswering extends PretrainedMixin
12 | {
13 |     /** String key => question answering model class name. */
14 |     public const MODEL_CLASS_MAPPING = [
15 |         'albert' => \Codewithkyrian\Transformers\Models\Pretrained\AlbertForQuestionAnswering::class,
16 |         'bert' => \Codewithkyrian\Transformers\Models\Pretrained\BertForQuestionAnswering::class,
17 |         'deberta' => \Codewithkyrian\Transformers\Models\Pretrained\DebertaForQuestionAnswering::class,
18 |         'deberta-v2' => \Codewithkyrian\Transformers\Models\Pretrained\DebertaV2ForQuestionAnswering::class,
19 |         'distilbert' => \Codewithkyrian\Transformers\Models\Pretrained\DistilBertForQuestionAnswering::class,
20 |         'mobilebert' => \Codewithkyrian\Transformers\Models\Pretrained\MobileBertForQuestionAnswering::class,
21 |         'roberta' => \Codewithkyrian\Transformers\Models\Pretrained\RobertaForQuestionAnswering::class,
22 |         'roformer' => \Codewithkyrian\Transformers\Models\Pretrained\RoFormerForQuestionAnswering::class,
23 |     ];
24 | 
25 |     /** Every mapping table of this class, in listed order. */
26 |     public const MODEL_CLASS_MAPPINGS = [self::MODEL_CLASS_MAPPING];
27 | }


--------------------------------------------------------------------------------
/src/Models/Auto/AutoModelForSeq2SeqLM.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\Models\Auto;
 6 | 
 7 | /**
 8 |  * Class-name lookup tables for AutoModelForSeq2SeqLM.
 9 |  */
10 | class AutoModelForSeq2SeqLM extends PretrainedMixin
11 | {
12 |     /** String key => sequence-to-sequence language model class name. */
13 |     public const MODEL_CLASS_MAPPING = [
14 |         'bart' => \Codewithkyrian\Transformers\Models\Pretrained\BartForConditionalGeneration::class,
15 |         't5' => \Codewithkyrian\Transformers\Models\Pretrained\T5ForConditionalGeneration::class,
16 |         'm2m_100' => \Codewithkyrian\Transformers\Models\Pretrained\M2M100ForConditionalGeneration::class,
17 |     ];
18 | 
19 |     /** Every mapping table of this class, in listed order. */
20 |     public const MODEL_CLASS_MAPPINGS = [self::MODEL_CLASS_MAPPING];
21 | }


--------------------------------------------------------------------------------
/src/Models/Auto/AutoModelForSequenceClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Auto;
 7 | 
 8 | 
 9 | /**
10 |  * Class-name lookup tables for AutoModelForSequenceClassification.
11 |  */
12 | class AutoModelForSequenceClassification extends PretrainedMixin
13 | {
14 |     /** String key => sequence classification model class name. */
15 |     public const MODEL_CLASS_MAPPING = [
16 |         'albert' => \Codewithkyrian\Transformers\Models\Pretrained\AlbertForSequenceClassification::class,
17 |         'bert' => \Codewithkyrian\Transformers\Models\Pretrained\BertForSequenceClassification::class,
18 |         'bart' => \Codewithkyrian\Transformers\Models\Pretrained\BartForSequenceClassification::class,
19 |         'deberta' => \Codewithkyrian\Transformers\Models\Pretrained\DebertaForSequenceClassification::class,
20 |         'deberta-v2' => \Codewithkyrian\Transformers\Models\Pretrained\DebertaV2ForSequenceClassification::class,
21 |         'distilbert' => \Codewithkyrian\Transformers\Models\Pretrained\DistilBertForSequenceClassification::class,
22 |         'mobilebert' => \Codewithkyrian\Transformers\Models\Pretrained\MobileBertForSequenceClassification::class,
23 |         'roberta' => \Codewithkyrian\Transformers\Models\Pretrained\RobertaForSequenceClassification::class,
24 |         'roformer' => \Codewithkyrian\Transformers\Models\Pretrained\RoFormerForSequenceClassification::class,
25 |     ];
26 | 
27 |     /** Every mapping table of this class, in listed order. */
28 |     public const MODEL_CLASS_MAPPINGS = [self::MODEL_CLASS_MAPPING];
29 | }


--------------------------------------------------------------------------------
/src/Models/Auto/AutoModelForSpeechSeq2Seq.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Auto;
 7 | 
 8 | /**
 9 |  * Class-name lookup tables for AutoModelForSpeechSeq2Seq.
10 |  */
11 | class AutoModelForSpeechSeq2Seq extends PretrainedMixin
12 | {
13 |     /** String key => speech sequence-to-sequence model class name. */
14 |     public const MODEL_CLASS_MAPPING = [
15 |         'whisper' => \Codewithkyrian\Transformers\Models\Pretrained\WhisperForConditionalGeneration::class,
16 |     ];
17 | 
18 |     /** Every mapping table of this class, in listed order. */
19 |     public const MODEL_CLASS_MAPPINGS = [self::MODEL_CLASS_MAPPING];
20 | }


--------------------------------------------------------------------------------
/src/Models/Auto/AutoModelForTokenClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Auto;
 7 | 
 8 | /**
 9 |  * Class-name lookup tables for AutoModelForTokenClassification.
10 |  */
11 | class AutoModelForTokenClassification extends PretrainedMixin
12 | {
13 |     /** String key => token classification model class name. */
14 |     public const MODEL_CLASS_MAPPING = [
15 |         'bert' => \Codewithkyrian\Transformers\Models\Pretrained\BertForTokenClassification::class,
16 |         'deberta' => \Codewithkyrian\Transformers\Models\Pretrained\DebertaForTokenClassification::class,
17 |         'deberta-v2' => \Codewithkyrian\Transformers\Models\Pretrained\DebertaV2ForTokenClassification::class,
18 |         'roberta' => \Codewithkyrian\Transformers\Models\Pretrained\RobertaForTokenClassification::class,
19 |         'roformer' => \Codewithkyrian\Transformers\Models\Pretrained\RoFormerForTokenClassification::class,
20 |     ];
21 | 
22 |     /** Every mapping table of this class, in listed order. */
23 |     public const MODEL_CLASS_MAPPINGS = [self::MODEL_CLASS_MAPPING];
24 | }


--------------------------------------------------------------------------------
/src/Models/Auto/AutoModelForVision2Seq.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Auto;
 7 | 
 8 | /**
 9 |  * Class-name lookup tables for AutoModelForVision2Seq.
10 |  */
11 | class AutoModelForVision2Seq extends PretrainedMixin
12 | {
13 |     /** String key => vision-to-sequence model class name. */
14 |     public const MODEL_CLASS_MAPPING = [
15 |         'vision-encoder-decoder' => \Codewithkyrian\Transformers\Models\Pretrained\VisionEncoderDecoderModel::class,
16 |     ];
17 | 
18 |     /** Every mapping table of this class, in listed order. */
19 |     public const MODEL_CLASS_MAPPINGS = [self::MODEL_CLASS_MAPPING];
20 | }


--------------------------------------------------------------------------------
/src/Models/Auto/AutoModelForZeroShotObjectDetection.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Auto;
 7 | 
 8 | /**
 9 |  * Class-name lookup tables for AutoModelForZeroShotObjectDetection.
10 |  */
11 | class AutoModelForZeroShotObjectDetection extends PretrainedMixin
12 | {
13 |     /** String key => zero-shot object detection model class name. */
14 |     public const MODEL_CLASS_MAPPING = [
15 |         'owlvit' => \Codewithkyrian\Transformers\Models\Pretrained\OwlViTForObjectDetection::class,
16 |         'owlv2' => \Codewithkyrian\Transformers\Models\Pretrained\Owlv2ForObjectDetection::class,
17 |     ];
18 | 
19 |     /** Every mapping table of this class, in listed order. */
20 |     public const MODEL_CLASS_MAPPINGS = [self::MODEL_CLASS_MAPPING];
21 | }


--------------------------------------------------------------------------------
/src/Models/Output/BaseModelOutput.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Output;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | 
10 | /**
11 |  * Model output holding the last hidden state plus optional hidden states and attentions.
12 |  */
13 | class BaseModelOutput implements ModelOutput
14 | {
15 |     /**
16 |      * @param Tensor $lastHiddenState Sequence of hidden-states at the output of the last layer of the model.
17 |      * @param Tensor|null $hiddenStates Hidden-states of the model at the output of each layer plus the optional initial embedding outputs.
18 |      * @param Tensor|null $attentions Attention weights after the attention softmax, used to compute the weighted average in the self-attention heads.
19 |      */
20 |     public function __construct(
21 |         public readonly Tensor $lastHiddenState,
22 |         public readonly ?Tensor $hiddenStates = null,
23 |         public readonly ?Tensor $attentions = null,
24 |     ) {
25 |     }
26 | 
27 |     /**
28 |      * Build an instance from a raw output array.
29 |      *
30 |      * 'last_hidden_state' is passed through as-is; 'hidden_states' and 'attentions'
31 |      * go through Tensor::fromArray() when set and non-null, and become null otherwise.
32 |      *
33 |      * @param array $array Raw output keyed by 'last_hidden_state', 'hidden_states' and 'attentions'.
34 |      */
35 |     public static function fromOutput(array $array): self
36 |     {
37 |         $optionalTensor = static fn (string $key) => isset($array[$key])
38 |             ? Tensor::fromArray($array[$key])
39 |             : null;
40 | 
41 |         return new self(
42 |             lastHiddenState: $array['last_hidden_state'],
43 |             hiddenStates: $optionalTensor('hidden_states'),
44 |             attentions: $optionalTensor('attentions'),
45 |         );
46 |     }
47 | }


--------------------------------------------------------------------------------
/src/Models/Output/CasualLMOutput.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Output;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | 
10 | /**
11 |  * Model output carrying a single logits tensor.
12 |  *
13 |  * NOTE(review): the name reads "Casual"; "Causal" was presumably intended, but
14 |  * renaming would break existing references.
15 |  */
16 | class CasualLMOutput implements ModelOutput
17 | {
18 |     /**
19 |      * @param Tensor $logits
20 |      */
21 |     public function __construct(
22 |         public readonly Tensor $logits,
23 |     ) {
24 |     }
25 | 
26 |     /**
27 |      * Build an instance from the 'logits' entry of a raw output array.
28 |      */
29 |     public static function fromOutput(array $array): self
30 |     {
31 |         return new self(logits: $array['logits']);
32 |     }
33 | }


--------------------------------------------------------------------------------
/src/Models/Output/DetrSegmentationOutput.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Output;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | 
10 | /**
11 |  * Model output carrying logits, predicted boxes and predicted masks.
12 |  */
13 | class DetrSegmentationOutput implements ModelOutput
14 | {
15 |     /**
16 |      * These values are normalized in [0, 1], relative to the size of each individual image in the batch (disregarding possible padding).
17 |      *
18 |      * @param Tensor $logits Classification logits (including no-object) for all queries.
19 |      * @param Tensor $predBoxes Normalized boxes coordinates for all queries, represented as (center_x, center_y, width, height).
20 |      * @param Tensor $predMasks Segmentation masks for all queries.
21 |      */
22 |     public function __construct(
23 |         public readonly Tensor $logits,
24 |         public readonly Tensor $predBoxes,
25 |         public readonly Tensor $predMasks,
26 |     ) {
27 |     }
28 | 
29 |     /**
30 |      * Build an instance from the 'logits', 'pred_boxes' and 'pred_masks' entries of a raw output array.
31 |      */
32 |     public static function fromOutput(array $array): self
33 |     {
34 |         return new self(
35 |             logits: $array['logits'],
36 |             predBoxes: $array['pred_boxes'],
37 |             predMasks: $array['pred_masks'],
38 |         );
39 |     }
40 | }


--------------------------------------------------------------------------------
/src/Models/Output/MaskedLMOutput.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Output;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | 
10 | /**
11 |  * Model output carrying a single logits tensor.
12 |  */
13 | class MaskedLMOutput implements ModelOutput
14 | {
15 |     /**
16 |      * @param Tensor $logits
17 |      */
18 |     public function __construct(
19 |         public readonly Tensor $logits,
20 |     ) {
21 |     }
22 | 
23 |     /**
24 |      * Build an instance from the 'logits' entry of a raw output array.
25 |      */
26 |     public static function fromOutput(array $array): self
27 |     {
28 |         return new self(logits: $array['logits']);
29 |     }
30 | }


--------------------------------------------------------------------------------
/src/Models/Output/ModelOutput.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Output;
 7 | 
 8 | /**
 9 |  * Marker interface for model output classes; it declares no methods or constants.
10 |  */
11 | interface ModelOutput {}


--------------------------------------------------------------------------------
/src/Models/Output/ObjectDetectionOutput.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Output;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | 
10 | /**
11 |  * Model output carrying logits and predicted boxes.
12 |  */
13 | class ObjectDetectionOutput implements ModelOutput
14 | {
15 |     /**
16 |      * These values are normalized in [0, 1], relative to the size of each individual image in the batch (disregarding possible padding).
17 |      *
18 |      * @param Tensor $logits Classification logits (including no-object) for all queries.
19 |      * @param Tensor $predBoxes Normalized boxes coordinates for all queries, represented as (center_x, center_y, width, height).
20 |      */
21 |     public function __construct(
22 |         public readonly Tensor $logits,
23 |         public readonly Tensor $predBoxes,
24 |     ) {
25 |     }
26 | 
27 |     /**
28 |      * Build an instance from the 'logits' and 'pred_boxes' entries of a raw output array.
29 |      */
30 |     public static function fromOutput(array $array): self
31 |     {
32 |         return new self(
33 |             logits: $array['logits'],
34 |             predBoxes: $array['pred_boxes'],
35 |         );
36 |     }
37 | }


--------------------------------------------------------------------------------
/src/Models/Output/QuestionAnsweringModelOutput.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Output;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | 
10 | /**
11 |  * Output of question answering models: one tensor of start logits and one of end logits.
12 |  */
13 | class QuestionAnsweringModelOutput implements ModelOutput
14 | {
15 |     /**
16 |      * @param Tensor $startLogits
17 |      * @param Tensor $endLogits
18 |      */
19 |     public function __construct(
20 |         public readonly Tensor $startLogits,
21 |         public readonly Tensor $endLogits,
22 |     ) {
23 |     }
24 | 
25 |     /**
26 |      * Build an instance from the 'start_logits' and 'end_logits' entries of a raw output array.
27 |      */
28 |     public static function fromOutput(array $array): self
29 |     {
30 |         return new self(
31 |             startLogits: $array['start_logits'],
32 |             endLogits: $array['end_logits'],
33 |         );
34 |     }
35 | }


--------------------------------------------------------------------------------
/src/Models/Output/SequenceClassifierOutput.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Output;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | 
10 | /**
11 |  * Model output carrying a single logits tensor.
12 |  */
13 | class SequenceClassifierOutput implements ModelOutput
14 | {
15 |     /**
16 |      * @param Tensor $logits
17 |      */
18 |     public function __construct(
19 |         public readonly Tensor $logits,
20 |     ) {
21 |     }
22 | 
23 |     /**
24 |      * Build an instance from the 'logits' entry of a raw output array.
25 |      */
26 |     public static function fromOutput(array $array): self
27 |     {
28 |         return new self(logits: $array['logits']);
29 |     }
30 | }


--------------------------------------------------------------------------------
/src/Models/Output/TokenClassifierOutput.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Output;
 7 | 
 8 | use Codewithkyrian\Transformers\Tensor\Tensor;
 9 | 
10 | /**
11 |  * Output of token classification models: a single logits tensor.
12 |  */
13 | class TokenClassifierOutput implements ModelOutput
14 | {
15 |     /**
16 |      * @param Tensor $logits
17 |      */
18 |     public function __construct(
19 |         public readonly Tensor $logits,
20 |     ) {
21 |     }
22 | 
23 |     /**
24 |      * Build an instance from the 'logits' entry of a raw output array.
25 |      */
26 |     public static function fromOutput(array $array): self
27 |     {
28 |         return new self(logits: $array['logits']);
29 |     }
30 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/ASTForAudioClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * ASTPretrainedModel subclass that declares no members of its own.
10 |  */
11 | class ASTForAudioClassification extends ASTPretrainedModel {}


--------------------------------------------------------------------------------
/src/Models/Pretrained/ASTModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * ASTPretrainedModel subclass that declares no members of its own.
10 |  */
11 | class ASTModel extends ASTPretrainedModel {}


--------------------------------------------------------------------------------
/src/Models/Pretrained/ASTPretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * Base class for Audio Spectrogram Transformer (AST) models.
10 |  *
11 |  * Extends PretrainedModel and declares no members of its own.
12 |  */
13 | class ASTPretrainedModel extends PretrainedModel {}


--------------------------------------------------------------------------------
/src/Models/Pretrained/AlbertForMaskedLM.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 6 | 
 7 | use Codewithkyrian\Transformers\Models\Output\MaskedLMOutput;
 8 | 
 9 | /**
10 |  * Albert model for masked language modeling.
11 |  *
12 |  * NOTE(review): extends BertPretrainedModel although an AlbertPretrainedModel
13 |  * class exists — confirm this is intended.
14 |  */
15 | class AlbertForMaskedLM extends BertPretrainedModel
16 | {
17 |     /**
18 |      * Run the parent __invoke() and wrap its result.
19 |      *
20 |      * @param array $modelInputs Inputs forwarded unchanged to the parent.
21 |      * @return MaskedLMOutput Built from the parent's result via MaskedLMOutput::fromOutput().
22 |      */
23 |     public function __invoke(array $modelInputs): MaskedLMOutput
24 |     {
25 |         $rawOutput = parent::__invoke($modelInputs);
26 | 
27 |         return MaskedLMOutput::fromOutput($rawOutput);
28 |     }
29 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/AlbertForQuestionAnswering.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\SequenceClassifierOutput;
 9 | 
10 | /**
11 |  * Albert model for question answering.
12 |  *
13 |  * NOTE(review): extends BertPretrainedModel although an AlbertPretrainedModel
14 |  * class exists — confirm this is intended.
15 |  */
16 | class AlbertForQuestionAnswering extends BertPretrainedModel
17 | {
18 |     /**
19 |      * Run the parent __invoke() and wrap its result.
20 |      *
21 |      * @param array $modelInputs Inputs forwarded unchanged to the parent.
22 |      * @return \Codewithkyrian\Transformers\Models\Output\QuestionAnsweringModelOutput
23 |      *         Built from the 'start_logits' and 'end_logits' entries of the parent's result.
24 |      */
25 |     public function __invoke(array $modelInputs): \Codewithkyrian\Transformers\Models\Output\QuestionAnsweringModelOutput
26 |     {
27 |         // SequenceClassifierOutput reads a single 'logits' entry; question answering
28 |         // needs the start/end pair that QuestionAnsweringModelOutput reads.
29 |         $rawOutput = parent::__invoke($modelInputs);
30 | 
31 |         return \Codewithkyrian\Transformers\Models\Output\QuestionAnsweringModelOutput::fromOutput($rawOutput);
32 |     }
33 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/AlbertForSequenceClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\SequenceClassifierOutput;
 9 | 
10 | /**
11 |  * Albert model for sequence classification.
12 |  *
13 |  * NOTE(review): extends BertPretrainedModel although an AlbertPretrainedModel
14 |  * class exists — confirm this is intended.
15 |  */
16 | class AlbertForSequenceClassification extends BertPretrainedModel
17 | {
18 |     /**
19 |      * Run the parent __invoke() and wrap its result.
20 |      *
21 |      * @param array $modelInputs Inputs forwarded unchanged to the parent.
22 |      * @return SequenceClassifierOutput Built from the parent's result via SequenceClassifierOutput::fromOutput().
23 |      */
24 |     public function __invoke(array $modelInputs): SequenceClassifierOutput
25 |     {
26 |         $rawOutput = parent::__invoke($modelInputs);
27 | 
28 |         return SequenceClassifierOutput::fromOutput($rawOutput);
29 |     }
30 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/AlbertModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * AlbertPretrainedModel subclass that declares no members of its own.
10 |  */
11 | class AlbertModel extends AlbertPretrainedModel {}


--------------------------------------------------------------------------------
/src/Models/Pretrained/AlbertPretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * PretrainedModel subclass for Albert models; declares no members of its own.
10 |  */
11 | class AlbertPretrainedModel extends PretrainedModel {}


--------------------------------------------------------------------------------
/src/Models/Pretrained/BartForConditionalGeneration.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\ModelArchitecture;
 9 | use Codewithkyrian\Transformers\Utils\AutoConfig;
10 | use Codewithkyrian\Transformers\Utils\GenerationConfig;
11 | use Codewithkyrian\Transformers\Utils\InferenceSession;
12 | 
13 | /**
14 |  * The BART Model with a language modeling head. Can be used for summarization.
15 |  */
16 | class BartForConditionalGeneration extends BartPretrainedModel
17 | {
18 |     /** Config value 'decoder_layers'. */
19 |     public mixed $numDecoderLayers;
20 |     /** Config value 'decoder_attention_heads'. */
21 |     public mixed $numDecoderHeads;
22 |     /** Config value 'd_model' divided by $numDecoderHeads. */
23 |     public mixed $decoderDimKv;
24 |     /** Config value 'encoder_layers'. */
25 |     public mixed $numEncoderLayers;
26 |     /** Config value 'encoder_attention_heads'. */
27 |     public mixed $numEncoderHeads;
28 |     /** Config value 'd_model' divided by $numEncoderHeads. */
29 |     public mixed $encoderDimKv;
30 | 
31 |     /**
32 |      * Hand config, session and architecture to the parent, then read the
33 |      * encoder/decoder layer counts, head counts and per-head sizes from the config.
34 |      *
35 |      * @param AutoConfig $config Passed to the parent constructor.
36 |      * @param InferenceSession $session Passed to the parent constructor.
37 |      * @param InferenceSession $decoderMergedSession Stored as a public property.
38 |      * @param ModelArchitecture $modelArchitecture Stored as a public property and passed to the parent constructor.
39 |      * @param GenerationConfig $generationConfig Stored as a public property.
40 |      */
41 |     public function __construct(
42 |         AutoConfig $config,
43 |         InferenceSession $session,
44 |         public InferenceSession $decoderMergedSession,
45 |         public ModelArchitecture $modelArchitecture,
46 |         public GenerationConfig $generationConfig,
47 |     ) {
48 |         // $this->config is only read after the parent constructor has run.
49 |         parent::__construct($config, $session, $modelArchitecture);
50 | 
51 |         $this->numEncoderLayers = $this->config['encoder_layers'];
52 |         $this->numEncoderHeads = $this->config['encoder_attention_heads'];
53 |         $this->encoderDimKv = $this->config['d_model'] / $this->numEncoderHeads;
54 | 
55 |         $this->numDecoderLayers = $this->config['decoder_layers'];
56 |         $this->numDecoderHeads = $this->config['decoder_attention_heads'];
57 |         $this->decoderDimKv = $this->config['d_model'] / $this->numDecoderHeads;
58 |     }
59 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/BartForSequenceClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\ModelOutput;
 9 | use Codewithkyrian\Transformers\Models\Output\SequenceClassifierOutput;
10 | 
/**
 * BART model with a sequence classification head on top
 * (a linear layer on top of the pooled output).
 */
class BartForSequenceClassification extends BartPretrainedModel
{
    /**
     * Runs the inherited __invoke() and wraps its result in a SequenceClassifierOutput.
     *
     * @param array $modelInputs Inputs passed through unchanged to the parent.
     *
     * @return SequenceClassifierOutput Built via SequenceClassifierOutput::fromOutput().
     */
    public function __invoke(array $modelInputs): SequenceClassifierOutput
    {
        $parentOutput = parent::__invoke($modelInputs);

        return SequenceClassifierOutput::fromOutput($parentOutput);
    }
}


--------------------------------------------------------------------------------
/src/Models/Pretrained/BartModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | class BartModel extends BartPretrainedModel
 9 | {
10 | 
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/BartPretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | class BartPretrainedModel extends PretrainedModel
 9 | {
10 | 
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/BertForMaskedLM.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 6 | 
 7 | use Codewithkyrian\Transformers\Models\Output\MaskedLMOutput;
 8 | 
 9 | /**
10 |  * BertForMaskedLM class for performing masked language modeling on BERT models.
11 |  */
12 | class BertForMaskedLM extends BertPretrainedModel
13 | {
14 |     public function __invoke(array $modelInputs): MaskedLMOutput
15 |     {
16 |         return MaskedLMOutput::fromOutput(parent::__invoke($modelInputs));
17 |     }
18 | 
19 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/BertForQuestionAnswering.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\QuestionAnsweringModelOutput;
 9 | 
/**
 * BERT model used for question answering.
 */
class BertForQuestionAnswering extends BertPretrainedModel
{
    /**
     * Runs the inherited __invoke() and wraps its result in a QuestionAnsweringModelOutput.
     *
     * @param array $modelInputs Inputs passed through unchanged to the parent.
     *
     * @return QuestionAnsweringModelOutput Built via QuestionAnsweringModelOutput::fromOutput().
     */
    public function __invoke(array $modelInputs): QuestionAnsweringModelOutput
    {
        $parentOutput = parent::__invoke($modelInputs);

        return QuestionAnsweringModelOutput::fromOutput($parentOutput);
    }
}


--------------------------------------------------------------------------------
/src/Models/Pretrained/BertForSequenceClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\SequenceClassifierOutput;
 9 | 
/**
 * BERT model used for sequence classification.
 */
class BertForSequenceClassification extends BertPretrainedModel
{
    /**
     * Runs the inherited __invoke() and wraps its result in a SequenceClassifierOutput.
     *
     * @param array $modelInputs Inputs passed through unchanged to the parent.
     *
     * @return SequenceClassifierOutput Built via SequenceClassifierOutput::fromOutput().
     */
    public function __invoke(array $modelInputs): SequenceClassifierOutput
    {
        $parentOutput = parent::__invoke($modelInputs);

        return SequenceClassifierOutput::fromOutput($parentOutput);
    }
}


--------------------------------------------------------------------------------
/src/Models/Pretrained/BertForTokenClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\TokenClassifierOutput;
 9 | 
/**
 * BERT model used for token classification.
 */
class BertForTokenClassification extends BertPretrainedModel
{
    /**
     * Runs the inherited __invoke() and wraps its result in a TokenClassifierOutput.
     *
     * @param array $modelInputs Inputs passed through unchanged to the parent.
     *
     * @return TokenClassifierOutput Built via TokenClassifierOutput::fromOutput().
     */
    public function __invoke(array $modelInputs): TokenClassifierOutput
    {
        $parentOutput = parent::__invoke($modelInputs);

        return TokenClassifierOutput::fromOutput($parentOutput);
    }
}


--------------------------------------------------------------------------------
/src/Models/Pretrained/BertModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | class BertModel extends BertPretrainedModel
 9 | {
10 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/BertPretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | class BertPretrainedModel extends PretrainedModel
 9 | {
10 | 
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/CLIPModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * CLIP Text and Vision Model with a projection layers on top
10 |  */
11 | class CLIPModel extends CLIPPretrainedModel
12 | {
13 | 
14 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/CLIPPretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | 
 9 | class CLIPPretrainedModel extends PretrainedModel
10 | {
11 | 
12 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/CLIPVisionModelWithProjection.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\ModelArchitecture;
 9 | use Codewithkyrian\Transformers\Utils\AutoConfig;
10 | 
/**
 * CLIP Vision Model with a projection layer on top (a linear layer on top of the pooled output)
 *
 * Particularly useful for image feature extraction tasks.
 */
class CLIPVisionModelWithProjection extends CLIPPretrainedModel
{
    /**
     * Loads the model, defaulting the model file name to 'vision_model'.
     *
     * Every argument is forwarded positionally to the parent fromPretrained();
     * the only difference is that a null $modelFilename is replaced with
     * 'vision_model' first.
     *
     * @param string                $modelNameOrPath   Forwarded to the parent loader.
     * @param bool                  $quantized         Forwarded to the parent loader.
     * @param AutoConfig|array|null $config            Forwarded to the parent loader; null is allowed.
     * @param string|null           $cacheDir          Forwarded to the parent loader.
     * @param string|null           $token             Forwarded to the parent loader.
     * @param string                $revision          Forwarded to the parent loader.
     * @param string|null           $modelFilename     Model file name; 'vision_model' when null.
     * @param ModelArchitecture     $modelArchitecture Forwarded to the parent loader.
     * @param callable|null         $onProgress        Forwarded to the parent loader.
     *
     * @return PretrainedModel Whatever the parent fromPretrained() returns.
     */
    public static function fromPretrained(
        string $modelNameOrPath,
        bool $quantized = true,
        // Explicitly nullable: relying on "= null" to make the type nullable is deprecated since PHP 8.4.
        AutoConfig|array|null $config = null,
        ?string $cacheDir = null,
        ?string $token = null,
        string $revision = 'main',
        ?string $modelFilename = null,
        ModelArchitecture $modelArchitecture = ModelArchitecture::EncoderOnly,
        ?callable $onProgress = null
    ): PretrainedModel
    {
        // Update default model file name if not provided
        $modelFilename ??= 'vision_model';

        return parent::fromPretrained(
            $modelNameOrPath,
            $quantized,
            $config,
            $cacheDir,
            $token,
            $revision,
            $modelFilename,
            $modelArchitecture,
            $onProgress
        );
    }
}


--------------------------------------------------------------------------------
/src/Models/Pretrained/CodeGenForCausalLM.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * CodeGenForCausalLM is a class that represents a code generation model based on the GPT-2 architecture. It extends the `CodeGenPreTrainedModel` class.
10 |  */
11 | class CodeGenForCausalLM extends CodeGenPretrainedModel
12 | {
13 | 
14 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/CodeGenModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * CodeGenModel is a class representing a code generation model without a language model head.
10 |  */
11 | class CodeGenModel extends CodeGenPretrainedModel
12 | {
13 | 
14 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/CodeGenPretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\ModelArchitecture;
 9 | use Codewithkyrian\Transformers\Utils\AutoConfig;
10 | use Codewithkyrian\Transformers\Utils\InferenceSession;
11 | 
/**
 * Common base for the CodeGen model classes.
 *
 * On construction it sets the padding token id to the EOS token id and caches
 * the head count, layer count and per-head dimension read from the configuration.
 */
class CodeGenPretrainedModel extends PretrainedModel
{
    protected int $numHeads;
    protected int $numLayers;
    protected int $dimKv;

    /**
     * @param AutoConfig        $config            Model configuration, forwarded to the parent constructor.
     * @param InferenceSession  $session           Inference session, forwarded to the parent constructor.
     * @param ModelArchitecture $modelArchitecture Forwarded to the parent constructor.
     * @param mixed             ...$args           Extra arguments, handed to the parent as one array.
     */
    public function __construct(
        AutoConfig        $config,
        InferenceSession  $session,
        ModelArchitecture $modelArchitecture = ModelArchitecture::EncoderOnly,
        ...$args
    ) {
        // NOTE(review): $args is passed as a single array argument, not unpacked with
        // the spread operator - confirm this is what the parent constructor expects.
        parent::__construct($config, $session, $modelArchitecture, $args);

        // The config carries no pad_token_id, so the EOS token id doubles as the padding id.
        $eosTokenId = $this->config['eos_token_id'];
        $this->config['pad_token_id'] = $eosTokenId;
        $this->config->padTokenId = $eosTokenId;

        $this->numHeads = $this->config['n_head'];
        $this->numLayers = $this->config['n_layer'];

        // Per-head dimension: the embedding size split across the attention heads.
        $this->dimKv = $this->config['n_embd'] / $this->numHeads;
    }
}


--------------------------------------------------------------------------------
/src/Models/Pretrained/DebertaForMaskedLM.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 6 | 
 7 | use Codewithkyrian\Transformers\Models\Output\MaskedLMOutput;
 8 | 
 9 | /**
10 |  * DebertaForMaskedLM class for performing masked language modeling on DeBERTa models.
11 |  */
12 | class DebertaForMaskedLM extends DebertaPretrainedModel
13 | {
14 |     public function __invoke(array $modelInputs): MaskedLMOutput
15 |     {
16 |         return MaskedLMOutput::fromOutput(parent::__invoke($modelInputs));
17 |     }
18 | 
19 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/DebertaForQuestionAnswering.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\QuestionAnsweringModelOutput;
 9 | 
/**
 * DeBERTa model with a span classification head on top for extractive
 * question-answering tasks like SQuAD (linear layers on top of the hidden-states
 * output that compute `span start logits` and `span end logits`).
 */
class DebertaForQuestionAnswering extends DebertaPretrainedModel
{
    /**
     * Runs the inherited __invoke() and wraps its result in a QuestionAnsweringModelOutput.
     *
     * @param array $modelInputs Inputs passed through unchanged to the parent.
     *
     * @return QuestionAnsweringModelOutput Built via QuestionAnsweringModelOutput::fromOutput().
     */
    public function __invoke(array $modelInputs): QuestionAnsweringModelOutput
    {
        $parentOutput = parent::__invoke($modelInputs);

        return QuestionAnsweringModelOutput::fromOutput($parentOutput);
    }
}


--------------------------------------------------------------------------------
/src/Models/Pretrained/DebertaForSequenceClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\SequenceClassifierOutput;
 9 | 
/**
 * DeBERTa model used for sequence classification.
 */
class DebertaForSequenceClassification extends DebertaPretrainedModel
{
    /**
     * Runs the inherited __invoke() and wraps its result in a SequenceClassifierOutput.
     *
     * @param array $modelInputs Inputs passed through unchanged to the parent.
     *
     * @return SequenceClassifierOutput Built via SequenceClassifierOutput::fromOutput().
     */
    public function __invoke(array $modelInputs): SequenceClassifierOutput
    {
        $parentOutput = parent::__invoke($modelInputs);

        return SequenceClassifierOutput::fromOutput($parentOutput);
    }
}


--------------------------------------------------------------------------------
/src/Models/Pretrained/DebertaForTokenClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\TokenClassifierOutput;
 9 | 
/**
 * DeBERTa model used for token classification.
 */
class DebertaForTokenClassification extends DebertaPretrainedModel
{
    /**
     * Runs the inherited __invoke() and wraps its result in a TokenClassifierOutput.
     *
     * @param array $modelInputs Inputs passed through unchanged to the parent.
     *
     * @return TokenClassifierOutput Built via TokenClassifierOutput::fromOutput().
     */
    public function __invoke(array $modelInputs): TokenClassifierOutput
    {
        $parentOutput = parent::__invoke($modelInputs);

        return TokenClassifierOutput::fromOutput($parentOutput);
    }
}


--------------------------------------------------------------------------------
/src/Models/Pretrained/DebertaModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * The bare DeBERTa Model transformer outputting raw hidden-states without any specific head on top.
10 |  */
11 | class DebertaModel extends DebertaPretrainedModel
12 | {
13 | 
14 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/DebertaPretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | class DebertaPretrainedModel extends PretrainedModel
 9 | {
10 | 
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/DebertaV2ForMaskedLM.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 6 | 
 7 | use Codewithkyrian\Transformers\Models\Output\MaskedLMOutput;
 8 | 
 9 | /**
10 |  * DeBERTa-V2 Model with a `language modeling` head on top.
11 |  */
12 | class DebertaV2ForMaskedLM extends DebertaV2PretrainedModel
13 | {
14 |     public function __invoke(array $modelInputs): MaskedLMOutput
15 |     {
16 |         return MaskedLMOutput::fromOutput(parent::__invoke($modelInputs));
17 |     }
18 | 
19 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/DebertaV2ForQuestionAnswering.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\QuestionAnsweringModelOutput;
 9 | 
/**
 * DeBERTa-V2 model with a span classification head on top for extractive
 * question-answering tasks like SQuAD (linear layers on top of the hidden-states
 * output that compute `span start logits` and `span end logits`).
 */
class DebertaV2ForQuestionAnswering extends DebertaV2PretrainedModel
{
    /**
     * Runs the inherited __invoke() and wraps its result in a QuestionAnsweringModelOutput.
     *
     * @param array $modelInputs Inputs passed through unchanged to the parent.
     *
     * @return QuestionAnsweringModelOutput Built via QuestionAnsweringModelOutput::fromOutput().
     */
    public function __invoke(array $modelInputs): QuestionAnsweringModelOutput
    {
        $parentOutput = parent::__invoke($modelInputs);

        return QuestionAnsweringModelOutput::fromOutput($parentOutput);
    }
}


--------------------------------------------------------------------------------
/src/Models/Pretrained/DebertaV2ForSequenceClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\SequenceClassifierOutput;
 9 | 
/**
 * DeBERTa-V2 model transformer with a sequence classification/regression head
 * on top (a linear layer on top of the pooled output).
 */
class DebertaV2ForSequenceClassification extends DebertaV2PretrainedModel
{
    /**
     * Runs the inherited __invoke() and wraps its result in a SequenceClassifierOutput.
     *
     * @param array $modelInputs Inputs passed through unchanged to the parent.
     *
     * @return SequenceClassifierOutput Built via SequenceClassifierOutput::fromOutput().
     */
    public function __invoke(array $modelInputs): SequenceClassifierOutput
    {
        $parentOutput = parent::__invoke($modelInputs);

        return SequenceClassifierOutput::fromOutput($parentOutput);
    }
}


--------------------------------------------------------------------------------
/src/Models/Pretrained/DebertaV2ForTokenClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\TokenClassifierOutput;
 9 | 
/**
 * DeBERTa-V2 model with a token classification head on top (a linear layer on top
 * of the hidden-states output), e.g. for Named-Entity-Recognition (NER) tasks.
 */
class DebertaV2ForTokenClassification extends DebertaV2PretrainedModel
{
    /**
     * Runs the inherited __invoke() and wraps its result in a TokenClassifierOutput.
     *
     * @param array $modelInputs Inputs passed through unchanged to the parent.
     *
     * @return TokenClassifierOutput Built via TokenClassifierOutput::fromOutput().
     */
    public function __invoke(array $modelInputs): TokenClassifierOutput
    {
        $parentOutput = parent::__invoke($modelInputs);

        return TokenClassifierOutput::fromOutput($parentOutput);
    }
}


--------------------------------------------------------------------------------
/src/Models/Pretrained/DebertaV2Model.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * The bare DeBERTa-V2 Model transformer outputting raw hidden-states without any specific head on top.
10 |  */
11 | class DebertaV2Model extends DebertaV2PretrainedModel
12 | {
13 | 
14 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/DebertaV2PretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | class DebertaV2PretrainedModel extends PretrainedModel
 9 | {
10 | 
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/DeiTForImageClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\SequenceClassifierOutput;
 9 | 
/**
 * DeiT image classification model class.
 *
 * Returns the parent's output wrapped in a SequenceClassifierOutput.
 */
class DeiTForImageClassification extends DeiTPretrainedModel
{
    /**
     * Runs the inherited __invoke() and wraps its result in a SequenceClassifierOutput.
     *
     * @param array $modelInputs Inputs passed through unchanged to the parent.
     *
     * @return SequenceClassifierOutput Built via SequenceClassifierOutput::fromOutput().
     */
    public function __invoke(array $modelInputs): SequenceClassifierOutput
    {
        $parentOutput = parent::__invoke($modelInputs);

        return SequenceClassifierOutput::fromOutput($parentOutput);
    }
}


--------------------------------------------------------------------------------
/src/Models/Pretrained/DeiTModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | class DeiTModel extends DeiTPretrainedModel
 9 | {
10 | 
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/DeiTPretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | class DeiTPretrainedModel extends PretrainedModel
 9 | {
10 | 
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/DetrForObjectDetection.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\ObjectDetectionOutput;
 9 | 
/**
 * DETR object detection model class.
 *
 * Returns the parent's output wrapped in an ObjectDetectionOutput.
 */
class DetrForObjectDetection extends DetrPretrainedModel
{
    /**
     * Runs the inherited __invoke() and wraps its result in an ObjectDetectionOutput.
     *
     * @param array $modelInputs Inputs passed through unchanged to the parent.
     *
     * @return ObjectDetectionOutput Built via ObjectDetectionOutput::fromOutput().
     */
    public function __invoke(array $modelInputs): ObjectDetectionOutput
    {
        $parentOutput = parent::__invoke($modelInputs);

        return ObjectDetectionOutput::fromOutput($parentOutput);
    }
}


--------------------------------------------------------------------------------
/src/Models/Pretrained/DetrForSegmentation.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\DetrSegmentationOutput;
 9 | 
/**
 * DETR segmentation model class.
 *
 * Returns the parent's output wrapped in a DetrSegmentationOutput.
 */
class DetrForSegmentation extends DetrPretrainedModel
{
    /**
     * Runs the inherited __invoke() and wraps its result in a DetrSegmentationOutput.
     *
     * @param array $modelInputs Inputs passed through unchanged to the parent.
     *
     * @return DetrSegmentationOutput Built via DetrSegmentationOutput::fromOutput().
     */
    public function __invoke(array $modelInputs): DetrSegmentationOutput
    {
        $parentOutput = parent::__invoke($modelInputs);

        return DetrSegmentationOutput::fromOutput($parentOutput);
    }
}


--------------------------------------------------------------------------------
/src/Models/Pretrained/DetrModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | class DetrModel extends DetrPretrainedModel
 9 | {
10 | 
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/DetrPretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | class DetrPretrainedModel extends PretrainedModel
 9 | {
10 | 
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/DistilBertForMaskedLM.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 6 | 
 7 | use Codewithkyrian\Transformers\Models\Output\MaskedLMOutput;
 8 | 
 9 | /**
10 |  * DistilBertForMaskedLM class for performing masked language modeling on DistilBERT models.
11 |  */
12 | class DistilBertForMaskedLM extends RobertaPretrainedModel
13 | {
14 |     public function __invoke(array $modelInputs): MaskedLMOutput
15 |     {
16 |         return MaskedLMOutput::fromOutput(parent::__invoke($modelInputs));
17 |     }
18 | 
19 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/DistilBertForQuestionAnswering.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\QuestionAnsweringModelOutput;
 9 | 
/**
 * DistilBERT model used for question answering.
 *
 * Built on BertPretrainedModel; there is no DistilBERT-specific base in use here.
 */
class DistilBertForQuestionAnswering extends BertPretrainedModel
{
    /**
     * Runs the inherited __invoke() and wraps its result in a QuestionAnsweringModelOutput.
     *
     * @param array $modelInputs Inputs passed through unchanged to the parent.
     *
     * @return QuestionAnsweringModelOutput Built via QuestionAnsweringModelOutput::fromOutput().
     */
    public function __invoke(array $modelInputs): QuestionAnsweringModelOutput
    {
        $parentOutput = parent::__invoke($modelInputs);

        return QuestionAnsweringModelOutput::fromOutput($parentOutput);
    }
}


--------------------------------------------------------------------------------
/src/Models/Pretrained/DistilBertForSequenceClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\ModelOutput;
 9 | use Codewithkyrian\Transformers\Models\Output\SequenceClassifierOutput;
10 | 
/**
 * DistilBERT model with a sequence classification head on top
 * (a linear layer on top of the pooled output).
 *
 * Built on BertPretrainedModel, the same base DistilBertForQuestionAnswering uses.
 * It previously extended BartPretrainedModel, which tied this encoder-only model
 * to the BART class hierarchy.
 */
class DistilBertForSequenceClassification extends BertPretrainedModel
{
    /**
     * Runs the inherited __invoke() and wraps its result in a SequenceClassifierOutput.
     *
     * @param array $modelInputs Inputs passed through unchanged to the parent.
     *
     * @return SequenceClassifierOutput Built via SequenceClassifierOutput::fromOutput().
     */
    public function __invoke(array $modelInputs): SequenceClassifierOutput
    {
        return SequenceClassifierOutput::fromOutput(parent::__invoke($modelInputs));
    }
}


--------------------------------------------------------------------------------
/src/Models/Pretrained/DistilBertModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | class DistilBertModel extends PretrainedModel
 9 | {
10 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/GPT2LMHeadModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | class GPT2LMHeadModel extends GPT2PretrainedModel
 9 | {
10 | 
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/GPT2Model.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | class GPT2Model extends GPT2PretrainedModel
 9 | {
10 | 
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/GPT2PretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\ModelArchitecture;
 9 | use Codewithkyrian\Transformers\Utils\AutoConfig;
10 | use Codewithkyrian\Transformers\Utils\GenerationConfig;
11 | use Codewithkyrian\Transformers\Utils\InferenceSession;
12 | 
/**
 * Common base for the GPT-2 model classes.
 *
 * On construction it sets the padding token id to the EOS token id and caches
 * the head count, layer count and per-head dimension read from the configuration.
 */
class GPT2PretrainedModel extends PretrainedModel
{
    public int $numHeads;
    public int $numLayers;
    public int $dimKv;

    /**
     * @param AutoConfig        $config            Model configuration, forwarded to the parent constructor.
     * @param InferenceSession  $session           Inference session, forwarded to the parent constructor.
     * @param ModelArchitecture $modelArchitecture Stored as a public property and forwarded to the parent constructor.
     * @param GenerationConfig  $generationConfig  Stored as a public property.
     */
    public function __construct(
        AutoConfig               $config,
        InferenceSession         $session,
        public ModelArchitecture $modelArchitecture,
        public GenerationConfig  $generationConfig,
    ) {
        parent::__construct($config, $session, $modelArchitecture);

        // The config carries no pad_token_id, so the EOS token id doubles as the padding id.
        $eosTokenId = $this->config['eos_token_id'];
        $this->config['pad_token_id'] = $eosTokenId;
        $this->config->padTokenId = $eosTokenId;

        $this->numHeads = $this->config['n_head'];
        $this->numLayers = $this->config['n_layer'];

        // Per-head dimension: the embedding size split across the attention heads.
        $this->dimKv = $this->config['n_embd'] / $this->numHeads;
    }
}


--------------------------------------------------------------------------------
/src/Models/Pretrained/GPTBigCodeForCausalLM.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | class GPTBigCodeForCausalLM extends GPTBigCodePretrainedModel
 9 | {
10 | 
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/GPTBigCodeModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | class GPTBigCodeModel extends GPTBigCodePretrainedModel
 9 | {
10 | 
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/GPTBigCodePretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\ModelArchitecture;
 9 | use Codewithkyrian\Transformers\Utils\AutoConfig;
10 | use Codewithkyrian\Transformers\Utils\GenerationConfig;
11 | use Codewithkyrian\Transformers\Utils\InferenceSession;
12 | 
/**
 * Common base for the GPTBigCode model classes.
 *
 * On construction it sets the padding token id to the EOS token id and caches
 * the head count, layer count and per-head dimension read from the configuration.
 */
class GPTBigCodePretrainedModel extends PretrainedModel
{
    protected int $numHeads;
    protected int $numLayers;
    protected int $dimKv;

    /**
     * @param AutoConfig        $config            Model configuration, forwarded to the parent constructor.
     * @param InferenceSession  $session           Inference session, forwarded to the parent constructor.
     * @param ModelArchitecture $modelArchitecture Stored as a public property and forwarded to the parent constructor.
     * @param GenerationConfig  $generationConfig  Stored as a public property.
     */
    public function __construct(
        AutoConfig               $config,
        InferenceSession         $session,
        public ModelArchitecture $modelArchitecture,
        public GenerationConfig  $generationConfig,
    ) {
        parent::__construct($config, $session, $modelArchitecture);

        // The config carries no pad_token_id, so the EOS token id doubles as the padding id.
        $eosTokenId = $this->config['eos_token_id'];
        $this->config['pad_token_id'] = $eosTokenId;
        $this->config->padTokenId = $eosTokenId;

        $this->numHeads = $this->config['n_head'];
        $this->numLayers = $this->config['n_layer'];

        // Per-head dimension: the embedding size split across the attention heads.
        $this->dimKv = $this->config['n_embd'] / $this->numHeads;
    }
}


--------------------------------------------------------------------------------
/src/Models/Pretrained/GPTJForCausalLM.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * Declares no members of its own; all behaviour is inherited from GPTJPretrainedModel.
10 |  */
11 | class GPTJForCausalLM extends GPTJPretrainedModel
12 | {
13 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/GPTJModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * Declares no members of its own; all behaviour is inherited from GPTJPretrainedModel.
10 |  */
11 | class GPTJModel extends GPTJPretrainedModel
12 | {
13 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/GPTJPretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\ModelArchitecture;
 9 | use Codewithkyrian\Transformers\Utils\AutoConfig;
10 | use Codewithkyrian\Transformers\Utils\InferenceSession;
11 | 
12 | /**
13 |  * Shared base for the GPT-J model classes.
14 |  *
15 |  * The constructor overwrites the config's padding token with its `eos_token_id`
16 |  * and caches `n_head`, `n_layer` and `n_embd / n_head` as typed properties.
17 |  */
18 | class GPTJPretrainedModel extends PretrainedModel
19 | {
20 |     protected int $numHeads;
21 |     protected int $numLayers;
22 |     protected int $dimKv;
23 | 
24 |     /**
25 |      * @param AutoConfig        $config            Configuration handed to the parent constructor.
26 |      * @param InferenceSession  $session           Session handed to the parent constructor.
27 |      * @param ModelArchitecture $modelArchitecture Architecture handed to the parent constructor.
28 |      * @param mixed             ...$args           Extra arguments forwarded one by one to the parent constructor.
29 |      */
30 |     public function __construct(
31 |         AutoConfig        $config,
32 |         InferenceSession  $session,
33 |         ModelArchitecture $modelArchitecture = ModelArchitecture::EncoderOnly,
34 |                           ...$args
35 |     )
36 |     {
37 |         // Spread the extra arguments so the parent receives them individually
38 |         // instead of as a single nested array.
39 |         parent::__construct($config, $session, $modelArchitecture, ...$args);
40 | 
41 |         // config doesn't contain pad_token_id, so we assume it is the eos_token_id
42 |         $this->config['pad_token_id'] = $this->config['eos_token_id'];
43 |         $this->config->padTokenId = $this->config['eos_token_id'];
44 | 
45 |         $this->numHeads = $this->config['n_head'];
46 |         $this->numLayers = $this->config['n_layer'];
47 |         $this->dimKv = $this->config['n_embd'] / $this->numHeads;
48 |     }
49 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/LlamaForCausalLM.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * Declares no members of its own; all behaviour is inherited from LlamaPretrainedModel.
10 |  */
11 | class LlamaForCausalLM extends LlamaPretrainedModel
12 | {
13 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/LlamaModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * The bare LLaMA Model outputting raw hidden-states without any specific head on top.
10 |  *
11 |  * Declares no members of its own; all behaviour is inherited from LlamaPretrainedModel.
12 |  */
13 | class LlamaModel extends LlamaPretrainedModel
14 | {
15 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/LlamaPretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\ModelArchitecture;
 9 | use Codewithkyrian\Transformers\Utils\AutoConfig;
10 | use Codewithkyrian\Transformers\Utils\GenerationConfig;
11 | use Codewithkyrian\Transformers\Utils\InferenceSession;
12 | 
13 | 
14 | /**
15 |  * Shared base for the LLaMA model classes.
16 |  *
17 |  * The constructor overwrites the config's padding token with its `eos_token_id`
18 |  * and caches the head count, layer count and per-head dimension read from the config.
19 |  */
20 | class LlamaPretrainedModel extends PretrainedModel
21 | {
22 |     protected int $numHeads;
23 |     protected int $numLayers;
24 |     protected int $dimKv;
25 | 
26 |     /**
27 |      * @param AutoConfig        $config            Configuration handed to the parent constructor.
28 |      * @param InferenceSession  $session           Session handed to the parent constructor.
29 |      * @param ModelArchitecture $modelArchitecture Promoted to a public property and handed to the parent.
30 |      * @param GenerationConfig  $generationConfig  Promoted to a public property.
31 |      */
32 |     public function __construct(
33 |         AutoConfig               $config,
34 |         InferenceSession         $session,
35 |         public ModelArchitecture $modelArchitecture,
36 |         public GenerationConfig  $generationConfig
37 |     )
38 |     {
39 |         parent::__construct($config, $session, $modelArchitecture);
40 | 
41 |         // The config is assumed to lack pad_token_id, so the EOS token id stands in for it.
42 |         $eosTokenId = $this->config['eos_token_id'];
43 |         $this->config['pad_token_id'] = $eosTokenId;
44 |         $this->config->padTokenId = $eosTokenId;
45 | 
46 |         // Prefer num_key_value_heads; fall back to num_attention_heads when it is not set.
47 |         $headCount = $this->config['num_key_value_heads'] ?? $this->config['num_attention_heads'];
48 |         $this->numHeads = $headCount;
49 |         $this->numLayers = $this->config['num_hidden_layers'];
50 | 
51 |         // The per-head dimension always divides by num_attention_heads, not by the value above.
52 |         $hiddenSize = $this->config['hidden_size'];
53 |         $this->dimKv = $hiddenSize / $this->config['num_attention_heads'];
54 |     }
55 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/M2M100ForConditionalGeneration.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\ModelArchitecture;
 9 | use Codewithkyrian\Transformers\Utils\AutoConfig;
10 | use Codewithkyrian\Transformers\Utils\GenerationConfig;
11 | use Codewithkyrian\Transformers\Utils\InferenceSession;
12 | 
13 | /**
14 |  * M2M100 model class that additionally holds a merged decoder session and a generation config.
15 |  *
16 |  * The constructor caches the encoder/decoder layer counts, head counts and
17 |  * `d_model / heads` values read from the config.
18 |  */
19 | class M2M100ForConditionalGeneration extends M2M100PretrainedModel
20 | {
21 |     protected mixed $numDecoderLayers;
22 |     protected mixed $numDecoderHeads;
23 |     protected mixed $decoderDimKv;
24 |     protected mixed $numEncoderLayers;
25 |     protected mixed $numEncoderHeads;
26 |     protected mixed $encoderDimKv;
27 | 
28 |     /**
29 |      * @param AutoConfig        $config               Configuration handed to the parent constructor.
30 |      * @param InferenceSession  $session              Session handed to the parent constructor.
31 |      * @param InferenceSession  $decoderMergedSession Promoted to a public property.
32 |      * @param ModelArchitecture $modelArchitecture    Promoted to a public property and handed to the parent.
33 |      * @param GenerationConfig  $generationConfig     Promoted to a public property.
34 |      */
35 |     public function __construct(
36 |         AutoConfig               $config,
37 |         InferenceSession         $session,
38 |         public InferenceSession  $decoderMergedSession,
39 |         public ModelArchitecture $modelArchitecture,
40 |         public GenerationConfig  $generationConfig
41 |     )
42 |     {
43 |         parent::__construct($config, $session, $modelArchitecture);
44 | 
45 |         // Decoder settings.
46 |         $this->numDecoderLayers = $this->config['decoder_layers'];
47 |         $this->numDecoderHeads = $this->config['decoder_attention_heads'];
48 |         $decoderModelSize = $this->config['d_model'];
49 |         $this->decoderDimKv = $decoderModelSize / $this->numDecoderHeads;
50 | 
51 |         // Encoder settings.
52 |         $this->numEncoderLayers = $this->config['encoder_layers'];
53 |         $this->numEncoderHeads = $this->config['encoder_attention_heads'];
54 |         $encoderModelSize = $this->config['d_model'];
55 |         $this->encoderDimKv = $encoderModelSize / $this->numEncoderHeads;
56 |     }
57 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/M2M100Model.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * Declares no members of its own; all behaviour is inherited from M2M100PretrainedModel.
10 |  */
11 | class M2M100Model extends M2M100PretrainedModel
12 | {
13 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/M2M100PretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * Common parent of the M2M100 model classes; adds nothing on top of PretrainedModel.
10 |  */
11 | class M2M100PretrainedModel extends PretrainedModel
12 | {
13 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/MobileBertForMaskedLM.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 6 | 
 7 | use Codewithkyrian\Transformers\Models\Output\MaskedLMOutput;
 8 | 
 9 | /**
10 |  * MobileBertForMaskedLM is a class representing a MobileBERT model for the masking task.
11 |  */
12 | class MobileBertForMaskedLM extends MobileBertPretrainedModel
13 | {
14 |     /**
15 |      * Invokes the parent model and converts what it returns into a MaskedLMOutput.
16 |      *
17 |      * @param array $modelInputs Inputs handed unchanged to the parent's __invoke().
18 |      */
19 |     public function __invoke(array $modelInputs): MaskedLMOutput
20 |     {
21 |         $parentOutput = parent::__invoke($modelInputs);
22 | 
23 |         return MaskedLMOutput::fromOutput($parentOutput);
24 |     }
25 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/MobileBertForQuestionAnswering.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\QuestionAnsweringModelOutput;
 9 | 
10 | /**
11 |  * MobileBert Model with a span classification head on top for extractive question-answering tasks.
12 |  */
13 | class MobileBertForQuestionAnswering extends MobileBertPretrainedModel
14 | {
15 |     /**
16 |      * Invokes the parent model and converts what it returns into a QuestionAnsweringModelOutput.
17 |      *
18 |      * @param array $modelInputs Inputs handed unchanged to the parent's __invoke().
19 |      */
20 |     public function __invoke(array $modelInputs): QuestionAnsweringModelOutput
21 |     {
22 |         $parentOutput = parent::__invoke($modelInputs);
23 | 
24 |         return QuestionAnsweringModelOutput::fromOutput($parentOutput);
25 |     }
26 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/MobileBertForSequenceClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\SequenceClassifierOutput;
 9 | 
10 | /**
11 |  * MobileBert Model transformer with a sequence classification/regression head on top
12 |  * (a linear layer on top of the pooled output).
13 |  */
14 | class MobileBertForSequenceClassification extends MobileBertPretrainedModel
15 | {
16 |     /**
17 |      * Invokes the parent model and converts what it returns into a SequenceClassifierOutput.
18 |      *
19 |      * @param array $modelInputs Inputs handed unchanged to the parent's __invoke().
20 |      */
21 |     public function __invoke(array $modelInputs): SequenceClassifierOutput
22 |     {
23 |         $parentOutput = parent::__invoke($modelInputs);
24 | 
25 |         return SequenceClassifierOutput::fromOutput($parentOutput);
26 |     }
27 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/MobileBertModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * Declares no members of its own; all behaviour is inherited from MobileBertPretrainedModel.
10 |  */
11 | class MobileBertModel extends MobileBertPretrainedModel
12 | {
13 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/MobileBertPretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * Common parent of the MobileBert model classes; adds nothing on top of PretrainedModel.
10 |  */
11 | class MobileBertPretrainedModel extends PretrainedModel
12 | {
13 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/OwlViTForObjectDetection.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\ObjectDetectionOutput;
 9 | 
10 | /**
11 |  * OwlViT model class whose call result is returned as an ObjectDetectionOutput.
12 |  */
13 | class OwlViTForObjectDetection extends OwlViTPretrainedModel
14 | {
15 |     /**
16 |      * Invokes the parent model and converts what it returns into an ObjectDetectionOutput.
17 |      *
18 |      * @param array $modelInputs Inputs handed unchanged to the parent's __invoke().
19 |      */
20 |     public function __invoke(array $modelInputs): ObjectDetectionOutput
21 |     {
22 |         $parentOutput = parent::__invoke($modelInputs);
23 | 
24 |         return ObjectDetectionOutput::fromOutput($parentOutput);
25 |     }
26 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/OwlViTModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * Declares no members of its own; all behaviour is inherited from OwlViTPretrainedModel.
10 |  */
11 | class OwlViTModel extends OwlViTPretrainedModel
12 | {
13 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/OwlViTPretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * Common parent of the OwlViT model classes; adds nothing on top of PretrainedModel.
10 |  */
11 | class OwlViTPretrainedModel extends PretrainedModel
12 | {
13 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/Owlv2ForObjectDetection.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\ObjectDetectionOutput;
 9 | 
10 | /**
11 |  * Owlv2 model class whose call result is returned as an ObjectDetectionOutput.
12 |  */
13 | class Owlv2ForObjectDetection extends Owlv2PretrainedModel
14 | {
15 |     /**
16 |      * Invokes the parent model and converts what it returns into an ObjectDetectionOutput.
17 |      *
18 |      * @param array $modelInputs Inputs handed unchanged to the parent's __invoke().
19 |      */
20 |     public function __invoke(array $modelInputs): ObjectDetectionOutput
21 |     {
22 |         $parentOutput = parent::__invoke($modelInputs);
23 | 
24 |         return ObjectDetectionOutput::fromOutput($parentOutput);
25 |     }
26 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/Owlv2Model.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * Declares no members of its own; all behaviour is inherited from Owlv2PretrainedModel.
10 |  */
11 | class Owlv2Model extends Owlv2PretrainedModel
12 | {
13 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/Owlv2PretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * Common parent of the Owlv2 model classes; adds nothing on top of PretrainedModel.
10 |  */
11 | class Owlv2PretrainedModel extends PretrainedModel
12 | {
13 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/Qwen2ForCausalLM.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * Declares no members of its own; all behaviour is inherited from Qwen2PreTrainedModel.
10 |  */
11 | class Qwen2ForCausalLM extends Qwen2PreTrainedModel
12 | {
13 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/Qwen2Model.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * Declares no members of its own; all behaviour is inherited from Qwen2PreTrainedModel.
10 |  */
11 | class Qwen2Model extends Qwen2PreTrainedModel
12 | {
13 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/Qwen2PreTrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\ModelArchitecture;
 9 | use Codewithkyrian\Transformers\Utils\AutoConfig;
10 | use Codewithkyrian\Transformers\Utils\GenerationConfig;
11 | use Codewithkyrian\Transformers\Utils\InferenceSession;
12 | 
13 | /**
14 |  * Shared base for the Qwen2 model classes.
15 |  *
16 |  * The constructor overwrites the config's padding token with its `eos_token_id`
17 |  * and caches the head count, layer count and per-head dimension read from the config.
18 |  */
19 | class Qwen2PreTrainedModel extends PretrainedModel
20 | {
21 |     protected int $numHeads;
22 |     protected int $numLayers;
23 |     protected int $dimKv;
24 | 
25 |     /**
26 |      * @param AutoConfig        $config            Configuration handed to the parent constructor.
27 |      * @param InferenceSession  $session           Session handed to the parent constructor.
28 |      * @param ModelArchitecture $modelArchitecture Promoted to a public property and handed to the parent.
29 |      * @param GenerationConfig  $generationConfig  Promoted to a public property.
30 |      */
31 |     public function __construct(
32 |         AutoConfig               $config,
33 |         InferenceSession         $session,
34 |         public ModelArchitecture $modelArchitecture,
35 |         public GenerationConfig  $generationConfig
36 |     )
37 |     {
38 |         parent::__construct($config, $session, $modelArchitecture);
39 | 
40 |         // The config is assumed to lack pad_token_id, so the EOS token id stands in for it.
41 |         $eosTokenId = $this->config['eos_token_id'];
42 |         $this->config['pad_token_id'] = $eosTokenId;
43 |         $this->config->padTokenId = $eosTokenId;
44 | 
45 |         // Prefer num_key_value_heads; fall back to num_attention_heads when it is not set.
46 |         $headCount = $this->config['num_key_value_heads'] ?? $this->config['num_attention_heads'];
47 |         $this->numHeads = $headCount;
48 |         $this->numLayers = $this->config['num_hidden_layers'];
49 | 
50 |         // The per-head dimension always divides by num_attention_heads, not by the value above.
51 |         $hiddenSize = $this->config['hidden_size'];
52 |         $this->dimKv = $hiddenSize / $this->config['num_attention_heads'];
53 |     }
54 | }
40 | 


--------------------------------------------------------------------------------
/src/Models/Pretrained/RoFormerForMaskedLM.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 6 | 
 7 | use Codewithkyrian\Transformers\Models\Output\MaskedLMOutput;
 8 | 
 9 | /**
10 |  * RoFormer Model with a `language modeling` head on top.
11 |  */
12 | class RoFormerForMaskedLM extends RoFormerPretrainedModel
13 | {
14 |     /**
15 |      * Invokes the parent model and converts what it returns into a MaskedLMOutput.
16 |      *
17 |      * @param array $modelInputs Inputs handed unchanged to the parent's __invoke().
18 |      */
19 |     public function __invoke(array $modelInputs): MaskedLMOutput
20 |     {
21 |         $parentOutput = parent::__invoke($modelInputs);
22 | 
23 |         return MaskedLMOutput::fromOutput($parentOutput);
24 |     }
25 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/RoFormerForQuestionAnswering.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\QuestionAnsweringModelOutput;
 9 | 
10 | /**
11 |  * RoFormer Model with a span classification head on top for extractive question-answering tasks like SQuAD
12 |  * (a linear layer on top of the hidden-states output to compute `span start logits` and `span end logits`).
13 |  *
14 |  * Extends the RoFormer base class, matching the other RoFormer task classes.
15 |  */
16 | class RoFormerForQuestionAnswering extends RoFormerPretrainedModel
17 | {
18 |     /**
19 |      * Invokes the parent model and converts what it returns into a QuestionAnsweringModelOutput.
20 |      *
21 |      * @param array $modelInputs Inputs handed unchanged to the parent's __invoke().
22 |      */
23 |     public function __invoke(array $modelInputs): QuestionAnsweringModelOutput
24 |     {
25 |         return QuestionAnsweringModelOutput::fromOutput(parent::__invoke($modelInputs));
26 |     }
27 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/RoFormerForSequenceClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\SequenceClassifierOutput;
 9 | 
10 | /**
11 |  * RoFormer Model transformer with a sequence classification/regression head on top
12 |  * (a linear layer on top of the pooled output).
13 |  */
14 | class RoFormerForSequenceClassification extends RoFormerPretrainedModel
15 | {
16 |     /**
17 |      * Invokes the parent model and converts what it returns into a SequenceClassifierOutput.
18 |      *
19 |      * @param array $modelInputs Inputs handed unchanged to the parent's __invoke().
20 |      */
21 |     public function __invoke(array $modelInputs): SequenceClassifierOutput
22 |     {
23 |         $parentOutput = parent::__invoke($modelInputs);
24 | 
25 |         return SequenceClassifierOutput::fromOutput($parentOutput);
26 |     }
27 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/RoFormerForTokenClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\SequenceClassifierOutput;
 9 | use Codewithkyrian\Transformers\Models\Output\TokenClassifierOutput;
10 | 
11 | /**
12 |  * RoFormer Model with a token classification head on top (a linear layer on top of the hidden-states output)
13 |  * e.g. for Named-Entity-Recognition (NER) tasks.
14 |  *
15 |  * Extends the RoFormer base class, matching the other RoFormer task classes.
16 |  */
17 | class RoFormerForTokenClassification extends RoFormerPretrainedModel
18 | {
19 |     /**
20 |      * Invokes the parent model and converts what it returns into a TokenClassifierOutput.
21 |      *
22 |      * @param array $modelInputs Inputs handed unchanged to the parent's __invoke().
23 |      */
24 |     public function __invoke(array $modelInputs): TokenClassifierOutput
25 |     {
26 |         return TokenClassifierOutput::fromOutput(parent::__invoke($modelInputs));
27 |     }
28 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/RoFormerModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * The bare RoFormer Model transformer outputting raw hidden-states without any specific head on top.
10 |  *
11 |  * Declares no members of its own; all behaviour is inherited from RoFormerPretrainedModel.
12 |  */
13 | class RoFormerModel extends RoFormerPretrainedModel
14 | {
15 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/RoFormerPretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * Common parent of the RoFormer model classes; adds nothing on top of PretrainedModel.
10 |  */
11 | class RoFormerPretrainedModel extends PretrainedModel
12 | {
13 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/RobertaForMaskedLM.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 6 | 
 7 | use Codewithkyrian\Transformers\Models\Output\MaskedLMOutput;
 8 | 
 9 | /**
10 |  * RobertaForMaskedLM class for performing masked language modeling on Roberta models.
11 |  */
12 | class RobertaForMaskedLM extends RobertaPretrainedModel
13 | {
14 |     /**
15 |      * Invokes the parent model and converts what it returns into a MaskedLMOutput.
16 |      *
17 |      * @param array $modelInputs Inputs handed unchanged to the parent's __invoke().
18 |      */
19 |     public function __invoke(array $modelInputs): MaskedLMOutput
20 |     {
21 |         $parentOutput = parent::__invoke($modelInputs);
22 | 
23 |         return MaskedLMOutput::fromOutput($parentOutput);
24 |     }
25 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/RobertaForQuestionAnswering.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\QuestionAnsweringModelOutput;
 9 | 
10 | /**
11 |  * RobertaForQuestionAnswering class for performing question answering on Roberta models.
12 |  */
13 | class RobertaForQuestionAnswering extends RobertaPretrainedModel
14 | {
15 |     /**
16 |      * Invokes the parent model and converts what it returns into a QuestionAnsweringModelOutput.
17 |      *
18 |      * @param array $modelInputs Inputs handed unchanged to the parent's __invoke().
19 |      */
20 |     public function __invoke(array $modelInputs): QuestionAnsweringModelOutput
21 |     {
22 |         $parentOutput = parent::__invoke($modelInputs);
23 | 
24 |         return QuestionAnsweringModelOutput::fromOutput($parentOutput);
25 |     }
26 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/RobertaForSequenceClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\SequenceClassifierOutput;
 9 | 
10 | /**
11 |  * RobertaForSequenceClassification class for performing sequence classification on Roberta models.
12 |  */
13 | class RobertaForSequenceClassification extends RobertaPretrainedModel
14 | {
15 |     /**
16 |      * Invokes the parent model and converts what it returns into a SequenceClassifierOutput.
17 |      *
18 |      * @param array $modelInputs Inputs handed unchanged to the parent's __invoke().
19 |      */
20 |     public function __invoke(array $modelInputs): SequenceClassifierOutput
21 |     {
22 |         $parentOutput = parent::__invoke($modelInputs);
23 | 
24 |         return SequenceClassifierOutput::fromOutput($parentOutput);
25 |     }
26 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/RobertaForTokenClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\SequenceClassifierOutput;
 9 | use Codewithkyrian\Transformers\Models\Output\TokenClassifierOutput;
10 | 
11 | /**
12 |  * RobertaForTokenClassification class for performing token classification on Roberta models.
13 |  */
14 | class RobertaForTokenClassification extends RobertaPretrainedModel
15 | {
16 |     /**
17 |      * Invokes the parent model and converts what it returns into a TokenClassifierOutput.
18 |      *
19 |      * @param array $modelInputs Inputs handed unchanged to the parent's __invoke().
20 |      */
21 |     public function __invoke(array $modelInputs): TokenClassifierOutput
22 |     {
23 |         $parentOutput = parent::__invoke($modelInputs);
24 | 
25 |         return TokenClassifierOutput::fromOutput($parentOutput);
26 |     }
27 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/RobertaModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * Declares no members of its own; all behaviour is inherited from RobertaPretrainedModel.
10 |  */
11 | class RobertaModel extends RobertaPretrainedModel
12 | {
13 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/RobertaPretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * Common parent of the Roberta model classes; adds nothing on top of PretrainedModel.
10 |  */
11 | class RobertaPretrainedModel extends PretrainedModel
12 | {
13 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/SiglipModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * SigLIP Text and Vision Model with projection layers on top.
10 |  *
11 |  * Declares no members of its own; all behaviour is inherited from SiglipPretrainedModel.
12 |  */
13 | class SiglipModel extends SiglipPretrainedModel
14 | {
15 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/SiglipPretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * Common parent of the SigLIP model classes; adds nothing on top of PretrainedModel.
10 |  */
11 | class SiglipPretrainedModel extends PretrainedModel
12 | {
13 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/SiglipTextModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\ModelArchitecture;
 9 | use Codewithkyrian\Transformers\Utils\AutoConfig;
10 | 
11 | /**
12 |  * The text model from SigLIP without any head or projection on top.
13 |  */
14 | class SiglipTextModel extends SiglipPretrainedModel
15 | {
16 |     /**
17 |      * Loads the model through the parent loader, defaulting the model file name to 'text_model'.
18 |      *
19 |      * Every argument is forwarded unchanged to parent::fromPretrained(); only a null
20 |      * $modelFilename is replaced before the call.
21 |      *
22 |      * @param AutoConfig|array|null $config        Optional configuration; null is passed through as-is.
23 |      * @param string|null           $modelFilename Model file name; 'text_model' is used when null.
24 |      */
25 |     public static function fromPretrained(
26 |         string $modelNameOrPath,
27 |         bool $quantized = true,
28 |         AutoConfig|array|null $config = null,
29 |         ?string $cacheDir = null,
30 |         ?string $token = null,
31 |         string $revision = 'main',
32 |         ?string $modelFilename = null,
33 |         ModelArchitecture $modelArchitecture = ModelArchitecture::EncoderOnly,
34 |         ?callable $onProgress = null
35 |     ): PretrainedModel
36 |     {
37 |         // Update default model file name if not provided
38 |         $modelFilename ??= 'text_model';
39 |         return parent::fromPretrained($modelNameOrPath, $quantized, $config, $cacheDir, $token, $revision, $modelFilename, $modelArchitecture, $onProgress);
40 |     }
41 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/SiglipVisionModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\ModelArchitecture;
 9 | use Codewithkyrian\Transformers\Utils\AutoConfig;
10 | 
11 | /**
12 |  * SigLIP vision model class whose loader defaults the model file name to 'vision_model'.
13 |  *
14 |  * NOTE(review): this extends CLIPPretrainedModel rather than SiglipPretrainedModel —
15 |  * confirm that is intentional.
16 |  */
17 | class SiglipVisionModel extends CLIPPretrainedModel
18 | {
19 |     /**
20 |      * Loads the model through the parent loader, defaulting the model file name to 'vision_model'.
21 |      *
22 |      * Every argument is forwarded unchanged to parent::fromPretrained(); only a null
23 |      * $modelFilename is replaced before the call.
24 |      *
25 |      * @param AutoConfig|array|null $config        Optional configuration; null is passed through as-is.
26 |      * @param string|null           $modelFilename Model file name; 'vision_model' is used when null.
27 |      */
28 |     public static function fromPretrained(
29 |         string $modelNameOrPath,
30 |         bool $quantized = true,
31 |         AutoConfig|array|null $config = null,
32 |         ?string $cacheDir = null,
33 |         ?string $token = null,
34 |         string $revision = 'main',
35 |         ?string $modelFilename = null,
36 |         ModelArchitecture $modelArchitecture = ModelArchitecture::EncoderOnly,
37 |         ?callable $onProgress = null
38 |     ): PretrainedModel
39 |     {
40 |         // Update default model file name if not provided
41 |         $modelFilename ??= 'vision_model';
42 |         return parent::fromPretrained($modelNameOrPath, $quantized, $config, $cacheDir, $token, $revision, $modelFilename, $modelArchitecture, $onProgress);
43 |     }
44 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/Swin2SRForImageSuperResolution.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * Swin2SR Model transformer with an upsampler head on top for image super resolution and restoration.
10 |  *
11 |  * Declares no members of its own; all behaviour is inherited from Swin2SRPretrainedModel.
12 |  */
13 | class Swin2SRForImageSuperResolution extends Swin2SRPretrainedModel
14 | {
15 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/Swin2SRModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * Declares no members of its own; all behaviour is inherited from Swin2SRPretrainedModel.
10 |  */
11 | class Swin2SRModel extends Swin2SRPretrainedModel
12 | {
13 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/Swin2SRPretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * Common parent of the Swin2SR model classes; adds nothing on top of PretrainedModel.
10 |  */
11 | class Swin2SRPretrainedModel extends PretrainedModel
12 | {
13 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/T5ForConditionalGeneration.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\ModelArchitecture;
 9 | use Codewithkyrian\Transformers\Utils\AutoConfig;
10 | use Codewithkyrian\Transformers\Utils\GenerationConfig;
11 | use Codewithkyrian\Transformers\Utils\InferenceSession;
12 | 
13 | /**
14 |  * T5 model class for conditional generation.
15 |  *
16 |  * Holds a merged decoder session and a generation config, and caches the
17 |  * encoder/decoder layer counts, head count and `d_kv` read from the config.
18 |  */
19 | class T5ForConditionalGeneration extends T5PretrainedModel
20 | {
21 |     public mixed $numDecoderLayers;
22 |     public mixed $numDecoderHeads;
23 |     public mixed $decoderDimKv;
24 |     public mixed $numEncoderLayers;
25 |     public mixed $numEncoderHeads;
26 |     public mixed $encoderDimKv;
27 | 
28 |     /**
29 |      * @param AutoConfig        $config               Configuration handed to the parent constructor.
30 |      * @param InferenceSession  $session              Session handed to the parent constructor.
31 |      * @param InferenceSession  $decoderMergedSession Promoted to a public property.
32 |      * @param ModelArchitecture $modelArchitecture    Promoted to a public property and handed to the parent.
33 |      * @param GenerationConfig  $generationConfig     Promoted to a public property.
34 |      */
35 |     public function __construct(
36 |         AutoConfig               $config,
37 |         InferenceSession         $session,
38 |         public InferenceSession  $decoderMergedSession,
39 |         public ModelArchitecture $modelArchitecture,
40 |         public GenerationConfig  $generationConfig
41 |     )
42 |     {
43 |         parent::__construct($config, $session, $modelArchitecture);
44 | 
45 |         // Encoder and decoder share the same num_heads and d_kv config entries.
46 |         $headCount = $this->config['num_heads'];
47 |         $keyValueDim = $this->config['d_kv'];
48 | 
49 |         $this->numDecoderLayers = $this->config['num_decoder_layers'];
50 |         $this->numDecoderHeads = $headCount;
51 |         $this->decoderDimKv = $keyValueDim;
52 | 
53 |         $this->numEncoderLayers = $this->config['num_layers'];
54 |         $this->numEncoderHeads = $headCount;
55 |         $this->encoderDimKv = $keyValueDim;
56 |     }
57 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/T5Model.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /** Plain T5 model: adds nothing on top of what T5PretrainedModel provides. */
 9 | class T5Model extends T5PretrainedModel
10 | {
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/T5PretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /** Shared parent of the T5 model classes; currently identical to PretrainedModel. */
 9 | class T5PretrainedModel extends PretrainedModel
10 | {
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/TrOCRForCausalLM.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /** TrOCR causal-LM model class; inherits everything from TrOCRPretrainedModel. */
 9 | class TrOCRForCausalLM extends TrOCRPretrainedModel
10 | {
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/TrOCRPretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\ModelArchitecture;
 9 | use Codewithkyrian\Transformers\Utils\AutoConfig;
10 | use Codewithkyrian\Transformers\Utils\GenerationConfig;
11 | use Codewithkyrian\Transformers\Utils\InferenceSession;
12 | 
13 | /**
14 |  * Base class for the TrOCR models.
15 |  *
16 |  * All six size properties are derived from the `decoder_layers`, `decoder_attention_heads`
17 |  * and `d_model` config entries; the encoder-side ones mirror the decoder-side ones.
18 |  */
19 | class TrOCRPretrainedModel extends PretrainedModel
20 | {
21 |     public mixed $numDecoderLayers;
22 |     public mixed $numDecoderHeads;
23 |     public mixed $decoderDimKv;
24 |     public mixed $numEncoderLayers;
25 |     public mixed $numEncoderHeads;
26 |     public mixed $encoderDimKv;
27 | 
28 |     public function __construct(
29 |         AutoConfig               $config,
30 |         InferenceSession         $session,
31 |         public ModelArchitecture $modelArchitecture,
32 |         public GenerationConfig  $generationConfig
33 |     )
34 |     {
35 |         parent::__construct($config, $session, $modelArchitecture);
36 | 
37 |         $layerCount = $this->config['decoder_layers'];
38 |         $this->numDecoderLayers = $layerCount;
39 |         $this->numEncoderLayers = $layerCount;
40 | 
41 |         $headCount = $this->config['decoder_attention_heads'];
42 |         $this->numDecoderHeads = $headCount;
43 |         $this->numEncoderHeads = $headCount;
44 | 
45 |         // Per-head size: `d_model` divided by the number of attention heads.
46 |         $perHeadDim = $this->config['d_model'] / $headCount;
47 |         $this->decoderDimKv = $perHeadDim;
48 |         $this->encoderDimKv = $perHeadDim;
49 |     }
50 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/ViTForImageClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\SequenceClassifierOutput;
 9 | 
10 | /**
11 |  * ViT model whose raw output is wrapped in a SequenceClassifierOutput.
12 |  */
13 | class ViTForImageClassification extends ViTPretrainedModel
14 | {
15 |     /**
16 |      * Runs the inherited model call and converts its result.
17 |      *
18 |      * @param array $modelInputs Inputs passed through unchanged to the parent call.
19 |      */
20 |     public function __invoke(array $modelInputs): SequenceClassifierOutput
21 |     {
22 |         $rawOutput = parent::__invoke($modelInputs);
23 | 
24 |         return SequenceClassifierOutput::fromOutput($rawOutput);
25 |     }
26 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/ViTModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /** Plain ViT model: adds nothing on top of what ViTPretrainedModel provides. */
 9 | class ViTModel extends ViTPretrainedModel
10 | {
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/ViTPretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /** Shared parent of the ViT model classes; currently identical to PretrainedModel. */
 9 | class ViTPretrainedModel extends PretrainedModel
10 | {
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/Wav2Vec2ForAudioFrameClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\ModelOutput;
 9 | use Codewithkyrian\Transformers\Models\Output\TokenClassifierOutput;
10 | 
11 | /**
12 |  * Wav2Vec2 Model with a frame classification head on top for tasks like Speaker Diarization.
13 |  */
14 | class Wav2Vec2ForAudioFrameClassification extends Wav2Vec2PretrainedModel
15 | {
16 |     /**
17 |      * Runs the inherited model call and wraps its result in a TokenClassifierOutput.
18 |      *
19 |      * @param array $modelInputs Inputs passed through unchanged to the parent call.
20 |      */
21 |     public function __invoke(array $modelInputs): array|ModelOutput
22 |     {
23 |         $rawOutput = parent::__invoke($modelInputs);
24 | 
25 |         return TokenClassifierOutput::fromOutput($rawOutput);
26 |     }
27 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/Wav2Vec2ForCTC.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\CasualLMOutput;
 9 | use Codewithkyrian\Transformers\Models\Output\ModelOutput;
10 | 
11 | /**
12 |  * Wav2Vec2 model class for CTC; at present it adds nothing to Wav2Vec2PretrainedModel.
13 |  *
14 |  * NOTE(review): the CasualLMOutput wrapper below is commented out, so calls use the
15 |  * inherited __invoke as-is — presumably intentional; confirm before re-enabling it.
16 |  */
17 | class Wav2Vec2ForCTC extends Wav2Vec2PretrainedModel
18 | {
19 | //    public function __invoke(array $modelInputs): array|ModelOutput
20 | //    {
21 | //        return CasualLMOutput::fromOutput(parent::__invoke($modelInputs));
22 | //    }
23 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/Wav2Vec2ForSequenceClassification.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\ModelOutput;
 9 | use Codewithkyrian\Transformers\Models\Output\SequenceClassifierOutput;
10 | 
11 | /**
12 |  * Wav2Vec2 model whose raw output is wrapped in a SequenceClassifierOutput.
13 |  */
14 | class Wav2Vec2ForSequenceClassification extends Wav2Vec2PretrainedModel
15 | {
16 |     /**
17 |      * Runs the inherited model call and converts its result.
18 |      *
19 |      * @param array $modelInputs Inputs passed through unchanged to the parent call.
20 |      */
21 |     public function __invoke(array $modelInputs): array|ModelOutput
22 |     {
23 |         $rawOutput = parent::__invoke($modelInputs);
24 | 
25 |         return SequenceClassifierOutput::fromOutput($rawOutput);
26 |     }
27 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/Wav2Vec2Model.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /**
 9 |  * The bare Wav2Vec2 Model transformer outputting raw hidden-states without any specific head on top.
10 |  *
11 |  * **Example:** Load and run a `Wav2Vec2Model` for feature extraction.
12 |  *
13 |  * ```php
14 |  *
15 |  * // Read and preprocess audio
16 |  * $processor = AutoProcessor::fromPretrained('Xenova/mms-300m');
17 |  * $audio = Audio::read('https://huggingface.co/datasets/Narsil/asr_dummy/resolve/main/mlk.flac');
18 |  * $audioTensor = $audio->toTensor(samplerate: 16000);
19 |  * $inputs = $processor($audioTensor);
20 |  *
21 |  * // Run model with inputs
22 |  * $model = AutoModel::fromPretrained('Xenova/mms-300m');
23 |  * $output = $model($inputs);
24 |  * // {
25 |  * //   last_hidden_state: Tensor {
26 |  * //     shape: [ 1, 1144, 1024 ],
27 |  * //     dtype: 'float32',
28 |  * //     buffer: (1171456) [ ... ],
29 |  * //     size: 1171456
30 |  * //   }
31 |  * // }
32 |  * ```
33 |  */
34 | class Wav2Vec2Model extends Wav2Vec2PretrainedModel
35 | {
36 | 
37 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/Wav2Vec2PretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /** Shared parent of the Wav2Vec2 model classes; currently identical to PretrainedModel. */
 9 | class Wav2Vec2PretrainedModel extends PretrainedModel
10 | {
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/WhisperModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /** Plain Whisper model: adds nothing on top of what WhisperPretrainedModel provides. */
 9 | class WhisperModel extends WhisperPretrainedModel
10 | {
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/WhisperPretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /** Parent class for Whisper models; currently identical to PretrainedModel. */
 9 | class WhisperPretrainedModel extends PretrainedModel
10 | {
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/YolosForObjectDetection.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | use Codewithkyrian\Transformers\Models\Output\ObjectDetectionOutput;
 9 | 
10 | /**
11 |  * YOLOS model whose raw output is wrapped in an ObjectDetectionOutput.
12 |  */
13 | class YolosForObjectDetection extends YolosPretrainedModel
14 | {
15 |     /**
16 |      * Runs the inherited model call and converts its result.
17 |      *
18 |      * @param array $modelInputs Inputs passed through unchanged to the parent call.
19 |      */
20 |     public function __invoke(array $modelInputs): ObjectDetectionOutput
21 |     {
22 |         $rawOutput = parent::__invoke($modelInputs);
23 | 
24 |         return ObjectDetectionOutput::fromOutput($rawOutput);
25 |     }
26 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/YolosModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /** Plain YOLOS model: adds nothing on top of what YolosPretrainedModel provides. */
 9 | class YolosModel extends YolosPretrainedModel
10 | {
11 | }


--------------------------------------------------------------------------------
/src/Models/Pretrained/YolosPretrainedModel.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Models\Pretrained;
 7 | 
 8 | /** Shared parent of the YOLOS model classes; currently identical to PretrainedModel. */
 9 | class YolosPretrainedModel extends PretrainedModel
10 | {
11 | }


--------------------------------------------------------------------------------
/src/Normalizers/Lowercase.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Normalizers;
 7 | 
 8 | /**
 9 |  * A Normalizer that lowercases the input string.
10 |  */
11 | class Lowercase extends Normalizer
12 | {
13 |     /**
14 |      * Lowercases the text with the multibyte-aware mb_strtolower().
15 |      *
16 |      * @param string $text The input text.
17 |      * @return string The lowercased text.
18 |      */
19 |     public function normalize(string $text): string
20 |     {
21 |         $lowered = mb_strtolower($text);
22 | 
23 |         return $lowered;
24 |     }
25 | }


--------------------------------------------------------------------------------
/src/Normalizers/NFC.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\Normalizers;
 6 | 
 7 | use function normalizer_normalize;
 8 | /**
 9 |  * A normalizer that applies Unicode normalization form C (NFC) to the input text.
10 |  */
11 | class NFC extends Normalizer
12 | {
13 |     /**
14 |      * Returns the NFC form of the text.
15 |      *
16 |      * normalizer_normalize() reports an error by returning false, which the string
17 |      * return type would reject with a TypeError; in that case the text is returned unchanged.
18 |      *
19 |      * @param string $text The input text.
20 |      * @return string The normalized text, or the original text if normalization failed.
21 |      */
22 |     public function normalize(string $text): string
23 |     {
24 |         $normalized = normalizer_normalize($text, \Normalizer::NFC);
25 | 
26 |         return $normalized === false ? $text : $normalized;
27 |     }
28 | }


--------------------------------------------------------------------------------
/src/Normalizers/NFKC.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Normalizers;
 7 | 
 8 | /*
 9 |  * NFKC Normalizer.
10 |  */
11 | 
12 | use function normalizer_normalize;
13 | 
14 | class NFKC extends Normalizer
15 | {
16 |     /**
17 |      * Returns the NFKC form of the text.
18 |      *
19 |      * normalizer_normalize() reports an error by returning false, which the string
20 |      * return type would reject with a TypeError; in that case the text is returned unchanged.
21 |      *
22 |      * @param string $text The input text.
23 |      * @return string The normalized text, or the original text if normalization failed.
24 |      */
25 |     public function normalize(string $text): string
26 |     {
27 |         $normalized = normalizer_normalize($text, \Normalizer::NFKC);
28 | 
29 |         return $normalized === false ? $text : $normalized;
30 |     }
31 | }


--------------------------------------------------------------------------------
/src/Normalizers/NFKD.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\Normalizers;
 6 | 
 7 | use function normalizer_normalize;
 8 | 
 9 | /**
10 |  * Normalizes a string to Normalization Form Compatibility Decomposition (NFKD).
11 | 
12 |  */
13 | class NFKD extends Normalizer
14 | {
15 |     /**
16 |      * Returns the NFKD form of the text.
17 |      *
18 |      * normalizer_normalize() reports an error by returning false, which the string
19 |      * return type would reject with a TypeError; in that case the text is returned unchanged.
20 |      *
21 |      * @param string $text The input text.
22 |      * @return string The normalized text, or the original text if normalization failed.
23 |      */
24 |     public function normalize(string $text): string
25 |     {
26 |         $normalized = normalizer_normalize($text, \Normalizer::NFKD);
27 | 
28 |         return $normalized === false ? $text : $normalized;
29 |     }
30 | }


--------------------------------------------------------------------------------
/src/Normalizers/Normalizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Normalizers;
 7 | 
 8 | /**
 9 |  * A base class for text normalization.
10 |  */
11 | abstract class Normalizer
12 | {
13 |     /**
14 |      * @param array $config The normalizer configuration, kept for subclasses to read.
15 |      */
16 |     public function __construct(protected array $config)
17 |     {
18 |     }
19 | 
20 |     /**
21 |      * Builds the normalizer selected by `$config['type']`.
22 |      *
23 |      * @param array|null $config Normalizer configuration, or null when there is none.
24 |      * @return self|null The normalizer, or null when `$config` is null.
25 |      * @throws \InvalidArgumentException If the type is missing or not recognised.
26 |      */
27 |     public static function fromConfig(?array $config): ?self
28 |     {
29 |         if ($config === null) {
30 |             return null;
31 |         }
32 | 
33 |         // Read the type once, tolerating a missing key. Concatenating `$config['type'] ?? null`
34 |         // directly does not work: `.` binds tighter than `??`, so the key is read unguarded.
35 |         $type = $config['type'] ?? null;
36 | 
37 |         return match ($type) {
38 |             'BertNormalizer' => new BertNormalizer($config),
39 |             'Precompiled' => new Precompiled($config),
40 |             'Sequence' => new NormalizerSequence($config),
41 |             'Replace' => new Replace($config),
42 |             'NFC' => new NFC($config),
43 |             'NFKC' => new NFKC($config),
44 |             'NFKD' => new NFKD($config),
45 |             'Strip' => new StripNormalizer($config),
46 |             'StripAccents' => new StripAccents($config),
47 |             'Lowercase' => new Lowercase($config),
48 |             'Prepend' => new Prepend($config),
49 |             default => throw new \InvalidArgumentException('Unknown normalizer type: ' . ($type ?? 'null')),
50 |         };
51 |     }
52 | 
53 |     /**
54 |      * Normalizes the given text.
55 |      *
56 |      * @param string $text The input text.
57 |      * @return string The normalized text.
58 |      */
59 |     abstract public function normalize(string $text): string;
60 | 
61 |     /**
62 |      * Lets a normalizer be called like a function; every argument is forwarded to normalize().
63 |      *
64 |      * The parameter list is left empty so that subclasses overriding __invoke stay compatible.
65 |      */
66 |     public function __invoke(): string
67 |     {
68 |         return $this->normalize(...func_get_args());
69 |     }
70 | }


--------------------------------------------------------------------------------
/src/Normalizers/NormalizerSequence.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Normalizers;
 7 | 
 8 | /**
 9 |  * A Normalizer that applies a sequence of Normalizers.
10 |  */
11 | class NormalizerSequence extends Normalizer
12 | {
13 |     /**
14 |      * The normalizers to apply, in order.
15 |      *
16 |      * @var Normalizer[]
17 |      */
18 |     protected array $normalizers;
19 | 
20 |     /**
21 |      * @param array $config Must contain a `normalizers` list with one config array per normalizer.
22 |      */
23 |     public function __construct(array $config)
24 |     {
25 |         parent::__construct($config);
26 | 
27 |         $this->normalizers = array_map(
28 |             static fn(array $entry) => Normalizer::fromConfig($entry),
29 |             $config['normalizers']
30 |         );
31 |     }
32 | 
33 |     /**
34 |      * Feeds the text through each normalizer in turn, passing every result on to the next one.
35 |      */
36 |     public function normalize(string $text): string
37 |     {
38 |         $current = $text;
39 | 
40 |         foreach ($this->normalizers as $step) {
41 |             $current = $step->normalize($current);
42 |         }
43 | 
44 |         return $current;
45 |     }
46 | }


--------------------------------------------------------------------------------
/src/Normalizers/Prepend.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Normalizers;
 7 | 
 8 | /**
 9 |  * A Normalizer that prepends a string to the input string.
10 |  */
11 | class Prepend extends Normalizer
12 | {
13 |     /**
14 |      * Puts the configured `prepend` string in front of the text.
15 |      *
16 |      * @param string $text The input text.
17 |      * @return string The prefix followed by the text.
18 |      */
19 |     public function normalize(string $text): string
20 |     {
21 |         $prefix = $this->config['prepend'];
22 | 
23 |         return $prefix . $text;
24 |     }
25 | }


--------------------------------------------------------------------------------
/src/Normalizers/Replace.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\Normalizers;
 6 | 
 7 | /**
 8 |  * Replace normalizer that replaces occurrences of a pattern with a given string or regular expression.
 9 |  */
10 | class Replace extends Normalizer
11 | {
12 |     /**
13 |      * Replaces every occurrence of the configured pattern with `config['content']`.
14 |      *
15 |      * `config['pattern']` may hold a `Regex` entry (PCRE source without delimiters) or a
16 |      * `String` entry (literal text); the regex is used when both are present. Without a
17 |      * usable pattern the text is returned unchanged.
18 |      *
19 |      * @param string $text The input text.
20 |      * @return string The text after replacement.
21 |      * @throws \RuntimeException If the regular expression cannot be applied.
22 |      */
23 |     public function normalize(string $text): string
24 |     {
25 |         $pattern = $this->config['pattern'] ?? null;
26 | 
27 |         if ($pattern === null) {
28 |             return $text;
29 |         }
30 | 
31 |         $regex = $pattern['Regex'] ?? null;
32 |         $string = $pattern['String'] ?? null;
33 |         $replacement = $this->config['content'] ?? '';
34 | 
35 |         if ($regex !== null) {
36 |             // The pattern is wrapped in `/` delimiters, so a `/` that is not already escaped
37 |             // must be escaped first. Escape pairs (`\x`) are matched as a unit and left alone.
38 |             $delimiterSafe = preg_replace_callback(
39 |                 '/\\\\.|\//s',
40 |                 static fn(array $match): string => $match[0] === '/' ? '\/' : $match[0],
41 |                 $regex
42 |             ) ?? $regex;
43 | 
44 |             // preg_replace() returns null on failure, which the string return type rejects.
45 |             return preg_replace("/{$delimiterSafe}/u", $replacement, $text)
46 |                 ?? throw new \RuntimeException('Replace normalizer failed: ' . preg_last_error_msg());
47 |         }
48 | 
49 |         if ($string !== null) {
50 |             return str_replace($string, $replacement, $text);
51 |         }
52 | 
53 |         return $text;
54 |     }
55 | }


--------------------------------------------------------------------------------
/src/Normalizers/StripAccents.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Normalizers;
 7 | 
 8 | use Codewithkyrian\Transformers\Tokenizers\TokenizerModel;
 9 | 
10 | /**
11 |  * StripAccents normalizer removes all accents from the text.
12 |  */
13 | class StripAccents extends Normalizer
14 | {
15 |     /** Delegates accent removal to TokenizerModel::removeAccents(). */
16 |     public function normalize(string $text): string
17 |     {
18 |         $withoutAccents = TokenizerModel::removeAccents($text);
19 | 
20 |         return $withoutAccents;
21 |     }
22 | }


--------------------------------------------------------------------------------
/src/Normalizers/StripNormalizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Normalizers;
 7 | 
 8 | /**
 9 |  * A normalizer that strips leading and/or trailing whitespace from the input text.
10 |  */
11 | class StripNormalizer extends Normalizer
12 | {
13 |     /**
14 |      * Trims whitespace from the start and/or end of the text, as selected by the
15 |      * `strip_left` and `strip_right` config flags.
16 |      *
17 |      * @param string $text The input text.
18 |      * @return string The trimmed text (unchanged when neither flag is set).
19 |      */
20 |     public function normalize(string $text): string
21 |     {
22 |         $stripLeft = (bool)$this->config['strip_left'];
23 |         $stripRight = (bool)$this->config['strip_right'];
24 | 
25 |         return match (true) {
26 |             // Both sides at once: a single trim() instead of ltrim() followed by rtrim()
27 |             $stripLeft && $stripRight => trim($text),
28 |             $stripLeft => ltrim($text),
29 |             $stripRight => rtrim($text),
30 |             default => $text,
31 |         };
32 |     }
33 | }


--------------------------------------------------------------------------------
/src/Pipelines/SummarizationPipeline.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Pipelines;
 7 | 
 8 | /**
 9 |  * A pipeline for summarization tasks, inheriting from Text2TextGenerationPipeline.
10 |  *
11 |  * **Example:** Summarization w/ `Xenova/distilbart-cnn-6-6`.
12 |  * ```php
13 |  * use function Codewithkyrian\Transformers\Pipelines\pipeline;
14 |  *
15 |  * $summarizer = pipeline('summarization', 'Xenova/distilbart-cnn-6-6');
16 |  *
17 |  * $article = 'The tower is 324 metres (1,063 ft) tall, about the same height as an 81-storey building,
18 |  *    and the tallest structure in Paris. Its base is square, measuring 125 metres (410 ft) on each side.
19 |  *    During its construction, the Eiffel Tower surpassed the Washington Monument to become the tallest
20 |  *    man-made structure in the world, a title it held for 41 years until the Chrysler Building in New
21 |  *    York City was finished in 1930. It was the first structure to reach a height of 300 metres. Due to
22 |  *    the addition of a broadcasting aerial at the top of the tower in 1957, it is now taller than the
23 |  *    Chrysler Building by 5.2 metres (17 ft). Excluding transmitters, the Eiffel Tower is the second-tallest
24 |  *    freestanding structure in France after the Millau Viaduct.';
25 |  *
26 |  * $summary = $summarizer($article, maxNewTokens: 128);
27 |  * // ['summary_text' => 'The Eiffel Tower is about the same height as an 81-storey building and the tallest structure in Paris. It is the second tallest free-standing structure in France after the Millau Viaduct.']
28 |  * ```
29 |  */
30 | class SummarizationPipeline extends Text2TextGenerationPipeline
31 | {
32 |     // Presumably the result key the generated text is returned under (cf. the example output above).
33 |     protected string $key = 'summary_text';
34 | }


--------------------------------------------------------------------------------
/src/Pipelines/TranslationPipeline.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Pipelines;
 7 | 
 8 | /**
 9 |  * Translates text from one language to another.
10 |  *
11 |  * **Example:** Multilingual translation w/ `Xenova/nllb-200-distilled-600M`.
12 |  * ```php
13 |  * use function Codewithkyrian\Transformers\Pipelines\pipeline;
14 |  *
15 |  * $translator = pipeline('translation', model: 'Xenova/nllb-200-distilled-600M');
16 |  *
17 |  * $output = $translator('जीवन एक चॉकलेट बॉक्स की तरह है।', srcLang: 'hin_Deva', tgtLang: 'fra_Latn'); // Hindi to French
18 |  * // ['translation_text' => 'La vie est comme une boîte a chocolat.']
19 |  * ```
20 |  *
21 |  * **Example:** Multilingual translation w/ `Xenova/m2m100_418M`.
22 |  *
23 |  * ```php
24 |  * use function Codewithkyrian\Transformers\Pipelines\pipeline;
25 |  *
26 |  * $translator = pipeline('translation', model: 'Xenova/m2m100_418M');
27 |  *
28 |  * $output = $translator('生活就像一盒巧克力。', srcLang: 'zh', tgtLang: 'en'); // Chinese to English
29 |  * // ['translation_text' => 'Life is like a box of chocolate.']
30 |  * ```
31 |  */
32 | class TranslationPipeline extends Text2TextGenerationPipeline
33 | {
34 |     // Presumably the result key the generated text is returned under (cf. the example outputs above).
35 |     protected string $key = 'translation_text';
36 | }


--------------------------------------------------------------------------------
/src/PostProcessors/ByteLevelPostProcessor.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PostProcessors;
 7 | 
 8 | /**
 9 |  * A PostProcessor that returns the given tokens as is.
10 |  */
11 | class ByteLevelPostProcessor extends PostProcessor
12 | {
13 |     /**
14 |      * Returns the tokens unchanged, with the pair (if any) appended, and a token type id of 0
15 |      * for every token.
16 |      *
17 |      * @param string[] $tokens The input tokens.
18 |      * @param string[]|null $tokenPair The input tokens for the second sequence in a pair.
19 |      * @param bool $addSpecialTokens Accepted for signature compatibility; not used here.
20 |      * @return PostProcessedOutput
21 |      */
22 |     public function postProcess(array $tokens, ?array $tokenPair = null, bool $addSpecialTokens = true): PostProcessedOutput
23 |     {
24 |         $merged = $tokenPair === null ? $tokens : array_merge($tokens, $tokenPair);
25 | 
26 |         return new PostProcessedOutput($merged, array_fill(0, count($merged), 0));
27 |     }
28 | }


--------------------------------------------------------------------------------
/src/PostProcessors/PostProcessedOutput.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PostProcessors;
 7 | 
 8 | /**
 9 |  * Plain value holder for the result of a post-processor.
10 |  */
11 | class PostProcessedOutput
12 | {
13 |     /**
14 |      * @param string[] $tokens The tokens after post-processing.
15 |      * @param int[]|null $tokenTypeIds Token type ids produced by the post-processor, if any.
16 |      */
17 |     public function __construct(public array $tokens, public ?array $tokenTypeIds = null)
18 |     {
19 |     }
20 | }


--------------------------------------------------------------------------------
/src/PostProcessors/PostProcessor.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PostProcessors;
 7 | 
 8 | abstract class PostProcessor
 9 | {
10 |     /**
11 |      * @param array $config The post-processor configuration.
12 |      */
13 |     public function __construct(public array $config)
14 |     {
15 |     }
16 | 
17 |     /**
18 |      * Factory method to create a PostProcessor object from a configuration object.
19 |      *
20 |      * @param array|null $config Post-processor configuration, or null when there is none.
21 |      * @return self|null The post-processor, or null when `$config` is null.
22 |      * @throws \InvalidArgumentException If the type is missing or not recognised.
23 |      */
24 |     public static function fromConfig(?array $config): ?self
25 |     {
26 |         if ($config === null) {
27 |             return null;
28 |         }
29 | 
30 |         // Read the type once and tolerate a missing key, so a config without `type`
31 |         // fails with the exception below instead of undefined-key warnings.
32 |         $type = $config['type'] ?? null;
33 | 
34 |         return match ($type) {
35 |             'BertProcessing' => new BertProcessing($config),
36 |             'ByteLevel' => new ByteLevelPostProcessor($config),
37 |             'TemplateProcessing' => new TemplateProcessing($config),
38 |             'RobertaProcessing' => new RobertaProcessing($config),
39 |             'Sequence' => new PostProcessorSequence($config),
40 |             default => throw new \InvalidArgumentException('Unknown post-processor type ' . ($type ?? 'null')),
41 |         };
42 |     }
43 | 
44 |     /**
45 |      * @param array $tokens The input tokens to be post-processed.
46 |      * @param array|null $tokenPair The input tokens for the second sequence in a pair.
47 |      * @param bool $addSpecialTokens Whether to add the special tokens associated with the corresponding model.
48 |      * @return PostProcessedOutput
49 |      */
50 |     abstract public function postProcess(array $tokens, ?array $tokenPair = null,  bool $addSpecialTokens = true): PostProcessedOutput;
51 | 
52 |     /**
53 |      * Lets a post-processor be called like a function; extra arguments are forwarded to postProcess().
54 |      */
55 |     public function __invoke(array $tokens, ...$args): PostProcessedOutput
56 |     {
57 |         return $this->postProcess($tokens, ...$args);
58 |     }
59 | 
60 | }


--------------------------------------------------------------------------------
/src/PostProcessors/RobertaProcessing.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PostProcessors;
 7 | 
 8 | /** RoBERTa post-processor: extends BertProcessing without changing anything. */
 9 | class RobertaProcessing extends BertProcessing
10 | {
11 | }


--------------------------------------------------------------------------------
/src/PreTokenizers/BertPreTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTokenizers;
 7 | 
 8 | /**
 9 |  * A PreTokenizer that splits text into wordpieces using a basic tokenization scheme
10 |  *  similar to that used in the original implementation of BERT.
11 |  *
12 |  * https://www.analyticsvidhya.com/blog/2021/09/an-explanatory-guide-to-bert-tokenizer/
13 |  */
14 | class BertPreTokenizer extends PreTokenizer
15 | {
16 |     /** Regular expression the text is split on; punctuation is captured so it is kept as its own piece. */
17 |     protected string $pattern;
18 | 
19 |     /**
20 |      * @param array $config Accepted for a uniform constructor signature; not read here.
21 |      */
22 |     public function __construct(array $config)
23 |     {
24 |         // Construct a pattern which matches the rust implementation:
25 |         // https://github.com/huggingface/tokenizers/blob/b4fcc9ce6e4ad5806e82826f816acfdfdc4fcc67/tokenizers/src/pre_tokenizers/bert.rs#L11
26 |         // Equivalent to removing whitespace and splitting on punctuation (both \p{P} and other ascii characters)
27 |         $punctuation = '\p{P}\x{0021}-\x{002F}\x{003A}-\x{0040}\x{005B}-\x{0060}\x{007B}-\x{007E}';
28 |         $this->pattern = "/([{$punctuation}])|\s+/u";
29 |     }
30 | 
31 |     /**
32 |      * Splits the text on whitespace (dropped) and punctuation (kept), omitting empty pieces.
33 |      *
34 |      * @return array The pieces, or an empty array if the split fails.
35 |      */
36 |     protected function preTokenizeText(array|string $text, array $options): array
37 |     {
38 |         $pieces = preg_split($this->pattern, $text, -1, PREG_SPLIT_DELIM_CAPTURE | PREG_SPLIT_NO_EMPTY);
39 | 
40 |         // preg_split() signals failure with false (never null), so `??` cannot catch it.
41 |         return $pieces === false ? [] : $pieces;
42 |     }
43 | }


--------------------------------------------------------------------------------
/src/PreTokenizers/DigitsPreTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTokenizers;
 7 | 
 8 | class DigitsPreTokenizer extends PreTokenizer
 9 | {
10 |     /** Regular expression matching either a run of non-digits or a digit / run of digits. */
11 |     protected string $pattern;
12 | 
13 |     /**
14 |      * @param array $config Reads `individual_digits`: when truthy every digit becomes its own
15 |      *                      piece, otherwise consecutive digits stay together (also the default).
16 |      */
17 |     public function __construct(protected array $config)
18 |     {
19 |         $digitQuantifier = ($this->config['individual_digits'] ?? false) ? '' : '+';
20 | 
21 |         $this->pattern = "/[\D]+|\d{$digitQuantifier}/u";
22 |     }
23 | 
24 |     /**
25 |      * Returns all non-digit runs and digit groups of the text, in order of appearance.
26 |      */
27 |     public function preTokenizeText(string|array $text, array $options): array
28 |     {
29 |         // No flags argument: the previous PREG_SPLIT_NO_EMPTY belongs to preg_split() and only
30 |         // worked because it shares its value with the default PREG_PATTERN_ORDER.
31 |         preg_match_all($this->pattern, $text, $matches);
32 | 
33 |         return $matches[0] ?? [];
34 |     }
35 | }


--------------------------------------------------------------------------------
/src/PreTokenizers/PreTokenizerSequence.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTokenizers;
 7 | 
 8 | /**
 9 |  * A pre-tokenizer that chains several pre-tokenizers together.
10 |  */
11 | class PreTokenizerSequence extends PreTokenizer
12 | {
13 |     /**
14 |      * The pre-tokenizers to apply, in order.
15 |      *
16 |      * @var PreTokenizer[]
17 |      */
18 |     protected array $preTokenizers;
19 | 
20 |     /**
21 |      * @param array $config Must contain a `pretokenizers` list with one config array per step.
22 |      */
23 |     public function __construct(array $config)
24 |     {
25 |         $this->preTokenizers = array_map(
26 |             static fn(array $entry) => PreTokenizer::fromConfig($entry),
27 |             $config['pretokenizers']
28 |         );
29 |     }
30 | 
31 |     /**
32 |      * Starts from the text wrapped in a one-element list and hands the result of each
33 |      * step's preTokenize() call to the next step.
34 |      */
35 |     public function preTokenizeText(string|array $text, array $options): array
36 |     {
37 |         $pieces = [$text];
38 | 
39 |         foreach ($this->preTokenizers as $step) {
40 |             $pieces = $step->preTokenize($pieces, $options);
41 |         }
42 | 
43 |         return $pieces;
44 |     }
45 | }


--------------------------------------------------------------------------------
/src/PreTokenizers/PunctuationPreTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTokenizers;
 7 | 
 8 | /**
 9 |  * A pre-tokenizer that separates runs of punctuation from runs of everything else.
10 |  */
11 | class PunctuationPreTokenizer extends PreTokenizer
12 | {
13 |     /** Regular expression matching either a non-punctuation run or a punctuation run. */
14 |     protected string $pattern;
15 | 
16 |     public function __construct(protected array $config)
17 |     {
18 |         // \p{P} plus the four ASCII symbol ranges, used inside a character class
19 |         $punctuation = '\p{P}\x{0021}-\x{002F}\x{003A}-\x{0040}\x{005B}-\x{0060}\x{007B}-\x{007E}';
20 | 
21 |         $this->pattern = '/[^' . $punctuation . ']+|[' . $punctuation . ']+/u';
22 |     }
23 | 
24 |     /**
25 |      * Returns every run found in the text, in order of appearance.
26 |      */
27 |     public function preTokenizeText(string|array $text, array $options): array
28 |     {
29 |         preg_match_all($this->pattern, $text, $found);
30 | 
31 |         return $found[0];
32 |     }
33 | }


--------------------------------------------------------------------------------
/src/PreTokenizers/ReplacePreTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTokenizers;
 7 | 
 8 | class ReplacePreTokenizer extends PreTokenizer
 9 | {
10 | 
11 |     protected ?string $pattern;
12 |     protected string $content;
13 |     public function __construct(array $config)
14 |     {
15 |         $this->pattern = $config['pattern'] ?? null;
16 |         $this->content = $config['content'];
17 |     }
18 |     public function preTokenizeText(string|array $text, array $options): array
19 |     {
20 |         if($this->pattern === null)
21 |         {
22 |             return [$text];
23 |         }
24 | 
25 |         return str_replace($this->pattern, $this->content, $text);
26 |     }
27 | }


--------------------------------------------------------------------------------
/src/PreTokenizers/SplitPreTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTokenizers;
 7 | 
 8 | use function Codewithkyrian\Transformers\Utils\createPattern;
 9 | 
/**
 * Pre-tokenizer that splits text around matches of a configured pattern.
 */
class SplitPreTokenizer extends PreTokenizer
{
    /** Pattern produced by createPattern(); embedded between `/` delimiters when matching. */
    protected string|array $pattern;

    /**
     * @param array $config Configuration; the `pattern` and `invert` entries are read here.
     */
    public function __construct(protected array $config)
    {
        $this->pattern = createPattern($config['pattern'], $config['invert']);
    }

    /**
     * Tokenizes text by splitting it using the given pattern.
     *
     * With `invert` enabled the matches themselves are returned. Otherwise the text is
     * cut at every match and both the pieces between matches and the non-empty matches
     * are kept, in their original order.
     *
     * @param string|array $text    Text to split.
     * @param array        $options Unused.
     *
     * @return array List of substrings.
     */
    public function preTokenizeText(string|array $text, array $options): array
    {
        $invert = $this->config['invert'];
        $regex = '/' . $this->pattern . '/u';

        if ($invert) {
            preg_match_all($regex, $text, $found);

            return $found[0];
        }

        // Offsets reported by PREG_OFFSET_CAPTURE are byte offsets, so the byte-wise
        // substr()/strlen() below are the matching tools.
        preg_match_all($regex, $text, $found, PREG_OFFSET_CAPTURE);

        $pieces = [];
        $cursor = 0;

        foreach ($found[0] as [$separator, $position]) {
            // Text between the previous match and this one.
            if ($position > $cursor) {
                $pieces[] = substr($text, $cursor, $position - $cursor);
            }

            $separatorLength = strlen($separator);

            // Zero-length matches contribute nothing.
            if ($separatorLength > 0) {
                $pieces[] = $separator;
            }

            $cursor = $position + $separatorLength;
        }

        // Whatever follows the last match.
        if (strlen($text) > $cursor) {
            $pieces[] = substr($text, $cursor);
        }

        return $pieces;
    }
}
57 | 


--------------------------------------------------------------------------------
/src/PreTokenizers/WhitespacePreTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\PreTokenizers;
 6 | 
 7 | /**
 8 |  * Splits on word boundaries (using the following regular expression: `\w+|[^\w\s]+`).
 9 |  */
10 | class WhitespacePreTokenizer extends PreTokenizer
11 | {
12 | 
13 |     protected function preTokenizeText(array|string $text, array $options): array
14 |     {
15 |         preg_match_all('/[\p{N}\p{L}]+|[^\p{Z}\s]+/u', $text, $matches);
16 | 
17 |         return $matches[0] ?? [];
18 |     }
19 | }
20 | 


--------------------------------------------------------------------------------
/src/PreTokenizers/WhitespaceSplit.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTokenizers;
 7 | 
 8 | class WhitespaceSplit extends PreTokenizer
 9 | {
10 | 
11 |     public function __construct(protected array $config)
12 |     {
13 |     }
14 | 
15 |     public function preTokenizeText(string|array $text, array $options): array
16 |     {
17 | //        $words = preg_split('/\s+/', $text, flags: PREG_SPLIT_NO_EMPTY);
18 |         return preg_split('/[\s\x{FFFD}]+/u', $text, flags: PREG_SPLIT_NO_EMPTY);
19 |     }
20 | }


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/AlbertTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | /**
 9 |  * Albert tokenizer
10 |  */
11 | class AlbertTokenizer extends PreTrainedTokenizer
12 | {
13 |     protected bool $returnTokenTypeIds = true;
14 | }
15 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/BartTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class BartTokenizer extends PreTrainedTokenizer
 9 | {
10 | }
11 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/BertTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | /**
 9 |  * BertTokenizer is a class used to tokenize text for BERT models.
10 |  */
11 | class BertTokenizer extends PreTrainedTokenizer
12 | {
13 | }
14 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/BlenderbotSmallTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 6 | 
 7 | class BlenderbotSmallTokenizer extends BlenderbotTokenizer
 8 | {
 9 | 
10 | }
11 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/BlenderbotTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 6 | 
 7 | class BlenderbotTokenizer extends PretrainedTokenizer
 8 | {
 9 |     protected string $defaultChatTemplate = "{% for message in messages %}{% if message['role'] == 'user' %}{{ ' ' }}{% endif %}{{ message['content'] }}{% if not loop.last %}{{ '  ' }}{% endif %}{% endfor %}{{ eos_token }}";
10 | }
11 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/BloomTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class BloomTokenizer extends GPT2Tokenizer
 9 | {
10 |     public function __construct(array $tokenizerJSON, array $tokenizerConfig)
11 |     {
12 | 
13 |         // Override the default (invalid) regex of the pretokenizer.
14 |         // For more information, see https://github.com/xenova/transformers.js/issues/94
15 |         $splitChars = '.,!?\u2026\u3002\uff0c\u3001\u0964\u06d4\u060c';
16 | 
17 |         $patternObject = $tokenizerJSON['pre_tokenizer']['pretokenizers'][0]['pattern'] ?? null;
18 |         if ($patternObject && $patternObject['Regex'] === ' ?[^(\\s|[${splitChars}])]+') {
19 |             $patternObject['Regex'] = " ?[^\\s{$splitChars}]+";
20 |         }
21 | 
22 | 
23 |         parent::__construct($tokenizerJSON, $tokenizerConfig);
24 |     }
25 | }
26 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/CLIPTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class CLIPTokenizer extends PreTrainedTokenizer
 9 | {
10 | 
11 | }
12 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/CamembertTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class CamembertTokenizer extends PreTrainedTokenizer
 9 | {
10 | }
11 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/CodeGenTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class CodeGenTokenizer extends PreTrainedTokenizer
 9 | {
10 | 
11 | }
12 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/CodeLlamaTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class CodeLlamaTokenizer extends LlamaTokenizer
 9 | {
10 | }
11 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/CohereTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 6 | 
 7 | class CohereTokenizer extends PretrainedTokenizer
 8 | {
 9 | 
10 | }
11 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/ConvBertTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class ConvBertTokenizer extends PreTrainedTokenizer
 9 | {
10 |     protected bool $returnTokenTypeIds = true;
11 | }
12 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/DebertaTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class DebertaTokenizer extends PreTrainedTokenizer
 9 | {
10 |     protected bool $returnTokenTypeIds = true;
11 | }
12 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/DebertaV2Tokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class DebertaV2Tokenizer extends PreTrainedTokenizer
 9 | {
10 |     protected bool $returnTokenTypeIds = true;
11 | }
12 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/DistilBertTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class DistilBertTokenizer extends PreTrainedTokenizer
 9 | {
10 | }
11 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/ElectraTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class ElectraTokenizer extends PreTrainedTokenizer
 9 | {
10 |     protected bool $returnTokenTypeIds = true;
11 | }
12 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/EsmTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class EsmTokenizer extends PreTrainedTokenizer
 9 | {
10 | }
11 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/FalconTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class FalconTokenizer extends PreTrainedTokenizer
 9 | {
10 | }
11 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/GPT2Tokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class GPT2Tokenizer extends PreTrainedTokenizer
 9 | {
10 |      protected string $defaultChatTemplate =  '{% for message in messages %}" "{{ message.content }}{{ eos_token }}" "{% endfor %}';
11 | }
12 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/GPTNeoXTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class GPTNeoXTokenizer extends PreTrainedTokenizer
 9 | {
10 | }
11 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/GemmaTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 6 | 
 7 | class GemmaTokenizer extends PretrainedTokenizer
 8 | {
 9 |     protected string $defaultChatTemplate = "{% if messages[0]['role'] == 'system' %}{{ raise_exception('System role not supported') }}{% endif %}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if (message['role'] == 'assistant') %}{% set role = 'model' %}{% else %}{% set role = message['role'] %}{% endif %}{{ '<start_of_turn>' + role + '\n' + message['content'] | trim + '<end_of_turn>\n' }}{% endfor %}{% if add_generation_prompt %}{{'<start_of_turn>model\n'}}{% endif %}";
10 | }
11 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/Grok1Tokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 6 | 
 7 | class Grok1Tokenizer extends PretrainedTokenizer
 8 | {
 9 | }
10 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/HerbertTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class HerbertTokenizer extends PreTrainedTokenizer
 9 | {
10 |     protected bool $returnTokenTypeIds = true;
11 | }
12 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/MBart50Tokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class MBart50Tokenizer extends MBartTokenizer
 9 | {
10 | }
11 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/MPNetTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class MPNetTokenizer extends PreTrainedTokenizer
 9 | {
10 | }
11 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/MobileBertTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class MobileBertTokenizer extends PreTrainedTokenizer
 9 | {
10 |     protected bool $returnTokenTypeIds = true;
11 | }
12 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/NougatTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 6 | 
 7 | class NougatTokenizer extends PretrainedTokenizer
 8 | {
 9 | 
10 | }
11 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/Qwen2Tokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class Qwen2Tokenizer extends PreTrainedTokenizer
 9 | {
10 | 
11 | }
12 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/RoFormerTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class RoFormerTokenizer extends PreTrainedTokenizer
 9 | {
10 |     protected bool $returnTokenTypeIds = true;
11 | }
12 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/RobertaTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class RobertaTokenizer extends PreTrainedTokenizer
 9 | {
10 | }
11 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/SiglipTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 6 | 
 7 | class SiglipTokenizer extends PretrainedTokenizer
 8 | {
 9 | 
10 | }
11 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/SpeechT5Tokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 6 | 
 7 | class SpeechT5Tokenizer extends PretrainedTokenizer
 8 | {
 9 | 
10 | }
11 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/SqueezeBertTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class SqueezeBertTokenizer extends PreTrainedTokenizer
 9 | {
10 |     protected bool $returnTokenTypeIds = true;
11 | }
12 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/T5Tokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class T5Tokenizer extends PreTrainedTokenizer
 9 | {
10 | }
11 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/VitsTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 6 | 
 7 | use Codewithkyrian\Transformers\Decoders\VitsDecoder;
 8 | 
 9 | class VitsTokenizer extends PretrainedTokenizer
10 | {
11 |     public function __construct(array $tokenizerJSON, ?array $tokenizerConfig)
12 |     {
13 |         parent::__construct($tokenizerJSON, $tokenizerConfig);
14 | 
15 |         // Custom decoder function
16 |         $this->decoder = new VitsDecoder([]);
17 |     }
18 | }
19 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/Wav2Vec2CTCTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class Wav2Vec2CTCTokenizer extends PreTrainedTokenizer
 9 | {
10 | 
11 | }
12 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/XLMRobertaTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class XLMRobertaTokenizer extends PreTrainedTokenizer
 9 | {
10 | }
11 | 


--------------------------------------------------------------------------------
/src/PreTrainedTokenizers/XLMTokenizer.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\PreTrainedTokenizers;
 7 | 
 8 | class XLMTokenizer extends PreTrainedTokenizer
 9 | {
10 |     protected bool $returnTokenTypeIds = true;
11 | 
12 |     public function __construct(array $tokenizerJSON, array $tokenizerConfig)
13 |     {
14 |         parent::__construct($tokenizerJSON, $tokenizerConfig);
15 | 
16 |         trigger_error("WARNING: `XLMTokenizer` is not yet supported by Hugging Face\'s `fast` tokenizers library. Therefore, you may experience slightly inaccurate results.");
17 |     }
18 | }
19 | 


--------------------------------------------------------------------------------
/src/Processors/OwlViTProcessor.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Processors;
 7 | 
 8 | class OwlViTProcessor extends Processor
 9 | {
10 | 
11 | }


--------------------------------------------------------------------------------
/src/Processors/Wav2Vec2ProcessorWithLM.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Processors;
 7 | 
 8 | class Wav2Vec2ProcessorWithLM extends Processor
 9 | {
10 | 
11 | }


--------------------------------------------------------------------------------
/src/Processors/WhisperProcessor.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Processors;
 7 | 
 8 | class WhisperProcessor  extends Processor
 9 | {
10 | 
11 | }


--------------------------------------------------------------------------------
/src/Tensor/MatrixOperator.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Tensor;
 7 | 
 8 | use Interop\Polite\Math\Matrix\NDArray;
 9 | use Rindow\Math\Matrix\NDArrayPhp;
10 | 
/**
 * Matrix operator whose allocations produce Tensor instances.
 */
class MatrixOperator extends \Rindow\Math\Matrix\MatrixOperator
{
    /**
     * Allocates a new Tensor for the given data.
     *
     * @param mixed      $array Initial data handed to the Tensor constructor.
     * @param int|null   $dtype Element type; falls back to `$this->defaultFloatType` when null.
     * @param array|null $shape Shape handed to the Tensor constructor.
     *
     * @return NDArray The newly created Tensor.
     */
    // Nullable types are spelled out: relying on a `= null` default to make a
    // parameter nullable is deprecated as of PHP 8.4. The accepted types are unchanged.
    protected function alloc(mixed $array, ?int $dtype = null, ?array $shape = null): NDArray
    {
        $dtype ??= $this->defaultFloatType;

        return new Tensor($array, $dtype, $shape);
    }
}


--------------------------------------------------------------------------------
/src/Tensor/OpenBLASFactory.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Tensor;
 7 | 
 8 | use FFI;
 9 | use FFI\Exception as FFIException;
10 | use Rindow\Math\Matrix\Drivers\MatlibPHP\PhpLapack;
11 | use Rindow\OpenBLAS\FFI\Blas;
12 | use RuntimeException;
13 | 
/**
 * Loads the OpenBLAS shared library through FFI and creates BLAS / LAPACK drivers.
 *
 * The FFI handle is kept in a static property, so once one factory has loaded
 * the library, later instances reuse it and skip loading.
 */
class OpenBLASFactory
{
    /** Shared FFI handle; null until a library has been loaded successfully. */
    private static ?FFI $ffi = null;

    /**
     * Tries to load the library. Every failure (FFI extension missing, header
     * unreadable, no candidate library loadable) leaves the factory unavailable
     * instead of throwing; callers check {@see isAvailable()}.
     *
     * @param string        $headerFile Path to the C header with the declarations passed to FFI::cdef().
     * @param array<string> $libFiles   Candidate shared-library paths, tried in order until one loads.
     */
    public function __construct(
        string $headerFile,
        array  $libFiles,
    )
    {
        if (self::$ffi !== null) {
            return;
        }
        if (!extension_loaded('ffi')) {
            return;
        }

        $code = file_get_contents($headerFile);
        if ($code === false) {
            // Without the declarations nothing can be bound. Passing `false` on to
            // FFI::cdef() would raise a TypeError that the catch below does not cover.
            return;
        }

        foreach ($libFiles as $filename) {
            try {
                self::$ffi = FFI::cdef($code, $filename);
                break;
            } catch (FFIException) {
                // This candidate could not be loaded; try the next one.
                continue;
            }
        }
    }

    /**
     * @return bool True when a library has been loaded and {@see Blas()} can be used.
     */
    public function isAvailable(): bool
    {
        return self::$ffi !== null;
    }

    /**
     * @return Blas BLAS driver bound to the loaded library.
     *
     * @throws RuntimeException When no library has been loaded.
     */
    public function Blas(): Blas
    {
        if (self::$ffi === null) {
            throw new RuntimeException('openblas library not loaded.');
        }
        return new Blas(self::$ffi);
    }

    /**
     * @return PhpLapack A PhpLapack instance; it is created without the FFI handle.
     */
    public function Lapack(): PhpLapack
    {
        return new PhpLapack();
    }
}


--------------------------------------------------------------------------------
/src/Tensor/TensorBufferFactory.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | namespace Codewithkyrian\Transformers\Tensor;
 4 | 
 5 | use FFI;
 6 | 
 7 | class TensorBufferFactory
 8 | {
 9 |     public function isAvailable() : bool
10 |     {
11 |         return class_exists(FFI::class);
12 |     }
13 | 
14 |     public function Buffer(int $size, int $dtype) : TensorBuffer
15 |     {
16 |         return new TensorBuffer($size, $dtype);
17 |     }
18 | }


--------------------------------------------------------------------------------
/src/Tensor/TensorService.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | namespace Codewithkyrian\Transformers\Tensor;
 6 | 
 7 | use Codewithkyrian\TransformersLibsLoader\Library;
 8 | use Rindow\Math\Matrix\Drivers\AbstractMatlibService;
 9 | use Rindow\Matlib\FFI\MatlibFactory;
10 | use function Codewithkyrian\Transformers\Utils\basePath;
11 | 
/**
 * Matlib service that plugs in this package's buffer, OpenBLAS and math factories.
 */
class TensorService extends AbstractMatlibService
{
    /**
     * Installs the default factories: a TensorBufferFactory, an OpenBLASFactory
     * pointed at the OpenBLAS header and library, and a MatlibFactory pointed at
     * the Rindow Matlib library. Paths are resolved through basePath().
     */
    protected function injectDefaultFactories(): void
    {
        $this->bufferFactory = new TensorBufferFactory();

        $openBlasHeader = Library::OpenBlas->header(basePath('includes'));
        $openBlasLibrary = Library::OpenBlas->library(basePath('libs'));
        $this->openblasFactory = new OpenBLASFactory(
            headerFile: $openBlasHeader,
            libFiles: [$openBlasLibrary],
        );

        $matlibLibrary = Library::RindowMatlib->library(basePath('libs'));
        $this->mathFactory = new MatlibFactory(libFiles: [$matlibLibrary]);
    }
}


--------------------------------------------------------------------------------
/src/Tokenizers/AddedToken.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Tokenizers;
 7 | 
 8 | /**
 9 |  * Represent a token added by the user on top of the existing Model vocabulary.
10 |  * AddedToken can be configured to specify the behavior they should have in various situations like:
11 |  *   - Whether they should only match single words
12 |  *   - Whether to include any whitespace on its left or right
13 |  */
14 | class AddedToken
15 | {
16 |     public function __construct(
17 |         /**
18 |          * The content of the added token.
19 |          */
20 |         public readonly string $content,
21 |         /**
22 |          * The unique ID associated to this token.
23 |          */
24 |         public readonly int $id,
25 |         /**
26 |          * Whether this token must be a single word or can break words.
27 |          */
28 |         public readonly bool $singleWord = true,
29 |         /**
30 |          * Whether this token should strip whitespaces on its left.
31 |          */
32 |         public readonly bool $lStrip = false,
33 |         /**
34 |          * Whether this token should strip whitespaces on its right.
35 |          */
36 |         public readonly bool $rStrip = false,
37 |         /**
38 |          * Whether this token should be normalized.
39 |          */
40 |         public readonly bool $normalized = true,
41 |         /**
42 |          * Whether this token is a special token.
43 |          */
44 |         public readonly bool $special = false,
45 |     )
46 |     {
47 |     }
48 | 
49 |     public static function make(array $config): self
50 |     {
51 |         return new self(
52 |             $config['content'],
53 |             $config['id'],
54 |             $config['single_word'] ?? true,
55 |             $config['lstrip'] ?? false,
56 |             $config['rstrip'] ?? false,
57 |             $config['normalized'] ?? true,
58 |             $config['special'] ?? false,
59 |         );
60 |     }
61 | }


--------------------------------------------------------------------------------
/src/Tokenizers/BPENode.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Tokenizers;
 7 | 
 8 | class BPENode
 9 | {
10 |     public float $score = 0.0;
11 | 
12 |     public bool $deleted = false;
13 | 
14 |     public function __construct(
15 |         public string $token,
16 |         public float  $bias,
17 |         public ?BPENode $prev = null,
18 |         public ?BPENode $next = null,
19 |     )
20 |     {
21 |     }
22 | }


--------------------------------------------------------------------------------
/src/Utils/ImageDriver.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Utils;
 7 | 
 8 | enum ImageDriver // Pure (non-backed) enum naming the selectable image drivers.
 9 | {
10 |     case IMAGICK; // presumably the Imagick extension — confirm against the code that consumes this enum
11 |     case GD; // presumably PHP's GD extension — confirm
12 |     case VIPS; // presumably libvips — confirm
13 | }
14 | 


--------------------------------------------------------------------------------
/src/Utils/Resample.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | 
 6 | namespace Codewithkyrian\Transformers\Utils;
 7 | 
 8 | // Defined here: https://github.com/python-pillow/Pillow/blob/a405e8406b83f8bfb8916e93971edc7407b8b1ff/src/libImaging/Imaging.h#L262-L268
 9 | /**
10 |  * Resampling filters, each backed by an integer code from 0 to 5.
11 |  */
12 | enum Resample: int
13 | {
14 |     case NEAREST = 0;
15 |     case LANCZOS = 1;
16 |     case BILINEAR = 2;
17 |     case BICUBIC = 3;
18 |     case BOX = 4;
19 |     case HAMMING = 5;
20 | 
21 |     /**
22 |      * Returns the lowercase filter name associated with this case.
23 |      *
24 |      * NOTE(review): NEAREST yields 'undefined' and BILINEAR yields 'point', which are not the
25 |      * algorithms' own names — presumably they target the filter names of the image library
26 |      * that consumes this string; confirm before changing the mapping.
27 |      */
28 |     public function toString(): string
29 |     {
30 |         $filterName = match ($this) {
31 |             self::BOX => 'box',
32 |             self::HAMMING => 'hamming',
33 |             self::LANCZOS => 'lanczos',
34 |             self::BICUBIC => 'cubic',
35 |             self::NEAREST => 'undefined',
36 |             self::BILINEAR => 'point',
37 |         };
38 | 
39 |         return $filterName;
40 |     }
41 | }


--------------------------------------------------------------------------------
/tests/Expectations.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | use Pest\Exceptions\InvalidExpectation;
 4 | use Pest\Exceptions\InvalidExpectationValue;
 5 | 
 6 | /**
 7 |  * Registers `toMatchArrayApproximately`: the value under test must be an array with the same
 8 |  * number of entries and the same keys as $expected. Numeric actual values are compared with
 9 |  * `toEqualWithDelta` using $precision; every other value is compared with `toEqual`.
10 |  *
11 |  * Failure messages are built through $describe so that arrays and non-stringable objects are
12 |  * shown by type; interpolating them directly would raise an "Array to string conversion"
13 |  * warning or a conversion Error before the real assertion could report the mismatch.
14 |  */
15 | expect()->extend('toMatchArrayApproximately', function (array $expected, float $precision = 0.0001) {
16 |     $actual = $this->value;
17 | 
18 |     // Scalars, null and Stringable objects render exactly as string interpolation would.
19 |     $describe = static fn (mixed $value): string => match (true) {
20 |         is_scalar($value), $value === null, $value instanceof Stringable => (string) $value,
21 |         default => get_debug_type($value),
22 |     };
23 | 
24 |     expect($actual)
25 |         ->toBeArray()
26 |         ->and(count($actual))
27 |         ->toBe(count($expected))
28 |         ->and($actual)
29 |         ->toHaveKeys(array_keys($expected));
30 | 
31 |     foreach ($expected as $key => $expectedValue) {
32 |         $actualValue = $actual[$key];
33 |         $message = sprintf(
34 |             'Failed asserting that %s at key %s ≈ %s',
35 |             $describe($actualValue),
36 |             $key,
37 |             $describe($expectedValue),
38 |         );
39 | 
40 |         if (is_numeric($actualValue)) {
41 |             expect($actualValue)->toEqualWithDelta($expectedValue, $precision, "$message (±$precision)");
42 |         } else {
43 |             expect($actualValue)->toEqual($expectedValue, $message);
44 |         }
45 |     }
46 | 
47 |     return $this;
48 | });
49 | 


--------------------------------------------------------------------------------
/tests/Pest.php:
--------------------------------------------------------------------------------
1 | <?php
2 | 


--------------------------------------------------------------------------------
/tests/PipelineTest.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | use Codewithkyrian\Transformers\Exceptions\UnsupportedTaskException;
 6 | use Codewithkyrian\Transformers\Pipelines\FeatureExtractionPipeline;
 7 | use Codewithkyrian\Transformers\Transformers;
 8 | use function Codewithkyrian\Transformers\Pipelines\pipeline;
 9 | 
10 | // Configure the library once for this file, using 'tests/models' as the cache directory.
11 | beforeAll(function (): void {
12 |     $settings = Transformers::setup();
13 |     $settings->setCacheDir('tests/models')->apply();
14 | });
15 | 
16 | // Only the task name is given.
17 | it('can create a pipeline for a task', function (): void {
18 |     expect(pipeline('feature-extraction'))
19 |         ->toBeInstanceOf(FeatureExtractionPipeline::class);
20 | });
21 | 
22 | // Task name plus an explicit model identifier.
23 | it('can create a pipeline for a task with a model', function (): void {
24 |     expect(pipeline('feature-extraction', 'Xenova/all-MiniLM-L6-v2'))
25 |         ->toBeInstanceOf(FeatureExtractionPipeline::class);
26 | });
27 | 
28 | // An unrecognised task name must raise UnsupportedTaskException.
29 | it('throws an exception when creating a pipeline for an unsupported task', function (): void {
30 |     pipeline('unsupported-task');
31 | })->throws(UnsupportedTaskException::class);


--------------------------------------------------------------------------------
/tests/tensors/TensorBufferTest.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | declare(strict_types=1);
 4 | 
 5 | use Codewithkyrian\Transformers\Tensor\Tensor;
 6 | use Codewithkyrian\Transformers\Tensor\TensorBuffer;
 7 | 
 8 | // Every test runs against a fresh float32 buffer constructed with size 5.
 9 | beforeEach(function (): void {
10 |     $this->tensorBuffer = new TensorBuffer(5, Tensor::float32);
11 | });
12 | 
13 | // A string offset must be rejected with a TypeError.
14 | it(
15 |     'throws an exception when accessing offset with invalid type',
16 |     fn () => $this->tensorBuffer['offset'],
17 | )->throws(TypeError::class);
18 | 
19 | it('can create a zero-sized buffer', function (): void {
20 |     expect((new TensorBuffer(0, Tensor::float32))->count())->toBe(0);
21 | });
22 | 
23 | it('gets the correct value at the given offset using square brackets', function (): void {
24 |     // Offsets 0 and 4 of the untouched buffer must both read as 0.0.
25 |     expect($this->tensorBuffer[0])->toBe(0.0);
26 |     expect($this->tensorBuffer[4])->toBe(0.0);
27 | });
28 | 
29 | it('sets the value at the given offset using square brackets', function (): void {
30 |     $writes = [0 => 1.5, 4 => 2.5];
31 | 
32 |     // Perform every write first, then read everything back, so later writes cannot mask earlier ones.
33 |     foreach ($writes as $offset => $value) {
34 |         $this->tensorBuffer[$offset] = $value;
35 |     }
36 | 
37 |     foreach ($writes as $offset => $value) {
38 |         expect($this->tensorBuffer[$offset])->toBe($value);
39 |     }
40 | });
41 | 
42 | // Offset 5 on the size-5 buffer must raise OutOfRangeException.
43 | it(
44 |     'throws an exception when accessing out-of-range offset',
45 |     fn () => $this->tensorBuffer[5],
46 | )->throws(OutOfRangeException::class);
47 | 
48 | it('throws an exception when unsetting offset using square brackets', function (): void {
49 |     unset($this->tensorBuffer[0]);
50 | })->throws(LogicException::class);
51 | 


--------------------------------------------------------------------------------
/tests/tokenizers/Datasets.php:
--------------------------------------------------------------------------------
 1 | <?php
 2 | 
 3 | /**
 4 |  * Reads a JSON fixture stored next to this file and decodes it into an associative array.
 5 |  *
 6 |  * Fails loudly on purpose: with a plain `json_decode(file_get_contents(...), true)` an
 7 |  * unreadable or malformed fixture decodes to null, the dataset yields nothing, and every
 8 |  * test that depends on it silently disappears instead of failing.
 9 |  *
10 |  * @throws RuntimeException when the file cannot be read or does not decode to an array
11 |  * @throws JsonException    when the file is not valid JSON
12 |  */
13 | $loadFixture = static function (string $fileName): array {
14 |     $path = __DIR__.'/'.$fileName;
15 |     $json = is_readable($path) ? file_get_contents($path) : false;
16 | 
17 |     if ($json === false) {
18 |         throw new RuntimeException("Unable to read tokenizer fixture: $path");
19 |     }
20 | 
21 |     $decoded = json_decode($json, true, flags: JSON_THROW_ON_ERROR);
22 | 
23 |     if (!is_array($decoded)) {
24 |         throw new RuntimeException("Tokenizer fixture must decode to an array: $path");
25 |     }
26 | 
27 |     return $decoded;
28 | };
29 | 
30 | // One lazily-built case per fixture entry, labelled "<tokenizerId>: <input>"; non-string
31 | // inputs are JSON-encoded for the label.
32 | dataset('regular-tokenization', function () use ($loadFixture) {
33 |     foreach ($loadFixture('dataset-regular.json') as $tokenizerId => $tests) {
34 |         foreach ($tests as $test) {
35 |             $label = is_string($test['input']) ? $test['input'] : json_encode($test['input']);
36 |             yield "$tokenizerId: $label" => fn () => [
37 |                 'tokenizerId' => $tokenizerId,
38 |                 'test' => $test,
39 |             ];
40 |         }
41 |     }
42 | });
43 | 
44 | // One lazily-built case per fixture entry, labelled with the tokenizer id plus the JSON of its
45 | // `add_generation_prompt` / `tokenize` entries.
46 | // NOTE(review): two entries of one tokenizer with identical flags would share a label —
47 | // confirm the fixture never contains such duplicates.
48 | dataset('template-tokenization', function () use ($loadFixture) {
49 |     // Loop-invariant lookup of the keys that are shown in the label.
50 |     $printableKeys = array_flip(['add_generation_prompt', 'tokenize']);
51 | 
52 |     foreach ($loadFixture('dataset-templates.json') as $tokenizerId => $tests) {
53 |         foreach ($tests as $test) {
54 |             $label = json_encode(array_intersect_key($test, $printableKeys));
55 |             yield "$tokenizerId: $label" => fn () => [
56 |                 'tokenizerId' => $tokenizerId,
57 |                 'test' => $test,
58 |             ];
59 |         }
60 |     }
61 | });
62 | 


--------------------------------------------------------------------------------