├── .github └── workflows │ ├── doc-build.yml │ ├── doc-pr-build.yml │ ├── doc-pr-upload.yml │ └── trufflehog.yml ├── .gitignore ├── LICENSE ├── Makefile ├── README.md ├── containers ├── README.md ├── container.yaml ├── pytorch │ ├── inference │ │ ├── README.md │ │ ├── cpu │ │ │ ├── 2.2.2 │ │ │ │ └── transformers │ │ │ │ │ ├── 4.41.1 │ │ │ │ │ └── py311 │ │ │ │ │ │ ├── Dockerfile │ │ │ │ │ │ └── entrypoint.sh │ │ │ │ │ └── 4.44.0 │ │ │ │ │ └── py311 │ │ │ │ │ ├── Dockerfile │ │ │ │ │ └── entrypoint.sh │ │ │ └── 2.3.1 │ │ │ │ └── transformers │ │ │ │ ├── 4.46.1 │ │ │ │ └── py311 │ │ │ │ │ ├── Dockerfile │ │ │ │ │ └── entrypoint.sh │ │ │ │ └── 4.48.0 │ │ │ │ └── py311 │ │ │ │ ├── Dockerfile │ │ │ │ └── entrypoint.sh │ │ └── gpu │ │ │ ├── 2.2.2 │ │ │ └── transformers │ │ │ │ ├── 4.41.1 │ │ │ │ └── py311 │ │ │ │ │ ├── Dockerfile │ │ │ │ │ └── entrypoint.sh │ │ │ │ └── 4.44.0 │ │ │ │ └── py311 │ │ │ │ ├── Dockerfile │ │ │ │ └── entrypoint.sh │ │ │ └── 2.3.1 │ │ │ └── transformers │ │ │ ├── 4.46.1 │ │ │ └── py311 │ │ │ │ ├── Dockerfile │ │ │ │ └── entrypoint.sh │ │ │ └── 4.48.0 │ │ │ └── py311 │ │ │ ├── Dockerfile │ │ │ └── entrypoint.sh │ └── training │ │ ├── README.md │ │ ├── gpu │ │ ├── 2.3.0 │ │ │ └── transformers │ │ │ │ ├── 4.41.1 │ │ │ │ └── py310 │ │ │ │ │ └── Dockerfile │ │ │ │ └── 4.42.3 │ │ │ │ └── py310 │ │ │ │ └── Dockerfile │ │ └── 2.3.1 │ │ │ └── transformers │ │ │ └── 4.48.0 │ │ │ └── py311 │ │ │ └── Dockerfile │ │ └── tpu │ │ ├── 2.4.0 │ │ └── transformers │ │ │ └── 4.41.1 │ │ │ └── py310 │ │ │ └── Dockerfile │ │ └── 2.5.1 │ │ └── transformers │ │ └── 4.46.3 │ │ └── py310 │ │ └── Dockerfile ├── tei │ ├── README.md │ ├── cpu │ │ ├── 1.2.2 │ │ │ └── Dockerfile │ │ ├── 1.4.0 │ │ │ ├── Dockerfile │ │ │ └── entrypoint.sh │ │ ├── 1.5.1 │ │ │ ├── Dockerfile │ │ │ └── entrypoint.sh │ │ └── 1.6.0 │ │ │ ├── Dockerfile │ │ │ └── entrypoint.sh │ └── gpu │ │ ├── 1.2.2 │ │ └── Dockerfile │ │ ├── 1.4.0 │ │ ├── Dockerfile │ │ └── entrypoint.sh │ │ ├── 1.5.1 │ │ ├── Dockerfile │ │ └── entrypoint.sh │ │ └── 1.6.0 │ │ ├── Dockerfile │ │ └── entrypoint.sh └── tgi │ ├── README.md │ ├── gpu │ ├── 1.4.2 │ │ └── Dockerfile │ ├── 1.4.4 │ │ └── Dockerfile │ ├── 2.0.0 │ │ ├── Dockerfile │ │ └── entrypoint.sh │ ├── 2.0.1 │ │ └── Dockerfile │ ├── 2.0.3 │ │ ├── Dockerfile │ │ └── entrypoint.sh │ ├── 2.1.0 │ │ ├── Dockerfile │ │ └── entrypoint.sh │ ├── 2.1.1 │ │ ├── Dockerfile │ │ └── entrypoint.sh │ ├── 2.2.0 │ │ ├── Dockerfile │ │ └── entrypoint.sh │ ├── 2.3.1 │ │ ├── Dockerfile │ │ └── entrypoint.sh │ ├── 2.4.0 │ │ ├── Dockerfile │ │ └── entrypoint.sh │ └── 3.0.1 │ │ ├── Dockerfile │ │ └── entrypoint.sh │ └── tpu │ ├── 0.1.4 │ ├── Dockerfile │ └── entrypoint.sh │ ├── 0.2.2 │ ├── Dockerfile │ └── entrypoint.sh │ └── 0.2.3 │ ├── Dockerfile │ └── entrypoint.sh ├── docs ├── scripts │ ├── auto-generate-examples.py │ └── auto-update-toctree.py └── source │ ├── _redirects.yml │ ├── _toctree.yml │ ├── containers │ ├── available.mdx │ └── introduction.mdx │ ├── features.mdx │ ├── index.mdx │ ├── resources.mdx │ └── tpu.mdx ├── examples ├── README.md ├── cloud-run │ ├── README.md │ ├── deploy-gemma-2-on-cloud-run │ │ ├── README.md │ │ └── imgs │ │ │ ├── cloud-run-deployment.png │ │ │ └── cloud-run-details.png │ └── deploy-llama-3-1-on-cloud-run │ │ ├── README.md │ │ └── imgs │ │ ├── cloud-run-deployment.png │ │ └── cloud-run-details.png ├── gke │ ├── README.md │ ├── tei-deployment │ │ ├── README.md │ │ ├── cpu-config │ │ │ ├── deployment.yaml │ │ │ ├── ingress.yaml │ │ │ └── service.yaml │ │ ├── gpu-config │ │ │ ├── deployment.yaml │ │ │ ├── ingress.yaml │ │ │ └── service.yaml │ │ └── imgs │ │ │ ├── gke-cluster.png │ │ │ └── gke-deployment.png │ ├── tei-from-gcs-deployment │ │ ├── README.md │ │ ├── cpu-config │ │ │ ├── deployment.yaml │ │ │ ├── ingress.yaml │ │ │ ├── service.yaml │ │ │ └── storageclass.yaml │ │ ├── gpu-config │ │ │ ├── deployment.yaml │ │ │ ├── ingress.yaml │ │ │ ├── service.yaml │ │ │ └── storageclass.yaml │ │ └── imgs │ │ │ ├── gcs-bucket.png │ │ │ ├── gke-cluster.png │ │ │ └── gke-deployment.png │ ├── tgi-deployment │ │ ├── README.md │ │ ├── config │ │ │ ├── deployment.yaml │ │ │ ├── ingress.yaml │ │ │ └── service.yaml │ │ └── imgs │ │ │ ├── gke-cluster.png │ │ │ ├── gke-deployment.png │ │ │ └── gke-secrets.png │ ├── tgi-from-gcs-deployment │ │ ├── README.md │ │ ├── config │ │ │ ├── deployment.yaml │ │ │ ├── ingress.yaml │ │ │ ├── service.yaml │ │ │ └── storageclass.yaml │ │ └── imgs │ │ │ ├── gcs-bucket.png │ │ │ ├── gke-cluster.png │ │ │ └── gke-deployment.png │ ├── tgi-llama-405b-deployment │ │ ├── README.md │ │ ├── config │ │ │ ├── deployment.yaml │ │ │ ├── ingress.yaml │ │ │ └── service.yaml │ │ └── imgs │ │ │ ├── gke-cluster.png │ │ │ ├── gke-deployment-logs.png │ │ │ └── gke-deployment.png │ ├── tgi-llama-vision-deployment │ │ ├── README.md │ │ ├── config │ │ │ ├── deployment.yaml │ │ │ ├── ingress.yaml │ │ │ └── service.yaml │ │ └── imgs │ │ │ ├── gke-cluster.png │ │ │ ├── gke-deployment-logs.png │ │ │ ├── gke-deployment.png │ │ │ └── gke-secrets.png │ ├── tgi-multi-lora-deployment │ │ ├── README.md │ │ ├── config │ │ │ ├── deployment.yaml │ │ │ ├── ingress.yaml │ │ │ └── service.yaml │ │ └── imgs │ │ │ ├── gke-cluster.png │ │ │ ├── gke-deployment-logs.png │ │ │ ├── gke-deployment.png │ │ │ └── gke-secrets.png │ ├── trl-full-fine-tuning │ │ ├── README.md │ │ ├── imgs │ │ │ ├── can-it-run-llm.png │ │ │ ├── gcs-bucket.png │ │ │ ├── gke-cluster.png │ │ │ ├── gke-job-completed.png │ │ │ ├── gke-job-created.png │ │ │ ├── gke-job-logs.png │ │ │ └── gke-job-running.png │ │ └── job.yaml │ └── trl-lora-fine-tuning │ │ ├── README.md │ │ ├── imgs │ │ ├── can-it-run-llm.png │ │ ├── gcs-bucket.png │ │ ├── gke-cluster.png │ │ ├── gke-job-completed.png │ │ ├── gke-job-created.png │ │ ├── gke-job-logs.png │ │ └── gke-job-running.png │ │ └── job.yaml └── vertex-ai │ ├── README.md │ └── notebooks │ ├── deploy-bert-on-vertex-ai │ ├── assets │ │ ├── model-in-hf-hub.png │ │ ├── vertex-ai-endpoint-ready.png │ │ ├── vertex-ai-endpoint.png │ │ ├── vertex-ai-model-ready.png │ │ ├── vertex-ai-model-version.png │ │ └── vertex-ai-model.png │ └── vertex-notebook.ipynb │ ├── deploy-embedding-on-vertex-ai │ ├── assets │ │ ├── model-in-hf-hub.png │ │ ├── vertex-ai-endpoint-logs-predict.png │ │ ├── vertex-ai-endpoint-logs.png │ │ ├── vertex-ai-endpoint-run.png │ │ ├── vertex-ai-endpoint.png │ │ └── vertex-ai-model.png │ └── vertex-notebook.ipynb │ ├── deploy-flux-on-vertex-ai │ ├── assets │ │ ├── flux-dev-output.png │ │ ├── model-in-hf-hub.png │ │ ├── vertex-ai-endpoint-ready.png │ │ ├── vertex-ai-endpoint.png │ │ ├── vertex-ai-model-ready.png │ │ ├── vertex-ai-model-version.png │ │ └── vertex-ai-model.png │ └── vertex-notebook.ipynb │ ├── deploy-gemma-from-gcs-on-vertex-ai │ ├── assets │ │ ├── gcs-model-artifact.png │ │ ├── model-in-hf-hub.png │ │ ├── vertex-ai-endpoint-logs.png │ │ ├── vertex-ai-endpoint-run.png │ │ ├── vertex-ai-endpoint.png │ │ ├── vertex-ai-model-path.png │ │ ├── vertex-ai-model.png │ │ └── vertex-ai-online-prediction.png │ └── vertex-notebook.ipynb │ ├── deploy-gemma-on-vertex-ai │ ├── assets │ │ ├── model-in-hf-hub.png │ │ ├── vertex-ai-endpoint-logs-predict.png │ │ ├── vertex-ai-endpoint-logs.png │ │ ├── vertex-ai-endpoint-run.png │ │ ├── vertex-ai-endpoint.png │ │ ├── vertex-ai-model.png │ │ └── vertex-ai-online-prediction.png │ └── vertex-notebook.ipynb │ ├── deploy-llama-3-1-405b-on-vertex-ai │ ├── assets │ │ ├── a3-general-availability.png │ │ ├── a3-quota-request.png │ │ ├── model-in-hf-hub.png │ │ ├── vertex-ai-endpoint.png │ │ ├── vertex-ai-model.png │ │ └── vertex-ai-online-prediction.png │ └── vertex-notebook.ipynb │ ├── deploy-llama-vision-on-vertex-ai │ ├── assets │ │ ├── model-in-hf-hub.png │ │ ├── vertex-ai-endpoint-run.png │ │ ├── vertex-ai-endpoint.png │ │ ├── vertex-ai-model.png │ │ └── vertex-ai-online-prediction.png │ └── vertex-notebook.ipynb │ ├── evaluate-llms-with-vertex-ai │ ├── assets │ │ └── experiment-results.png │ └── vertex-notebook.ipynb │ ├── trl-full-sft-fine-tuning-on-vertex-ai │ ├── assets │ │ ├── can-it-run-llm.png │ │ ├── gcs-bucket-artifacts.png │ │ ├── vertex-ai-pipeline-completed.png │ │ ├── vertex-ai-pipeline-logs.png │ │ ├── vertex-ai-pipeline-scheduled.png │ │ └── vertex-ai-run.png │ └── vertex-notebook.ipynb │ └── trl-lora-sft-fine-tuning-on-vertex-ai │ ├── assets │ ├── can-it-run-llm.png │ ├── gcs-bucket-artifacts.png │ ├── vertex-ai-pipeline-completed.png │ ├── vertex-ai-pipeline-logs.png │ └── vertex-ai-pipeline-scheduled.png │ └── vertex-notebook.ipynb └── scripts ├── README.md ├── internal └── update_example_tables.py ├── push_image_to_gcr.sh └── upload_model_to_gcs.sh /.github/workflows/doc-build.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/.github/workflows/doc-build.yml -------------------------------------------------------------------------------- /.github/workflows/doc-pr-build.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/.github/workflows/doc-pr-build.yml -------------------------------------------------------------------------------- /.github/workflows/doc-pr-upload.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/.github/workflows/doc-pr-upload.yml -------------------------------------------------------------------------------- /.github/workflows/trufflehog.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/.github/workflows/trufflehog.yml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/LICENSE -------------------------------------------------------------------------------- /Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/Makefile -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/README.md -------------------------------------------------------------------------------- /containers/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/README.md -------------------------------------------------------------------------------- /containers/container.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/container.yaml -------------------------------------------------------------------------------- /containers/pytorch/inference/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/inference/README.md -------------------------------------------------------------------------------- /containers/pytorch/inference/cpu/2.2.2/transformers/4.41.1/py311/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/inference/cpu/2.2.2/transformers/4.41.1/py311/Dockerfile -------------------------------------------------------------------------------- /containers/pytorch/inference/cpu/2.2.2/transformers/4.41.1/py311/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/inference/cpu/2.2.2/transformers/4.41.1/py311/entrypoint.sh -------------------------------------------------------------------------------- /containers/pytorch/inference/cpu/2.2.2/transformers/4.44.0/py311/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/inference/cpu/2.2.2/transformers/4.44.0/py311/Dockerfile -------------------------------------------------------------------------------- /containers/pytorch/inference/cpu/2.2.2/transformers/4.44.0/py311/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/inference/cpu/2.2.2/transformers/4.44.0/py311/entrypoint.sh -------------------------------------------------------------------------------- /containers/pytorch/inference/cpu/2.3.1/transformers/4.46.1/py311/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/inference/cpu/2.3.1/transformers/4.46.1/py311/Dockerfile -------------------------------------------------------------------------------- /containers/pytorch/inference/cpu/2.3.1/transformers/4.46.1/py311/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/inference/cpu/2.3.1/transformers/4.46.1/py311/entrypoint.sh -------------------------------------------------------------------------------- /containers/pytorch/inference/cpu/2.3.1/transformers/4.48.0/py311/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/inference/cpu/2.3.1/transformers/4.48.0/py311/Dockerfile -------------------------------------------------------------------------------- /containers/pytorch/inference/cpu/2.3.1/transformers/4.48.0/py311/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/inference/cpu/2.3.1/transformers/4.48.0/py311/entrypoint.sh -------------------------------------------------------------------------------- /containers/pytorch/inference/gpu/2.2.2/transformers/4.41.1/py311/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/inference/gpu/2.2.2/transformers/4.41.1/py311/Dockerfile -------------------------------------------------------------------------------- /containers/pytorch/inference/gpu/2.2.2/transformers/4.41.1/py311/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/inference/gpu/2.2.2/transformers/4.41.1/py311/entrypoint.sh -------------------------------------------------------------------------------- /containers/pytorch/inference/gpu/2.2.2/transformers/4.44.0/py311/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/inference/gpu/2.2.2/transformers/4.44.0/py311/Dockerfile -------------------------------------------------------------------------------- /containers/pytorch/inference/gpu/2.2.2/transformers/4.44.0/py311/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/inference/gpu/2.2.2/transformers/4.44.0/py311/entrypoint.sh -------------------------------------------------------------------------------- /containers/pytorch/inference/gpu/2.3.1/transformers/4.46.1/py311/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/inference/gpu/2.3.1/transformers/4.46.1/py311/Dockerfile -------------------------------------------------------------------------------- /containers/pytorch/inference/gpu/2.3.1/transformers/4.46.1/py311/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/inference/gpu/2.3.1/transformers/4.46.1/py311/entrypoint.sh -------------------------------------------------------------------------------- /containers/pytorch/inference/gpu/2.3.1/transformers/4.48.0/py311/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/inference/gpu/2.3.1/transformers/4.48.0/py311/Dockerfile -------------------------------------------------------------------------------- /containers/pytorch/inference/gpu/2.3.1/transformers/4.48.0/py311/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/inference/gpu/2.3.1/transformers/4.48.0/py311/entrypoint.sh -------------------------------------------------------------------------------- /containers/pytorch/training/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/training/README.md -------------------------------------------------------------------------------- /containers/pytorch/training/gpu/2.3.0/transformers/4.41.1/py310/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/training/gpu/2.3.0/transformers/4.41.1/py310/Dockerfile -------------------------------------------------------------------------------- /containers/pytorch/training/gpu/2.3.0/transformers/4.42.3/py310/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/training/gpu/2.3.0/transformers/4.42.3/py310/Dockerfile -------------------------------------------------------------------------------- /containers/pytorch/training/gpu/2.3.1/transformers/4.48.0/py311/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/training/gpu/2.3.1/transformers/4.48.0/py311/Dockerfile -------------------------------------------------------------------------------- /containers/pytorch/training/tpu/2.4.0/transformers/4.41.1/py310/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/training/tpu/2.4.0/transformers/4.41.1/py310/Dockerfile -------------------------------------------------------------------------------- /containers/pytorch/training/tpu/2.5.1/transformers/4.46.3/py310/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/pytorch/training/tpu/2.5.1/transformers/4.46.3/py310/Dockerfile -------------------------------------------------------------------------------- /containers/tei/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tei/README.md -------------------------------------------------------------------------------- /containers/tei/cpu/1.2.2/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tei/cpu/1.2.2/Dockerfile -------------------------------------------------------------------------------- /containers/tei/cpu/1.4.0/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tei/cpu/1.4.0/Dockerfile -------------------------------------------------------------------------------- /containers/tei/cpu/1.4.0/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tei/cpu/1.4.0/entrypoint.sh -------------------------------------------------------------------------------- /containers/tei/cpu/1.5.1/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tei/cpu/1.5.1/Dockerfile -------------------------------------------------------------------------------- /containers/tei/cpu/1.5.1/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tei/cpu/1.5.1/entrypoint.sh -------------------------------------------------------------------------------- /containers/tei/cpu/1.6.0/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tei/cpu/1.6.0/Dockerfile -------------------------------------------------------------------------------- /containers/tei/cpu/1.6.0/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tei/cpu/1.6.0/entrypoint.sh -------------------------------------------------------------------------------- /containers/tei/gpu/1.2.2/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tei/gpu/1.2.2/Dockerfile -------------------------------------------------------------------------------- /containers/tei/gpu/1.4.0/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tei/gpu/1.4.0/Dockerfile -------------------------------------------------------------------------------- /containers/tei/gpu/1.4.0/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tei/gpu/1.4.0/entrypoint.sh -------------------------------------------------------------------------------- /containers/tei/gpu/1.5.1/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tei/gpu/1.5.1/Dockerfile -------------------------------------------------------------------------------- /containers/tei/gpu/1.5.1/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tei/gpu/1.5.1/entrypoint.sh -------------------------------------------------------------------------------- /containers/tei/gpu/1.6.0/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tei/gpu/1.6.0/Dockerfile -------------------------------------------------------------------------------- /containers/tei/gpu/1.6.0/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tei/gpu/1.6.0/entrypoint.sh -------------------------------------------------------------------------------- /containers/tgi/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/README.md -------------------------------------------------------------------------------- /containers/tgi/gpu/1.4.2/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/gpu/1.4.2/Dockerfile -------------------------------------------------------------------------------- /containers/tgi/gpu/1.4.4/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/gpu/1.4.4/Dockerfile -------------------------------------------------------------------------------- /containers/tgi/gpu/2.0.0/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/gpu/2.0.0/Dockerfile -------------------------------------------------------------------------------- /containers/tgi/gpu/2.0.0/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/gpu/2.0.0/entrypoint.sh -------------------------------------------------------------------------------- /containers/tgi/gpu/2.0.1/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/gpu/2.0.1/Dockerfile -------------------------------------------------------------------------------- /containers/tgi/gpu/2.0.3/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/gpu/2.0.3/Dockerfile -------------------------------------------------------------------------------- /containers/tgi/gpu/2.0.3/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/gpu/2.0.3/entrypoint.sh -------------------------------------------------------------------------------- /containers/tgi/gpu/2.1.0/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/gpu/2.1.0/Dockerfile -------------------------------------------------------------------------------- /containers/tgi/gpu/2.1.0/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/gpu/2.1.0/entrypoint.sh -------------------------------------------------------------------------------- /containers/tgi/gpu/2.1.1/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/gpu/2.1.1/Dockerfile -------------------------------------------------------------------------------- /containers/tgi/gpu/2.1.1/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/gpu/2.1.1/entrypoint.sh -------------------------------------------------------------------------------- /containers/tgi/gpu/2.2.0/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/gpu/2.2.0/Dockerfile -------------------------------------------------------------------------------- /containers/tgi/gpu/2.2.0/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/gpu/2.2.0/entrypoint.sh -------------------------------------------------------------------------------- /containers/tgi/gpu/2.3.1/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/gpu/2.3.1/Dockerfile -------------------------------------------------------------------------------- /containers/tgi/gpu/2.3.1/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/gpu/2.3.1/entrypoint.sh -------------------------------------------------------------------------------- /containers/tgi/gpu/2.4.0/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/gpu/2.4.0/Dockerfile -------------------------------------------------------------------------------- /containers/tgi/gpu/2.4.0/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/gpu/2.4.0/entrypoint.sh -------------------------------------------------------------------------------- /containers/tgi/gpu/3.0.1/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/gpu/3.0.1/Dockerfile -------------------------------------------------------------------------------- /containers/tgi/gpu/3.0.1/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/gpu/3.0.1/entrypoint.sh -------------------------------------------------------------------------------- /containers/tgi/tpu/0.1.4/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/tpu/0.1.4/Dockerfile -------------------------------------------------------------------------------- /containers/tgi/tpu/0.1.4/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/tpu/0.1.4/entrypoint.sh -------------------------------------------------------------------------------- /containers/tgi/tpu/0.2.2/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/tpu/0.2.2/Dockerfile -------------------------------------------------------------------------------- /containers/tgi/tpu/0.2.2/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/tpu/0.2.2/entrypoint.sh -------------------------------------------------------------------------------- /containers/tgi/tpu/0.2.3/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/tpu/0.2.3/Dockerfile -------------------------------------------------------------------------------- /containers/tgi/tpu/0.2.3/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/containers/tgi/tpu/0.2.3/entrypoint.sh -------------------------------------------------------------------------------- /docs/scripts/auto-generate-examples.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/docs/scripts/auto-generate-examples.py -------------------------------------------------------------------------------- /docs/scripts/auto-update-toctree.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/docs/scripts/auto-update-toctree.py -------------------------------------------------------------------------------- /docs/source/_redirects.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/docs/source/_redirects.yml -------------------------------------------------------------------------------- /docs/source/_toctree.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/docs/source/_toctree.yml -------------------------------------------------------------------------------- /docs/source/containers/available.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/docs/source/containers/available.mdx -------------------------------------------------------------------------------- /docs/source/containers/introduction.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/docs/source/containers/introduction.mdx -------------------------------------------------------------------------------- /docs/source/features.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/docs/source/features.mdx -------------------------------------------------------------------------------- /docs/source/index.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/docs/source/index.mdx -------------------------------------------------------------------------------- /docs/source/resources.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/docs/source/resources.mdx -------------------------------------------------------------------------------- /docs/source/tpu.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/docs/source/tpu.mdx -------------------------------------------------------------------------------- /examples/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/README.md -------------------------------------------------------------------------------- /examples/cloud-run/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/cloud-run/README.md -------------------------------------------------------------------------------- /examples/cloud-run/deploy-gemma-2-on-cloud-run/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/cloud-run/deploy-gemma-2-on-cloud-run/README.md -------------------------------------------------------------------------------- /examples/cloud-run/deploy-gemma-2-on-cloud-run/imgs/cloud-run-deployment.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/cloud-run/deploy-gemma-2-on-cloud-run/imgs/cloud-run-deployment.png -------------------------------------------------------------------------------- /examples/cloud-run/deploy-gemma-2-on-cloud-run/imgs/cloud-run-details.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/cloud-run/deploy-gemma-2-on-cloud-run/imgs/cloud-run-details.png -------------------------------------------------------------------------------- /examples/cloud-run/deploy-llama-3-1-on-cloud-run/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/cloud-run/deploy-llama-3-1-on-cloud-run/README.md -------------------------------------------------------------------------------- /examples/cloud-run/deploy-llama-3-1-on-cloud-run/imgs/cloud-run-deployment.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/cloud-run/deploy-llama-3-1-on-cloud-run/imgs/cloud-run-deployment.png -------------------------------------------------------------------------------- /examples/cloud-run/deploy-llama-3-1-on-cloud-run/imgs/cloud-run-details.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/cloud-run/deploy-llama-3-1-on-cloud-run/imgs/cloud-run-details.png -------------------------------------------------------------------------------- /examples/gke/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/README.md -------------------------------------------------------------------------------- /examples/gke/tei-deployment/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tei-deployment/README.md -------------------------------------------------------------------------------- /examples/gke/tei-deployment/cpu-config/deployment.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tei-deployment/cpu-config/deployment.yaml -------------------------------------------------------------------------------- /examples/gke/tei-deployment/cpu-config/ingress.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tei-deployment/cpu-config/ingress.yaml -------------------------------------------------------------------------------- /examples/gke/tei-deployment/cpu-config/service.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tei-deployment/cpu-config/service.yaml -------------------------------------------------------------------------------- /examples/gke/tei-deployment/gpu-config/deployment.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tei-deployment/gpu-config/deployment.yaml -------------------------------------------------------------------------------- /examples/gke/tei-deployment/gpu-config/ingress.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tei-deployment/gpu-config/ingress.yaml -------------------------------------------------------------------------------- /examples/gke/tei-deployment/gpu-config/service.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tei-deployment/gpu-config/service.yaml -------------------------------------------------------------------------------- /examples/gke/tei-deployment/imgs/gke-cluster.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tei-deployment/imgs/gke-cluster.png -------------------------------------------------------------------------------- /examples/gke/tei-deployment/imgs/gke-deployment.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tei-deployment/imgs/gke-deployment.png -------------------------------------------------------------------------------- /examples/gke/tei-from-gcs-deployment/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tei-from-gcs-deployment/README.md -------------------------------------------------------------------------------- /examples/gke/tei-from-gcs-deployment/cpu-config/deployment.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tei-from-gcs-deployment/cpu-config/deployment.yaml -------------------------------------------------------------------------------- /examples/gke/tei-from-gcs-deployment/cpu-config/ingress.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tei-from-gcs-deployment/cpu-config/ingress.yaml -------------------------------------------------------------------------------- /examples/gke/tei-from-gcs-deployment/cpu-config/service.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tei-from-gcs-deployment/cpu-config/service.yaml -------------------------------------------------------------------------------- /examples/gke/tei-from-gcs-deployment/cpu-config/storageclass.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tei-from-gcs-deployment/cpu-config/storageclass.yaml -------------------------------------------------------------------------------- /examples/gke/tei-from-gcs-deployment/gpu-config/deployment.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tei-from-gcs-deployment/gpu-config/deployment.yaml -------------------------------------------------------------------------------- /examples/gke/tei-from-gcs-deployment/gpu-config/ingress.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tei-from-gcs-deployment/gpu-config/ingress.yaml -------------------------------------------------------------------------------- /examples/gke/tei-from-gcs-deployment/gpu-config/service.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tei-from-gcs-deployment/gpu-config/service.yaml -------------------------------------------------------------------------------- /examples/gke/tei-from-gcs-deployment/gpu-config/storageclass.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tei-from-gcs-deployment/gpu-config/storageclass.yaml -------------------------------------------------------------------------------- /examples/gke/tei-from-gcs-deployment/imgs/gcs-bucket.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tei-from-gcs-deployment/imgs/gcs-bucket.png -------------------------------------------------------------------------------- /examples/gke/tei-from-gcs-deployment/imgs/gke-cluster.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tei-from-gcs-deployment/imgs/gke-cluster.png -------------------------------------------------------------------------------- /examples/gke/tei-from-gcs-deployment/imgs/gke-deployment.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tei-from-gcs-deployment/imgs/gke-deployment.png -------------------------------------------------------------------------------- /examples/gke/tgi-deployment/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-deployment/README.md -------------------------------------------------------------------------------- /examples/gke/tgi-deployment/config/deployment.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-deployment/config/deployment.yaml -------------------------------------------------------------------------------- /examples/gke/tgi-deployment/config/ingress.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-deployment/config/ingress.yaml -------------------------------------------------------------------------------- /examples/gke/tgi-deployment/config/service.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-deployment/config/service.yaml -------------------------------------------------------------------------------- /examples/gke/tgi-deployment/imgs/gke-cluster.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-deployment/imgs/gke-cluster.png -------------------------------------------------------------------------------- /examples/gke/tgi-deployment/imgs/gke-deployment.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-deployment/imgs/gke-deployment.png -------------------------------------------------------------------------------- /examples/gke/tgi-deployment/imgs/gke-secrets.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-deployment/imgs/gke-secrets.png -------------------------------------------------------------------------------- /examples/gke/tgi-from-gcs-deployment/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-from-gcs-deployment/README.md -------------------------------------------------------------------------------- /examples/gke/tgi-from-gcs-deployment/config/deployment.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-from-gcs-deployment/config/deployment.yaml -------------------------------------------------------------------------------- /examples/gke/tgi-from-gcs-deployment/config/ingress.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-from-gcs-deployment/config/ingress.yaml -------------------------------------------------------------------------------- /examples/gke/tgi-from-gcs-deployment/config/service.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-from-gcs-deployment/config/service.yaml -------------------------------------------------------------------------------- /examples/gke/tgi-from-gcs-deployment/config/storageclass.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-from-gcs-deployment/config/storageclass.yaml -------------------------------------------------------------------------------- /examples/gke/tgi-from-gcs-deployment/imgs/gcs-bucket.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-from-gcs-deployment/imgs/gcs-bucket.png -------------------------------------------------------------------------------- /examples/gke/tgi-from-gcs-deployment/imgs/gke-cluster.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-from-gcs-deployment/imgs/gke-cluster.png -------------------------------------------------------------------------------- /examples/gke/tgi-from-gcs-deployment/imgs/gke-deployment.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-from-gcs-deployment/imgs/gke-deployment.png -------------------------------------------------------------------------------- /examples/gke/tgi-llama-405b-deployment/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-llama-405b-deployment/README.md -------------------------------------------------------------------------------- /examples/gke/tgi-llama-405b-deployment/config/deployment.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-llama-405b-deployment/config/deployment.yaml -------------------------------------------------------------------------------- /examples/gke/tgi-llama-405b-deployment/config/ingress.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-llama-405b-deployment/config/ingress.yaml -------------------------------------------------------------------------------- /examples/gke/tgi-llama-405b-deployment/config/service.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-llama-405b-deployment/config/service.yaml -------------------------------------------------------------------------------- /examples/gke/tgi-llama-405b-deployment/imgs/gke-cluster.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-llama-405b-deployment/imgs/gke-cluster.png -------------------------------------------------------------------------------- /examples/gke/tgi-llama-405b-deployment/imgs/gke-deployment-logs.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-llama-405b-deployment/imgs/gke-deployment-logs.png -------------------------------------------------------------------------------- /examples/gke/tgi-llama-405b-deployment/imgs/gke-deployment.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-llama-405b-deployment/imgs/gke-deployment.png -------------------------------------------------------------------------------- /examples/gke/tgi-llama-vision-deployment/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-llama-vision-deployment/README.md -------------------------------------------------------------------------------- /examples/gke/tgi-llama-vision-deployment/config/deployment.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-llama-vision-deployment/config/deployment.yaml -------------------------------------------------------------------------------- /examples/gke/tgi-llama-vision-deployment/config/ingress.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-llama-vision-deployment/config/ingress.yaml -------------------------------------------------------------------------------- /examples/gke/tgi-llama-vision-deployment/config/service.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-llama-vision-deployment/config/service.yaml -------------------------------------------------------------------------------- /examples/gke/tgi-llama-vision-deployment/imgs/gke-cluster.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-llama-vision-deployment/imgs/gke-cluster.png -------------------------------------------------------------------------------- /examples/gke/tgi-llama-vision-deployment/imgs/gke-deployment-logs.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-llama-vision-deployment/imgs/gke-deployment-logs.png -------------------------------------------------------------------------------- /examples/gke/tgi-llama-vision-deployment/imgs/gke-deployment.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-llama-vision-deployment/imgs/gke-deployment.png -------------------------------------------------------------------------------- /examples/gke/tgi-llama-vision-deployment/imgs/gke-secrets.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-llama-vision-deployment/imgs/gke-secrets.png -------------------------------------------------------------------------------- /examples/gke/tgi-multi-lora-deployment/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-multi-lora-deployment/README.md -------------------------------------------------------------------------------- /examples/gke/tgi-multi-lora-deployment/config/deployment.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-multi-lora-deployment/config/deployment.yaml -------------------------------------------------------------------------------- /examples/gke/tgi-multi-lora-deployment/config/ingress.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-multi-lora-deployment/config/ingress.yaml -------------------------------------------------------------------------------- /examples/gke/tgi-multi-lora-deployment/config/service.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-multi-lora-deployment/config/service.yaml -------------------------------------------------------------------------------- /examples/gke/tgi-multi-lora-deployment/imgs/gke-cluster.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-multi-lora-deployment/imgs/gke-cluster.png -------------------------------------------------------------------------------- /examples/gke/tgi-multi-lora-deployment/imgs/gke-deployment-logs.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-multi-lora-deployment/imgs/gke-deployment-logs.png -------------------------------------------------------------------------------- /examples/gke/tgi-multi-lora-deployment/imgs/gke-deployment.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-multi-lora-deployment/imgs/gke-deployment.png -------------------------------------------------------------------------------- /examples/gke/tgi-multi-lora-deployment/imgs/gke-secrets.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/tgi-multi-lora-deployment/imgs/gke-secrets.png -------------------------------------------------------------------------------- /examples/gke/trl-full-fine-tuning/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/trl-full-fine-tuning/README.md -------------------------------------------------------------------------------- /examples/gke/trl-full-fine-tuning/imgs/can-it-run-llm.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/trl-full-fine-tuning/imgs/can-it-run-llm.png -------------------------------------------------------------------------------- /examples/gke/trl-full-fine-tuning/imgs/gcs-bucket.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/trl-full-fine-tuning/imgs/gcs-bucket.png -------------------------------------------------------------------------------- /examples/gke/trl-full-fine-tuning/imgs/gke-cluster.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/trl-full-fine-tuning/imgs/gke-cluster.png -------------------------------------------------------------------------------- /examples/gke/trl-full-fine-tuning/imgs/gke-job-completed.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/trl-full-fine-tuning/imgs/gke-job-completed.png -------------------------------------------------------------------------------- /examples/gke/trl-full-fine-tuning/imgs/gke-job-created.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/trl-full-fine-tuning/imgs/gke-job-created.png -------------------------------------------------------------------------------- /examples/gke/trl-full-fine-tuning/imgs/gke-job-logs.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/trl-full-fine-tuning/imgs/gke-job-logs.png -------------------------------------------------------------------------------- /examples/gke/trl-full-fine-tuning/imgs/gke-job-running.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/trl-full-fine-tuning/imgs/gke-job-running.png -------------------------------------------------------------------------------- /examples/gke/trl-full-fine-tuning/job.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/trl-full-fine-tuning/job.yaml -------------------------------------------------------------------------------- /examples/gke/trl-lora-fine-tuning/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/trl-lora-fine-tuning/README.md -------------------------------------------------------------------------------- /examples/gke/trl-lora-fine-tuning/imgs/can-it-run-llm.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/trl-lora-fine-tuning/imgs/can-it-run-llm.png -------------------------------------------------------------------------------- /examples/gke/trl-lora-fine-tuning/imgs/gcs-bucket.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/trl-lora-fine-tuning/imgs/gcs-bucket.png -------------------------------------------------------------------------------- /examples/gke/trl-lora-fine-tuning/imgs/gke-cluster.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/trl-lora-fine-tuning/imgs/gke-cluster.png -------------------------------------------------------------------------------- /examples/gke/trl-lora-fine-tuning/imgs/gke-job-completed.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/trl-lora-fine-tuning/imgs/gke-job-completed.png -------------------------------------------------------------------------------- /examples/gke/trl-lora-fine-tuning/imgs/gke-job-created.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/trl-lora-fine-tuning/imgs/gke-job-created.png -------------------------------------------------------------------------------- /examples/gke/trl-lora-fine-tuning/imgs/gke-job-logs.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/trl-lora-fine-tuning/imgs/gke-job-logs.png -------------------------------------------------------------------------------- /examples/gke/trl-lora-fine-tuning/imgs/gke-job-running.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/trl-lora-fine-tuning/imgs/gke-job-running.png -------------------------------------------------------------------------------- /examples/gke/trl-lora-fine-tuning/job.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/gke/trl-lora-fine-tuning/job.yaml -------------------------------------------------------------------------------- /examples/vertex-ai/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/README.md -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-bert-on-vertex-ai/assets/model-in-hf-hub.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-bert-on-vertex-ai/assets/model-in-hf-hub.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-bert-on-vertex-ai/assets/vertex-ai-endpoint-ready.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-bert-on-vertex-ai/assets/vertex-ai-endpoint-ready.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-bert-on-vertex-ai/assets/vertex-ai-endpoint.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-bert-on-vertex-ai/assets/vertex-ai-endpoint.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-bert-on-vertex-ai/assets/vertex-ai-model-ready.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-bert-on-vertex-ai/assets/vertex-ai-model-ready.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-bert-on-vertex-ai/assets/vertex-ai-model-version.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-bert-on-vertex-ai/assets/vertex-ai-model-version.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-bert-on-vertex-ai/assets/vertex-ai-model.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-bert-on-vertex-ai/assets/vertex-ai-model.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-bert-on-vertex-ai/vertex-notebook.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-bert-on-vertex-ai/vertex-notebook.ipynb -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-embedding-on-vertex-ai/assets/model-in-hf-hub.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-embedding-on-vertex-ai/assets/model-in-hf-hub.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-embedding-on-vertex-ai/assets/vertex-ai-endpoint-logs-predict.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-embedding-on-vertex-ai/assets/vertex-ai-endpoint-logs-predict.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-embedding-on-vertex-ai/assets/vertex-ai-endpoint-logs.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-embedding-on-vertex-ai/assets/vertex-ai-endpoint-logs.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-embedding-on-vertex-ai/assets/vertex-ai-endpoint-run.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-embedding-on-vertex-ai/assets/vertex-ai-endpoint-run.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-embedding-on-vertex-ai/assets/vertex-ai-endpoint.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-embedding-on-vertex-ai/assets/vertex-ai-endpoint.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-embedding-on-vertex-ai/assets/vertex-ai-model.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-embedding-on-vertex-ai/assets/vertex-ai-model.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-embedding-on-vertex-ai/vertex-notebook.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-embedding-on-vertex-ai/vertex-notebook.ipynb -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-flux-on-vertex-ai/assets/flux-dev-output.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-flux-on-vertex-ai/assets/flux-dev-output.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-flux-on-vertex-ai/assets/model-in-hf-hub.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-flux-on-vertex-ai/assets/model-in-hf-hub.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-flux-on-vertex-ai/assets/vertex-ai-endpoint-ready.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-flux-on-vertex-ai/assets/vertex-ai-endpoint-ready.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-flux-on-vertex-ai/assets/vertex-ai-endpoint.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-flux-on-vertex-ai/assets/vertex-ai-endpoint.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-flux-on-vertex-ai/assets/vertex-ai-model-ready.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-flux-on-vertex-ai/assets/vertex-ai-model-ready.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-flux-on-vertex-ai/assets/vertex-ai-model-version.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-flux-on-vertex-ai/assets/vertex-ai-model-version.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-flux-on-vertex-ai/assets/vertex-ai-model.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-flux-on-vertex-ai/assets/vertex-ai-model.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-flux-on-vertex-ai/vertex-notebook.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-flux-on-vertex-ai/vertex-notebook.ipynb -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-gemma-from-gcs-on-vertex-ai/assets/gcs-model-artifact.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-gemma-from-gcs-on-vertex-ai/assets/gcs-model-artifact.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-gemma-from-gcs-on-vertex-ai/assets/model-in-hf-hub.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-gemma-from-gcs-on-vertex-ai/assets/model-in-hf-hub.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-gemma-from-gcs-on-vertex-ai/assets/vertex-ai-endpoint-logs.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-gemma-from-gcs-on-vertex-ai/assets/vertex-ai-endpoint-logs.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-gemma-from-gcs-on-vertex-ai/assets/vertex-ai-endpoint-run.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-gemma-from-gcs-on-vertex-ai/assets/vertex-ai-endpoint-run.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-gemma-from-gcs-on-vertex-ai/assets/vertex-ai-endpoint.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-gemma-from-gcs-on-vertex-ai/assets/vertex-ai-endpoint.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-gemma-from-gcs-on-vertex-ai/assets/vertex-ai-model-path.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-gemma-from-gcs-on-vertex-ai/assets/vertex-ai-model-path.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-gemma-from-gcs-on-vertex-ai/assets/vertex-ai-model.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-gemma-from-gcs-on-vertex-ai/assets/vertex-ai-model.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-gemma-from-gcs-on-vertex-ai/assets/vertex-ai-online-prediction.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-gemma-from-gcs-on-vertex-ai/assets/vertex-ai-online-prediction.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-gemma-from-gcs-on-vertex-ai/vertex-notebook.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-gemma-from-gcs-on-vertex-ai/vertex-notebook.ipynb -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-gemma-on-vertex-ai/assets/model-in-hf-hub.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-gemma-on-vertex-ai/assets/model-in-hf-hub.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-gemma-on-vertex-ai/assets/vertex-ai-endpoint-logs-predict.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-gemma-on-vertex-ai/assets/vertex-ai-endpoint-logs-predict.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-gemma-on-vertex-ai/assets/vertex-ai-endpoint-logs.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-gemma-on-vertex-ai/assets/vertex-ai-endpoint-logs.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-gemma-on-vertex-ai/assets/vertex-ai-endpoint-run.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-gemma-on-vertex-ai/assets/vertex-ai-endpoint-run.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-gemma-on-vertex-ai/assets/vertex-ai-endpoint.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-gemma-on-vertex-ai/assets/vertex-ai-endpoint.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-gemma-on-vertex-ai/assets/vertex-ai-model.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-gemma-on-vertex-ai/assets/vertex-ai-model.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-gemma-on-vertex-ai/assets/vertex-ai-online-prediction.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-gemma-on-vertex-ai/assets/vertex-ai-online-prediction.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-gemma-on-vertex-ai/vertex-notebook.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-gemma-on-vertex-ai/vertex-notebook.ipynb -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-llama-3-1-405b-on-vertex-ai/assets/a3-general-availability.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-llama-3-1-405b-on-vertex-ai/assets/a3-general-availability.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-llama-3-1-405b-on-vertex-ai/assets/a3-quota-request.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-llama-3-1-405b-on-vertex-ai/assets/a3-quota-request.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-llama-3-1-405b-on-vertex-ai/assets/model-in-hf-hub.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-llama-3-1-405b-on-vertex-ai/assets/model-in-hf-hub.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-llama-3-1-405b-on-vertex-ai/assets/vertex-ai-endpoint.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-llama-3-1-405b-on-vertex-ai/assets/vertex-ai-endpoint.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-llama-3-1-405b-on-vertex-ai/assets/vertex-ai-model.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-llama-3-1-405b-on-vertex-ai/assets/vertex-ai-model.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-llama-3-1-405b-on-vertex-ai/assets/vertex-ai-online-prediction.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-llama-3-1-405b-on-vertex-ai/assets/vertex-ai-online-prediction.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-llama-3-1-405b-on-vertex-ai/vertex-notebook.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-llama-3-1-405b-on-vertex-ai/vertex-notebook.ipynb -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-llama-vision-on-vertex-ai/assets/model-in-hf-hub.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-llama-vision-on-vertex-ai/assets/model-in-hf-hub.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-llama-vision-on-vertex-ai/assets/vertex-ai-endpoint-run.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-llama-vision-on-vertex-ai/assets/vertex-ai-endpoint-run.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-llama-vision-on-vertex-ai/assets/vertex-ai-endpoint.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-llama-vision-on-vertex-ai/assets/vertex-ai-endpoint.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-llama-vision-on-vertex-ai/assets/vertex-ai-model.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-llama-vision-on-vertex-ai/assets/vertex-ai-model.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-llama-vision-on-vertex-ai/assets/vertex-ai-online-prediction.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-llama-vision-on-vertex-ai/assets/vertex-ai-online-prediction.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/deploy-llama-vision-on-vertex-ai/vertex-notebook.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/deploy-llama-vision-on-vertex-ai/vertex-notebook.ipynb -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/evaluate-llms-with-vertex-ai/assets/experiment-results.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/evaluate-llms-with-vertex-ai/assets/experiment-results.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/evaluate-llms-with-vertex-ai/vertex-notebook.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/evaluate-llms-with-vertex-ai/vertex-notebook.ipynb -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/trl-full-sft-fine-tuning-on-vertex-ai/assets/can-it-run-llm.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/trl-full-sft-fine-tuning-on-vertex-ai/assets/can-it-run-llm.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/trl-full-sft-fine-tuning-on-vertex-ai/assets/gcs-bucket-artifacts.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/trl-full-sft-fine-tuning-on-vertex-ai/assets/gcs-bucket-artifacts.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/trl-full-sft-fine-tuning-on-vertex-ai/assets/vertex-ai-pipeline-completed.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/trl-full-sft-fine-tuning-on-vertex-ai/assets/vertex-ai-pipeline-completed.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/trl-full-sft-fine-tuning-on-vertex-ai/assets/vertex-ai-pipeline-logs.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/trl-full-sft-fine-tuning-on-vertex-ai/assets/vertex-ai-pipeline-logs.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/trl-full-sft-fine-tuning-on-vertex-ai/assets/vertex-ai-pipeline-scheduled.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/trl-full-sft-fine-tuning-on-vertex-ai/assets/vertex-ai-pipeline-scheduled.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/trl-full-sft-fine-tuning-on-vertex-ai/assets/vertex-ai-run.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/trl-full-sft-fine-tuning-on-vertex-ai/assets/vertex-ai-run.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/trl-full-sft-fine-tuning-on-vertex-ai/vertex-notebook.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/trl-full-sft-fine-tuning-on-vertex-ai/vertex-notebook.ipynb -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/trl-lora-sft-fine-tuning-on-vertex-ai/assets/can-it-run-llm.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/trl-lora-sft-fine-tuning-on-vertex-ai/assets/can-it-run-llm.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/trl-lora-sft-fine-tuning-on-vertex-ai/assets/gcs-bucket-artifacts.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/trl-lora-sft-fine-tuning-on-vertex-ai/assets/gcs-bucket-artifacts.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/trl-lora-sft-fine-tuning-on-vertex-ai/assets/vertex-ai-pipeline-completed.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/trl-lora-sft-fine-tuning-on-vertex-ai/assets/vertex-ai-pipeline-completed.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/trl-lora-sft-fine-tuning-on-vertex-ai/assets/vertex-ai-pipeline-logs.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/trl-lora-sft-fine-tuning-on-vertex-ai/assets/vertex-ai-pipeline-logs.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/trl-lora-sft-fine-tuning-on-vertex-ai/assets/vertex-ai-pipeline-scheduled.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/trl-lora-sft-fine-tuning-on-vertex-ai/assets/vertex-ai-pipeline-scheduled.png -------------------------------------------------------------------------------- /examples/vertex-ai/notebooks/trl-lora-sft-fine-tuning-on-vertex-ai/vertex-notebook.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/examples/vertex-ai/notebooks/trl-lora-sft-fine-tuning-on-vertex-ai/vertex-notebook.ipynb -------------------------------------------------------------------------------- /scripts/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/scripts/README.md -------------------------------------------------------------------------------- /scripts/internal/update_example_tables.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/scripts/internal/update_example_tables.py -------------------------------------------------------------------------------- /scripts/push_image_to_gcr.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/scripts/push_image_to_gcr.sh -------------------------------------------------------------------------------- /scripts/upload_model_to_gcs.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/Google-Cloud-Containers/HEAD/scripts/upload_model_to_gcs.sh --------------------------------------------------------------------------------