├── .github └── pull_request_template.md ├── .gitignore ├── CODEOWNERS ├── CODE_OF_CONDUCT.md ├── CONTRIBUTING.md ├── LICENSE ├── NOTICE ├── README.md ├── archive ├── README.md ├── hf_image_classification │ └── VisionPerceiverConv.ipynb ├── hf_text_classification │ └── LanguagePerceiver.ipynb └── unet_image_segmentation │ ├── model.py │ ├── train.py │ └── unet.ipynb ├── inference-benchmarking ├── Readme.md ├── __init__.py ├── accuracy.py ├── clients │ ├── __init__.py │ ├── base.py │ ├── llm_perf │ │ ├── __init__.py │ │ ├── client.py │ │ └── scripts │ │ │ ├── __init__.py │ │ │ ├── run_llm_perf.sh │ │ │ └── setup_llm_perf.sh │ ├── lm_eval │ │ ├── __init__.py │ │ ├── client.py │ │ └── scripts │ │ │ ├── __init__.py │ │ │ ├── run_lm_eval.sh │ │ │ └── setup_lm_eval.sh │ └── long_bench │ │ ├── __init__.py │ │ ├── client.py │ │ └── prompts │ │ ├── 0shot.txt │ │ ├── 0shot_cot.txt │ │ ├── 0shot_cot_ans.txt │ │ ├── 0shot_no_context.txt │ │ ├── 0shot_rag.txt │ │ └── __init__.py ├── config.yaml ├── perf.yaml ├── performance.py ├── requirements.txt ├── server │ ├── __init__.py │ ├── scripts │ │ ├── __init__.py │ │ ├── prompt-template.jinja │ │ └── start_server.sh │ └── vllm.py ├── server_config.py └── utils │ ├── __init__.py │ ├── artifacts.py │ ├── parser.py │ ├── process.py │ ├── s3.py │ └── tee_output.py ├── releasenotes.md ├── tensorflow-neuron ├── README.md └── inference │ └── unet │ └── UnetTF2.ipynb ├── torch-neuron ├── README.md └── inference │ ├── beit │ └── BEiT.ipynb │ ├── bertbasecased │ └── BertBaseCased.ipynb │ ├── bertlargeuncased │ └── BertLargeUncased.ipynb │ ├── clip │ └── CLIP_Model_HF.ipynb │ ├── common │ ├── processing.py │ └── wrapper.py │ ├── craft │ └── Craft.ipynb │ ├── efficientnet │ └── EfficientNet.ipynb │ ├── fairseq │ └── Fairseq.ipynb │ ├── gfl_mmdet │ └── GFL.ipynb │ ├── hrnet │ └── HRnet.ipynb │ ├── marianmt │ └── MarianMT.ipynb │ ├── rcnn │ └── Rcnn.ipynb │ ├── resnet │ └── Resnet.ipynb │ ├── resnext │ └── Resnext.ipynb │ ├── robertabase │ └── RobertaBase.ipynb │ ├── ssd │ └── SSD300VGG16.ipynb │ ├── trocr │ └── TrOCR.ipynb │ ├── vgg │ └── VGG.ipynb │ ├── vit │ └── ViT.ipynb │ ├── yolof_detectron2 │ └── YoloF.ipynb │ ├── yolov5 │ └── Yolov5.ipynb │ ├── yolov6 │ └── Yolov6.ipynb │ └── yolov7 │ └── Yolov7.ipynb └── torch-neuronx ├── README.md ├── inference ├── customop_mlp │ ├── README.md │ ├── neuron-multicore │ │ ├── build.py │ │ ├── inference.py │ │ ├── model.py │ │ ├── my_ops.py │ │ ├── relu.cpp │ │ └── shape.cpp │ ├── neuron-tcm │ │ ├── build.py │ │ ├── inference.py │ │ ├── model.py │ │ ├── my_ops.py │ │ ├── relu.cpp │ │ └── shape.cpp │ └── neuron │ │ ├── build.py │ │ ├── inference.py │ │ ├── model.py │ │ ├── my_ops.py │ │ ├── relu.cpp │ │ └── shape.cpp ├── hf_pretrained_bert_inference_on_trn1.ipynb ├── hf_pretrained_clip_base_inference_on_inf2.ipynb ├── hf_pretrained_clip_large_inference_on_inf2.ipynb ├── hf_pretrained_distilbert_Inference_on_trn1.ipynb ├── hf_pretrained_gpt2_feature_extraction_on_trn1.ipynb ├── hf_pretrained_perceiver_language_inference.ipynb ├── hf_pretrained_perceiver_multimodal_inference.ipynb ├── hf_pretrained_perceiver_vision_inference.ipynb ├── hf_pretrained_pixart_alpha_inference_on_inf2.ipynb ├── hf_pretrained_pixart_sigma_1k │ ├── compile_latency_optimized.sh │ ├── compile_throughput_optimized.sh │ ├── hf_pretrained_pixart_sigma_1k_latency_optimized.ipynb │ ├── hf_pretrained_pixart_sigma_1k_throughput_optimized.ipynb │ ├── neuron_pixart_sigma │ │ ├── cache_hf_model.py │ │ ├── compile_decoder.py │ │ ├── compile_text_encoder.py │ │ ├── compile_transformer_latency_optimized.py │ │ ├── compile_transformer_throughput_optimized.py │ │ ├── neuron_commons.py │ │ └── neuron_parallel_utils.py │ └── requirements.txt ├── hf_pretrained_pixart_sigma_inference_on_inf2.ipynb ├── hf_pretrained_roberta_inference_on_frn1.ipynb ├── hf_pretrained_sd15_512_inference.ipynb ├── hf_pretrained_sd2_512_inference.ipynb ├── hf_pretrained_sd2_768_inference.ipynb ├── hf_pretrained_sd2_inpainting_936_624_inference.ipynb ├── hf_pretrained_sd_x4_upscaler_inference.ipynb ├── hf_pretrained_sdxl_base_1024_inference.ipynb ├── hf_pretrained_sdxl_base_and_refiner_1024_inference.ipynb ├── hf_pretrained_vit_inference_on_inf2.ipynb ├── hf_pretrained_wav2vec2_conformer_relpos_inference_on_inf2.ipynb ├── hf_pretrained_wav2vec2_conformer_rope_inference_on_inf2.ipynb ├── pretrained_unet_inference_on_trn1.ipynb ├── sd2_inpainting_mask.png ├── sd2_inpainting_photo.png ├── tv_pretrained_resnet50_inference_on_trn1.ipynb └── tv_pretrained_vgg_inference_on_trn1.ipynb ├── microbenchmark ├── matmult_linear.py ├── microbenchmark.ipynb └── ubench_utils.py ├── training ├── aws-batch │ ├── all-reduce │ │ ├── README.md │ │ ├── build_configs_and_setup.sh │ │ ├── docker │ │ │ ├── Dockerfile │ │ │ ├── allreduce.py │ │ │ └── allreduce.sh │ │ ├── submit_job.sh │ │ └── templates │ │ │ ├── build_docker_image.sh │ │ │ ├── compute_env.json │ │ │ ├── create_resources.sh │ │ │ ├── job_def.json │ │ │ ├── job_queue.json │ │ │ └── launch_template.json │ └── llama2 │ │ ├── README.md │ │ ├── config.txt │ │ ├── docker │ │ ├── Dockerfile │ │ └── llama_batch_training.sh │ │ ├── images │ │ └── aws-batch.png │ │ ├── scripts │ │ ├── build_and_push_docker_image.sh │ │ ├── cleanup.sh │ │ ├── create_resources.sh │ │ ├── download_and_tokenize_data.sh │ │ └── submit_batch_job.sh │ │ ├── setup.sh │ │ └── templates │ │ ├── compute_env.json │ │ ├── job_def.json │ │ ├── job_queue.json │ │ └── launch_template.json ├── common │ ├── hf_utils.py │ └── vision_utils.py ├── customop_mlp │ ├── README.md │ ├── neuron │ │ ├── build.py │ │ ├── model.py │ │ ├── my_ops.py │ │ ├── relu.cpp │ │ ├── shape.cpp │ │ └── train.py │ └── pytorch │ │ ├── build.py │ │ ├── model.py │ │ ├── my_ops.py │ │ ├── relu.cpp │ │ └── train_cpu.py ├── dp_bert_hf_pretrain │ ├── adamw_fp32_optim_params.py │ ├── adamw_fp32_params_copy.py │ ├── dp_bert_large_hf_pretrain_hdf5.py │ ├── dp_bert_large_hf_pretrain_hdf5_THIRD-PARTY-LICENSES.txt │ ├── lamb.py │ ├── requirements.txt │ ├── run_dp_bert_large_hf_pretrain_bf16_s128.sh │ ├── run_dp_bert_large_hf_pretrain_bf16_s128_lamb.sh │ ├── run_dp_bert_large_hf_pretrain_bf16_s512_lamb_phase2.sh │ └── run_dp_bert_large_hf_pretrain_bf16_s512_phase2.sh ├── hf_bert_jp │ └── bert-jp-tutorial.ipynb ├── hf_contrastive_image_text │ ├── CLIPBase.ipynb │ ├── CLIPLarge.ipynb │ └── run_clip.py ├── hf_image_classification │ ├── run_image_classification.py │ └── vit.ipynb ├── hf_language_modeling │ └── gpt2 │ │ ├── gpt2.ipynb │ │ └── run_clm.patch ├── hf_sentiment_analysis │ ├── .gitignore │ ├── 01-hf-single-neuron.ipynb │ ├── 02-hf-distributed-training.ipynb │ ├── README.md │ ├── code │ │ ├── 01-trainium-single-core │ │ │ └── train.py │ │ └── 02-trainium-distributed-training │ │ │ └── train.py │ └── data │ │ ├── data.csv │ │ ├── test.csv │ │ └── train.csv ├── hf_summarization │ ├── BartLarge.ipynb │ ├── T5Large.ipynb │ └── run_summarization.py ├── hf_text_classification │ ├── AlbertBase.ipynb │ ├── BertBaseCased.ipynb │ ├── BertBaseUncased.ipynb │ ├── BertLargeCased.ipynb │ ├── BertLargeUncased.ipynb │ ├── CamembertBase.ipynb │ ├── DistilbertBaseUncased.ipynb │ ├── ElectraSmall.ipynb │ ├── README.md │ ├── RobertaBase.ipynb │ ├── RobertaLarge.ipynb │ ├── XlmRobertaBase.ipynb │ └── run_glue.py ├── llama2 │ ├── adamw_fp32_optim_params.py │ ├── convert_checkpoints.py │ ├── get_dataset.py │ ├── modeling_llama_nxd.py │ └── requirements.txt ├── mnist_mlp │ ├── eval.py │ ├── eval_using_trace.py │ ├── model.py │ ├── train.py │ ├── train_cpu.py │ ├── train_torchrun.py │ └── train_xmp.py ├── resnet50 │ ├── resnet50.ipynb │ └── run_image_classification.py ├── stable_diffusion │ ├── requirements.txt │ ├── run.py │ └── sd_training_neuron.py ├── tp_dp_bert_hf_pretrain │ ├── requirements.txt │ └── tp_dp_bert_large_hf_pretrain_hdf5.py ├── tp_dp_gpt_neox_hf_pretrain │ └── common │ │ ├── adamw_fp32_optim_params.py │ │ ├── get_dataset.py │ │ └── requirements.txt └── zero1_gpt2 │ ├── config_1p5B_gpt2.json │ ├── neuron_utils.py │ ├── requirements.txt │ ├── run_clm.sh │ ├── run_clm.slurm │ ├── run_clm_compile.slurm │ ├── run_clm_no_trainer.py │ └── uncomment_gradaccum.sh └── transformers-neuronx ├── README.md └── inference ├── codellama-13b-16k-sampling.ipynb ├── facebook-opt-13b-sampling.ipynb ├── facebook-opt-30b-sampling.ipynb ├── facebook-opt-66b-sampling.ipynb ├── gpt-j-6b-sampling-dp.ipynb ├── gpt-j-6b-sampling.ipynb ├── gpt-j-dp.py ├── llama-3.1-405b-multinode-16k-sampling.ipynb ├── llama-3.1-70b-64k-sampling.ipynb ├── llama-3.1-70b-eagle-speculative-decoding.ipynb ├── llama-3.1-70b-speculative-decoding.ipynb ├── llama-3.1-8b-128k-sampling.ipynb ├── llama-3.1-8b-32k-sampling.ipynb ├── llama-70b-sampling.ipynb ├── meta-llama-2-13b-sampling.ipynb ├── meta-llama-3-70b-sampling.ipynb ├── meta-llama-3-8b-sampling.ipynb ├── meta-llama-3.1-70b-sampling.ipynb ├── meta-llama-3.1-8b-sampling.ipynb ├── mistralai-Mistral-7b-Instruct-v0.2.ipynb ├── mixtral-8x7b-sampling.ipynb └── speculative_sampling.ipynb /.github/pull_request_template.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/.github/pull_request_template.md -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- 1 | .DS_Store 2 | .ipynb_checkpoints 3 | **/__pycache__ 4 | -------------------------------------------------------------------------------- /CODEOWNERS: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/CODEOWNERS -------------------------------------------------------------------------------- /CODE_OF_CONDUCT.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/CODE_OF_CONDUCT.md -------------------------------------------------------------------------------- /CONTRIBUTING.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/CONTRIBUTING.md -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/LICENSE -------------------------------------------------------------------------------- /NOTICE: -------------------------------------------------------------------------------- 1 | Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved. 2 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/README.md -------------------------------------------------------------------------------- /archive/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/archive/README.md -------------------------------------------------------------------------------- /archive/hf_image_classification/VisionPerceiverConv.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/archive/hf_image_classification/VisionPerceiverConv.ipynb -------------------------------------------------------------------------------- /archive/hf_text_classification/LanguagePerceiver.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/archive/hf_text_classification/LanguagePerceiver.ipynb -------------------------------------------------------------------------------- /archive/unet_image_segmentation/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/archive/unet_image_segmentation/model.py -------------------------------------------------------------------------------- /archive/unet_image_segmentation/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/archive/unet_image_segmentation/train.py -------------------------------------------------------------------------------- /archive/unet_image_segmentation/unet.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/archive/unet_image_segmentation/unet.ipynb -------------------------------------------------------------------------------- /inference-benchmarking/Readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/Readme.md -------------------------------------------------------------------------------- /inference-benchmarking/__init__.py: -------------------------------------------------------------------------------- 1 | """AWSNeuronEval module.""" 2 | 3 | # Implement your code here. 4 | -------------------------------------------------------------------------------- /inference-benchmarking/accuracy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/accuracy.py -------------------------------------------------------------------------------- /inference-benchmarking/clients/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference-benchmarking/clients/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/clients/base.py -------------------------------------------------------------------------------- /inference-benchmarking/clients/llm_perf/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/clients/llm_perf/__init__.py -------------------------------------------------------------------------------- /inference-benchmarking/clients/llm_perf/client.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/clients/llm_perf/client.py -------------------------------------------------------------------------------- /inference-benchmarking/clients/llm_perf/scripts/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference-benchmarking/clients/llm_perf/scripts/run_llm_perf.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/clients/llm_perf/scripts/run_llm_perf.sh -------------------------------------------------------------------------------- /inference-benchmarking/clients/llm_perf/scripts/setup_llm_perf.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/clients/llm_perf/scripts/setup_llm_perf.sh -------------------------------------------------------------------------------- /inference-benchmarking/clients/lm_eval/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/clients/lm_eval/__init__.py -------------------------------------------------------------------------------- /inference-benchmarking/clients/lm_eval/client.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/clients/lm_eval/client.py -------------------------------------------------------------------------------- /inference-benchmarking/clients/lm_eval/scripts/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference-benchmarking/clients/lm_eval/scripts/run_lm_eval.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/clients/lm_eval/scripts/run_lm_eval.sh -------------------------------------------------------------------------------- /inference-benchmarking/clients/lm_eval/scripts/setup_lm_eval.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/clients/lm_eval/scripts/setup_lm_eval.sh -------------------------------------------------------------------------------- /inference-benchmarking/clients/long_bench/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/clients/long_bench/__init__.py -------------------------------------------------------------------------------- /inference-benchmarking/clients/long_bench/client.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/clients/long_bench/client.py -------------------------------------------------------------------------------- /inference-benchmarking/clients/long_bench/prompts/0shot.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/clients/long_bench/prompts/0shot.txt -------------------------------------------------------------------------------- /inference-benchmarking/clients/long_bench/prompts/0shot_cot.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/clients/long_bench/prompts/0shot_cot.txt -------------------------------------------------------------------------------- /inference-benchmarking/clients/long_bench/prompts/0shot_cot_ans.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/clients/long_bench/prompts/0shot_cot_ans.txt -------------------------------------------------------------------------------- /inference-benchmarking/clients/long_bench/prompts/0shot_no_context.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/clients/long_bench/prompts/0shot_no_context.txt -------------------------------------------------------------------------------- /inference-benchmarking/clients/long_bench/prompts/0shot_rag.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/clients/long_bench/prompts/0shot_rag.txt -------------------------------------------------------------------------------- /inference-benchmarking/clients/long_bench/prompts/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference-benchmarking/config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/config.yaml -------------------------------------------------------------------------------- /inference-benchmarking/perf.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/perf.yaml -------------------------------------------------------------------------------- /inference-benchmarking/performance.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/performance.py -------------------------------------------------------------------------------- /inference-benchmarking/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/requirements.txt -------------------------------------------------------------------------------- /inference-benchmarking/server/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference-benchmarking/server/scripts/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference-benchmarking/server/scripts/prompt-template.jinja: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/server/scripts/prompt-template.jinja -------------------------------------------------------------------------------- /inference-benchmarking/server/scripts/start_server.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/server/scripts/start_server.sh -------------------------------------------------------------------------------- /inference-benchmarking/server/vllm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/server/vllm.py -------------------------------------------------------------------------------- /inference-benchmarking/server_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/server_config.py -------------------------------------------------------------------------------- /inference-benchmarking/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/utils/__init__.py -------------------------------------------------------------------------------- /inference-benchmarking/utils/artifacts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/utils/artifacts.py -------------------------------------------------------------------------------- /inference-benchmarking/utils/parser.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/utils/parser.py -------------------------------------------------------------------------------- /inference-benchmarking/utils/process.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/utils/process.py -------------------------------------------------------------------------------- /inference-benchmarking/utils/s3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/utils/s3.py -------------------------------------------------------------------------------- /inference-benchmarking/utils/tee_output.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/inference-benchmarking/utils/tee_output.py -------------------------------------------------------------------------------- /releasenotes.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/releasenotes.md -------------------------------------------------------------------------------- /tensorflow-neuron/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/tensorflow-neuron/README.md -------------------------------------------------------------------------------- /tensorflow-neuron/inference/unet/UnetTF2.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/tensorflow-neuron/inference/unet/UnetTF2.ipynb -------------------------------------------------------------------------------- /torch-neuron/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/README.md -------------------------------------------------------------------------------- /torch-neuron/inference/beit/BEiT.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/beit/BEiT.ipynb -------------------------------------------------------------------------------- /torch-neuron/inference/bertbasecased/BertBaseCased.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/bertbasecased/BertBaseCased.ipynb -------------------------------------------------------------------------------- /torch-neuron/inference/bertlargeuncased/BertLargeUncased.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/bertlargeuncased/BertLargeUncased.ipynb -------------------------------------------------------------------------------- /torch-neuron/inference/clip/CLIP_Model_HF.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/clip/CLIP_Model_HF.ipynb -------------------------------------------------------------------------------- /torch-neuron/inference/common/processing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/common/processing.py -------------------------------------------------------------------------------- /torch-neuron/inference/common/wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/common/wrapper.py -------------------------------------------------------------------------------- /torch-neuron/inference/craft/Craft.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/craft/Craft.ipynb -------------------------------------------------------------------------------- /torch-neuron/inference/efficientnet/EfficientNet.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/efficientnet/EfficientNet.ipynb -------------------------------------------------------------------------------- /torch-neuron/inference/fairseq/Fairseq.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/fairseq/Fairseq.ipynb -------------------------------------------------------------------------------- /torch-neuron/inference/gfl_mmdet/GFL.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/gfl_mmdet/GFL.ipynb -------------------------------------------------------------------------------- /torch-neuron/inference/hrnet/HRnet.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/hrnet/HRnet.ipynb -------------------------------------------------------------------------------- /torch-neuron/inference/marianmt/MarianMT.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/marianmt/MarianMT.ipynb -------------------------------------------------------------------------------- /torch-neuron/inference/rcnn/Rcnn.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/rcnn/Rcnn.ipynb -------------------------------------------------------------------------------- /torch-neuron/inference/resnet/Resnet.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/resnet/Resnet.ipynb -------------------------------------------------------------------------------- /torch-neuron/inference/resnext/Resnext.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/resnext/Resnext.ipynb -------------------------------------------------------------------------------- /torch-neuron/inference/robertabase/RobertaBase.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/robertabase/RobertaBase.ipynb -------------------------------------------------------------------------------- /torch-neuron/inference/ssd/SSD300VGG16.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/ssd/SSD300VGG16.ipynb -------------------------------------------------------------------------------- /torch-neuron/inference/trocr/TrOCR.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/trocr/TrOCR.ipynb -------------------------------------------------------------------------------- /torch-neuron/inference/vgg/VGG.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/vgg/VGG.ipynb -------------------------------------------------------------------------------- /torch-neuron/inference/vit/ViT.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/vit/ViT.ipynb -------------------------------------------------------------------------------- /torch-neuron/inference/yolof_detectron2/YoloF.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/yolof_detectron2/YoloF.ipynb -------------------------------------------------------------------------------- /torch-neuron/inference/yolov5/Yolov5.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/yolov5/Yolov5.ipynb -------------------------------------------------------------------------------- /torch-neuron/inference/yolov6/Yolov6.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/yolov6/Yolov6.ipynb -------------------------------------------------------------------------------- /torch-neuron/inference/yolov7/Yolov7.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuron/inference/yolov7/Yolov7.ipynb -------------------------------------------------------------------------------- /torch-neuronx/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/README.md -------------------------------------------------------------------------------- /torch-neuronx/inference/customop_mlp/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/customop_mlp/README.md -------------------------------------------------------------------------------- /torch-neuronx/inference/customop_mlp/neuron-multicore/build.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/customop_mlp/neuron-multicore/build.py -------------------------------------------------------------------------------- /torch-neuronx/inference/customop_mlp/neuron-multicore/inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/customop_mlp/neuron-multicore/inference.py -------------------------------------------------------------------------------- /torch-neuronx/inference/customop_mlp/neuron-multicore/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/customop_mlp/neuron-multicore/model.py -------------------------------------------------------------------------------- /torch-neuronx/inference/customop_mlp/neuron-multicore/my_ops.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/customop_mlp/neuron-multicore/my_ops.py -------------------------------------------------------------------------------- /torch-neuronx/inference/customop_mlp/neuron-multicore/relu.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/customop_mlp/neuron-multicore/relu.cpp -------------------------------------------------------------------------------- /torch-neuronx/inference/customop_mlp/neuron-multicore/shape.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/customop_mlp/neuron-multicore/shape.cpp -------------------------------------------------------------------------------- /torch-neuronx/inference/customop_mlp/neuron-tcm/build.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/customop_mlp/neuron-tcm/build.py -------------------------------------------------------------------------------- /torch-neuronx/inference/customop_mlp/neuron-tcm/inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/customop_mlp/neuron-tcm/inference.py -------------------------------------------------------------------------------- /torch-neuronx/inference/customop_mlp/neuron-tcm/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/customop_mlp/neuron-tcm/model.py -------------------------------------------------------------------------------- /torch-neuronx/inference/customop_mlp/neuron-tcm/my_ops.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/customop_mlp/neuron-tcm/my_ops.py -------------------------------------------------------------------------------- /torch-neuronx/inference/customop_mlp/neuron-tcm/relu.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/customop_mlp/neuron-tcm/relu.cpp -------------------------------------------------------------------------------- /torch-neuronx/inference/customop_mlp/neuron-tcm/shape.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/customop_mlp/neuron-tcm/shape.cpp -------------------------------------------------------------------------------- /torch-neuronx/inference/customop_mlp/neuron/build.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/customop_mlp/neuron/build.py -------------------------------------------------------------------------------- /torch-neuronx/inference/customop_mlp/neuron/inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/customop_mlp/neuron/inference.py -------------------------------------------------------------------------------- /torch-neuronx/inference/customop_mlp/neuron/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/customop_mlp/neuron/model.py -------------------------------------------------------------------------------- /torch-neuronx/inference/customop_mlp/neuron/my_ops.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/customop_mlp/neuron/my_ops.py -------------------------------------------------------------------------------- /torch-neuronx/inference/customop_mlp/neuron/relu.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/customop_mlp/neuron/relu.cpp -------------------------------------------------------------------------------- /torch-neuronx/inference/customop_mlp/neuron/shape.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/customop_mlp/neuron/shape.cpp -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_bert_inference_on_trn1.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_bert_inference_on_trn1.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_clip_base_inference_on_inf2.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_clip_base_inference_on_inf2.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_clip_large_inference_on_inf2.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_clip_large_inference_on_inf2.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_distilbert_Inference_on_trn1.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_distilbert_Inference_on_trn1.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_gpt2_feature_extraction_on_trn1.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_gpt2_feature_extraction_on_trn1.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_perceiver_language_inference.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_perceiver_language_inference.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_perceiver_multimodal_inference.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_perceiver_multimodal_inference.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_perceiver_vision_inference.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_perceiver_vision_inference.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_pixart_alpha_inference_on_inf2.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_pixart_alpha_inference_on_inf2.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/compile_latency_optimized.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/compile_latency_optimized.sh -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/compile_throughput_optimized.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/compile_throughput_optimized.sh -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/hf_pretrained_pixart_sigma_1k_latency_optimized.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/hf_pretrained_pixart_sigma_1k_latency_optimized.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/hf_pretrained_pixart_sigma_1k_throughput_optimized.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/hf_pretrained_pixart_sigma_1k_throughput_optimized.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/neuron_pixart_sigma/cache_hf_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/neuron_pixart_sigma/cache_hf_model.py -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/neuron_pixart_sigma/compile_decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/neuron_pixart_sigma/compile_decoder.py -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/neuron_pixart_sigma/compile_text_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/neuron_pixart_sigma/compile_text_encoder.py -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/neuron_pixart_sigma/compile_transformer_latency_optimized.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/neuron_pixart_sigma/compile_transformer_latency_optimized.py -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/neuron_pixart_sigma/compile_transformer_throughput_optimized.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/neuron_pixart_sigma/compile_transformer_throughput_optimized.py -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/neuron_pixart_sigma/neuron_commons.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/neuron_pixart_sigma/neuron_commons.py -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/neuron_pixart_sigma/neuron_parallel_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/neuron_pixart_sigma/neuron_parallel_utils.py -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_pixart_sigma_1k/requirements.txt -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_pixart_sigma_inference_on_inf2.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_pixart_sigma_inference_on_inf2.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_roberta_inference_on_frn1.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_roberta_inference_on_frn1.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_sd15_512_inference.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_sd15_512_inference.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_sd2_512_inference.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_sd2_512_inference.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_sd2_768_inference.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_sd2_768_inference.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_sd2_inpainting_936_624_inference.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_sd2_inpainting_936_624_inference.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_sd_x4_upscaler_inference.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_sd_x4_upscaler_inference.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_sdxl_base_1024_inference.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_sdxl_base_1024_inference.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_sdxl_base_and_refiner_1024_inference.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_sdxl_base_and_refiner_1024_inference.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_vit_inference_on_inf2.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_vit_inference_on_inf2.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_wav2vec2_conformer_relpos_inference_on_inf2.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_wav2vec2_conformer_relpos_inference_on_inf2.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/hf_pretrained_wav2vec2_conformer_rope_inference_on_inf2.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/hf_pretrained_wav2vec2_conformer_rope_inference_on_inf2.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/pretrained_unet_inference_on_trn1.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/pretrained_unet_inference_on_trn1.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/sd2_inpainting_mask.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/sd2_inpainting_mask.png -------------------------------------------------------------------------------- /torch-neuronx/inference/sd2_inpainting_photo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/sd2_inpainting_photo.png -------------------------------------------------------------------------------- /torch-neuronx/inference/tv_pretrained_resnet50_inference_on_trn1.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/tv_pretrained_resnet50_inference_on_trn1.ipynb -------------------------------------------------------------------------------- /torch-neuronx/inference/tv_pretrained_vgg_inference_on_trn1.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/inference/tv_pretrained_vgg_inference_on_trn1.ipynb -------------------------------------------------------------------------------- /torch-neuronx/microbenchmark/matmult_linear.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/microbenchmark/matmult_linear.py -------------------------------------------------------------------------------- /torch-neuronx/microbenchmark/microbenchmark.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/microbenchmark/microbenchmark.ipynb -------------------------------------------------------------------------------- /torch-neuronx/microbenchmark/ubench_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/microbenchmark/ubench_utils.py -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/all-reduce/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/all-reduce/README.md -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/all-reduce/build_configs_and_setup.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/all-reduce/build_configs_and_setup.sh -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/all-reduce/docker/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/all-reduce/docker/Dockerfile -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/all-reduce/docker/allreduce.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/all-reduce/docker/allreduce.py -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/all-reduce/docker/allreduce.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/all-reduce/docker/allreduce.sh -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/all-reduce/submit_job.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/all-reduce/submit_job.sh -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/all-reduce/templates/build_docker_image.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/all-reduce/templates/build_docker_image.sh -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/all-reduce/templates/compute_env.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/all-reduce/templates/compute_env.json -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/all-reduce/templates/create_resources.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/all-reduce/templates/create_resources.sh -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/all-reduce/templates/job_def.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/all-reduce/templates/job_def.json -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/all-reduce/templates/job_queue.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/all-reduce/templates/job_queue.json -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/all-reduce/templates/launch_template.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/all-reduce/templates/launch_template.json -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/llama2/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/llama2/README.md -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/llama2/config.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/llama2/config.txt -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/llama2/docker/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/llama2/docker/Dockerfile -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/llama2/docker/llama_batch_training.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/llama2/docker/llama_batch_training.sh -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/llama2/images/aws-batch.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/llama2/images/aws-batch.png -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/llama2/scripts/build_and_push_docker_image.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/llama2/scripts/build_and_push_docker_image.sh -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/llama2/scripts/cleanup.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/llama2/scripts/cleanup.sh -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/llama2/scripts/create_resources.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/llama2/scripts/create_resources.sh -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/llama2/scripts/download_and_tokenize_data.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/llama2/scripts/download_and_tokenize_data.sh -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/llama2/scripts/submit_batch_job.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/llama2/scripts/submit_batch_job.sh -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/llama2/setup.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/llama2/setup.sh -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/llama2/templates/compute_env.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/llama2/templates/compute_env.json -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/llama2/templates/job_def.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/llama2/templates/job_def.json -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/llama2/templates/job_queue.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/llama2/templates/job_queue.json -------------------------------------------------------------------------------- /torch-neuronx/training/aws-batch/llama2/templates/launch_template.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/aws-batch/llama2/templates/launch_template.json -------------------------------------------------------------------------------- /torch-neuronx/training/common/hf_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/common/hf_utils.py -------------------------------------------------------------------------------- /torch-neuronx/training/common/vision_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/common/vision_utils.py -------------------------------------------------------------------------------- /torch-neuronx/training/customop_mlp/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/customop_mlp/README.md -------------------------------------------------------------------------------- /torch-neuronx/training/customop_mlp/neuron/build.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/customop_mlp/neuron/build.py -------------------------------------------------------------------------------- /torch-neuronx/training/customop_mlp/neuron/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/customop_mlp/neuron/model.py -------------------------------------------------------------------------------- /torch-neuronx/training/customop_mlp/neuron/my_ops.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/customop_mlp/neuron/my_ops.py -------------------------------------------------------------------------------- /torch-neuronx/training/customop_mlp/neuron/relu.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/customop_mlp/neuron/relu.cpp -------------------------------------------------------------------------------- /torch-neuronx/training/customop_mlp/neuron/shape.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/customop_mlp/neuron/shape.cpp -------------------------------------------------------------------------------- /torch-neuronx/training/customop_mlp/neuron/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/customop_mlp/neuron/train.py -------------------------------------------------------------------------------- /torch-neuronx/training/customop_mlp/pytorch/build.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/customop_mlp/pytorch/build.py -------------------------------------------------------------------------------- /torch-neuronx/training/customop_mlp/pytorch/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/customop_mlp/pytorch/model.py -------------------------------------------------------------------------------- /torch-neuronx/training/customop_mlp/pytorch/my_ops.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/customop_mlp/pytorch/my_ops.py -------------------------------------------------------------------------------- /torch-neuronx/training/customop_mlp/pytorch/relu.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/customop_mlp/pytorch/relu.cpp -------------------------------------------------------------------------------- /torch-neuronx/training/customop_mlp/pytorch/train_cpu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/customop_mlp/pytorch/train_cpu.py -------------------------------------------------------------------------------- /torch-neuronx/training/dp_bert_hf_pretrain/adamw_fp32_optim_params.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/dp_bert_hf_pretrain/adamw_fp32_optim_params.py -------------------------------------------------------------------------------- /torch-neuronx/training/dp_bert_hf_pretrain/adamw_fp32_params_copy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/dp_bert_hf_pretrain/adamw_fp32_params_copy.py -------------------------------------------------------------------------------- /torch-neuronx/training/dp_bert_hf_pretrain/dp_bert_large_hf_pretrain_hdf5.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/dp_bert_hf_pretrain/dp_bert_large_hf_pretrain_hdf5.py -------------------------------------------------------------------------------- /torch-neuronx/training/dp_bert_hf_pretrain/dp_bert_large_hf_pretrain_hdf5_THIRD-PARTY-LICENSES.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/dp_bert_hf_pretrain/dp_bert_large_hf_pretrain_hdf5_THIRD-PARTY-LICENSES.txt -------------------------------------------------------------------------------- /torch-neuronx/training/dp_bert_hf_pretrain/lamb.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/dp_bert_hf_pretrain/lamb.py -------------------------------------------------------------------------------- /torch-neuronx/training/dp_bert_hf_pretrain/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/dp_bert_hf_pretrain/requirements.txt -------------------------------------------------------------------------------- /torch-neuronx/training/dp_bert_hf_pretrain/run_dp_bert_large_hf_pretrain_bf16_s128.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/dp_bert_hf_pretrain/run_dp_bert_large_hf_pretrain_bf16_s128.sh -------------------------------------------------------------------------------- /torch-neuronx/training/dp_bert_hf_pretrain/run_dp_bert_large_hf_pretrain_bf16_s128_lamb.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/dp_bert_hf_pretrain/run_dp_bert_large_hf_pretrain_bf16_s128_lamb.sh -------------------------------------------------------------------------------- /torch-neuronx/training/dp_bert_hf_pretrain/run_dp_bert_large_hf_pretrain_bf16_s512_lamb_phase2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/dp_bert_hf_pretrain/run_dp_bert_large_hf_pretrain_bf16_s512_lamb_phase2.sh -------------------------------------------------------------------------------- /torch-neuronx/training/dp_bert_hf_pretrain/run_dp_bert_large_hf_pretrain_bf16_s512_phase2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/dp_bert_hf_pretrain/run_dp_bert_large_hf_pretrain_bf16_s512_phase2.sh -------------------------------------------------------------------------------- /torch-neuronx/training/hf_bert_jp/bert-jp-tutorial.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_bert_jp/bert-jp-tutorial.ipynb -------------------------------------------------------------------------------- /torch-neuronx/training/hf_contrastive_image_text/CLIPBase.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_contrastive_image_text/CLIPBase.ipynb -------------------------------------------------------------------------------- /torch-neuronx/training/hf_contrastive_image_text/CLIPLarge.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_contrastive_image_text/CLIPLarge.ipynb -------------------------------------------------------------------------------- /torch-neuronx/training/hf_contrastive_image_text/run_clip.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_contrastive_image_text/run_clip.py -------------------------------------------------------------------------------- /torch-neuronx/training/hf_image_classification/run_image_classification.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_image_classification/run_image_classification.py -------------------------------------------------------------------------------- /torch-neuronx/training/hf_image_classification/vit.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_image_classification/vit.ipynb -------------------------------------------------------------------------------- /torch-neuronx/training/hf_language_modeling/gpt2/gpt2.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_language_modeling/gpt2/gpt2.ipynb -------------------------------------------------------------------------------- /torch-neuronx/training/hf_language_modeling/gpt2/run_clm.patch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_language_modeling/gpt2/run_clm.patch -------------------------------------------------------------------------------- /torch-neuronx/training/hf_sentiment_analysis/.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_sentiment_analysis/.gitignore -------------------------------------------------------------------------------- /torch-neuronx/training/hf_sentiment_analysis/01-hf-single-neuron.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_sentiment_analysis/01-hf-single-neuron.ipynb -------------------------------------------------------------------------------- /torch-neuronx/training/hf_sentiment_analysis/02-hf-distributed-training.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_sentiment_analysis/02-hf-distributed-training.ipynb -------------------------------------------------------------------------------- /torch-neuronx/training/hf_sentiment_analysis/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_sentiment_analysis/README.md -------------------------------------------------------------------------------- /torch-neuronx/training/hf_sentiment_analysis/code/01-trainium-single-core/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_sentiment_analysis/code/01-trainium-single-core/train.py -------------------------------------------------------------------------------- /torch-neuronx/training/hf_sentiment_analysis/code/02-trainium-distributed-training/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_sentiment_analysis/code/02-trainium-distributed-training/train.py -------------------------------------------------------------------------------- /torch-neuronx/training/hf_sentiment_analysis/data/data.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_sentiment_analysis/data/data.csv -------------------------------------------------------------------------------- /torch-neuronx/training/hf_sentiment_analysis/data/test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_sentiment_analysis/data/test.csv -------------------------------------------------------------------------------- /torch-neuronx/training/hf_sentiment_analysis/data/train.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_sentiment_analysis/data/train.csv -------------------------------------------------------------------------------- /torch-neuronx/training/hf_summarization/BartLarge.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_summarization/BartLarge.ipynb -------------------------------------------------------------------------------- /torch-neuronx/training/hf_summarization/T5Large.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_summarization/T5Large.ipynb -------------------------------------------------------------------------------- /torch-neuronx/training/hf_summarization/run_summarization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_summarization/run_summarization.py -------------------------------------------------------------------------------- /torch-neuronx/training/hf_text_classification/AlbertBase.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_text_classification/AlbertBase.ipynb -------------------------------------------------------------------------------- /torch-neuronx/training/hf_text_classification/BertBaseCased.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_text_classification/BertBaseCased.ipynb -------------------------------------------------------------------------------- /torch-neuronx/training/hf_text_classification/BertBaseUncased.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_text_classification/BertBaseUncased.ipynb -------------------------------------------------------------------------------- /torch-neuronx/training/hf_text_classification/BertLargeCased.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_text_classification/BertLargeCased.ipynb -------------------------------------------------------------------------------- /torch-neuronx/training/hf_text_classification/BertLargeUncased.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_text_classification/BertLargeUncased.ipynb -------------------------------------------------------------------------------- /torch-neuronx/training/hf_text_classification/CamembertBase.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_text_classification/CamembertBase.ipynb -------------------------------------------------------------------------------- /torch-neuronx/training/hf_text_classification/DistilbertBaseUncased.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_text_classification/DistilbertBaseUncased.ipynb -------------------------------------------------------------------------------- /torch-neuronx/training/hf_text_classification/ElectraSmall.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_text_classification/ElectraSmall.ipynb -------------------------------------------------------------------------------- /torch-neuronx/training/hf_text_classification/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_text_classification/README.md -------------------------------------------------------------------------------- /torch-neuronx/training/hf_text_classification/RobertaBase.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_text_classification/RobertaBase.ipynb -------------------------------------------------------------------------------- /torch-neuronx/training/hf_text_classification/RobertaLarge.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_text_classification/RobertaLarge.ipynb -------------------------------------------------------------------------------- /torch-neuronx/training/hf_text_classification/XlmRobertaBase.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_text_classification/XlmRobertaBase.ipynb -------------------------------------------------------------------------------- /torch-neuronx/training/hf_text_classification/run_glue.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/hf_text_classification/run_glue.py -------------------------------------------------------------------------------- /torch-neuronx/training/llama2/adamw_fp32_optim_params.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/llama2/adamw_fp32_optim_params.py -------------------------------------------------------------------------------- /torch-neuronx/training/llama2/convert_checkpoints.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/llama2/convert_checkpoints.py -------------------------------------------------------------------------------- /torch-neuronx/training/llama2/get_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/llama2/get_dataset.py -------------------------------------------------------------------------------- /torch-neuronx/training/llama2/modeling_llama_nxd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/llama2/modeling_llama_nxd.py -------------------------------------------------------------------------------- /torch-neuronx/training/llama2/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/llama2/requirements.txt -------------------------------------------------------------------------------- /torch-neuronx/training/mnist_mlp/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/mnist_mlp/eval.py -------------------------------------------------------------------------------- /torch-neuronx/training/mnist_mlp/eval_using_trace.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/mnist_mlp/eval_using_trace.py -------------------------------------------------------------------------------- /torch-neuronx/training/mnist_mlp/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/mnist_mlp/model.py -------------------------------------------------------------------------------- /torch-neuronx/training/mnist_mlp/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/mnist_mlp/train.py -------------------------------------------------------------------------------- /torch-neuronx/training/mnist_mlp/train_cpu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/mnist_mlp/train_cpu.py -------------------------------------------------------------------------------- /torch-neuronx/training/mnist_mlp/train_torchrun.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/mnist_mlp/train_torchrun.py -------------------------------------------------------------------------------- /torch-neuronx/training/mnist_mlp/train_xmp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/mnist_mlp/train_xmp.py -------------------------------------------------------------------------------- /torch-neuronx/training/resnet50/resnet50.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/resnet50/resnet50.ipynb -------------------------------------------------------------------------------- /torch-neuronx/training/resnet50/run_image_classification.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/resnet50/run_image_classification.py -------------------------------------------------------------------------------- /torch-neuronx/training/stable_diffusion/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/stable_diffusion/requirements.txt -------------------------------------------------------------------------------- /torch-neuronx/training/stable_diffusion/run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/stable_diffusion/run.py -------------------------------------------------------------------------------- /torch-neuronx/training/stable_diffusion/sd_training_neuron.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/stable_diffusion/sd_training_neuron.py -------------------------------------------------------------------------------- /torch-neuronx/training/tp_dp_bert_hf_pretrain/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/tp_dp_bert_hf_pretrain/requirements.txt -------------------------------------------------------------------------------- /torch-neuronx/training/tp_dp_bert_hf_pretrain/tp_dp_bert_large_hf_pretrain_hdf5.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/tp_dp_bert_hf_pretrain/tp_dp_bert_large_hf_pretrain_hdf5.py -------------------------------------------------------------------------------- /torch-neuronx/training/tp_dp_gpt_neox_hf_pretrain/common/adamw_fp32_optim_params.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/tp_dp_gpt_neox_hf_pretrain/common/adamw_fp32_optim_params.py -------------------------------------------------------------------------------- /torch-neuronx/training/tp_dp_gpt_neox_hf_pretrain/common/get_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/tp_dp_gpt_neox_hf_pretrain/common/get_dataset.py -------------------------------------------------------------------------------- /torch-neuronx/training/tp_dp_gpt_neox_hf_pretrain/common/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/tp_dp_gpt_neox_hf_pretrain/common/requirements.txt -------------------------------------------------------------------------------- /torch-neuronx/training/zero1_gpt2/config_1p5B_gpt2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/zero1_gpt2/config_1p5B_gpt2.json -------------------------------------------------------------------------------- /torch-neuronx/training/zero1_gpt2/neuron_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/zero1_gpt2/neuron_utils.py -------------------------------------------------------------------------------- /torch-neuronx/training/zero1_gpt2/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/zero1_gpt2/requirements.txt -------------------------------------------------------------------------------- /torch-neuronx/training/zero1_gpt2/run_clm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/zero1_gpt2/run_clm.sh -------------------------------------------------------------------------------- /torch-neuronx/training/zero1_gpt2/run_clm.slurm: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/zero1_gpt2/run_clm.slurm -------------------------------------------------------------------------------- /torch-neuronx/training/zero1_gpt2/run_clm_compile.slurm: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/zero1_gpt2/run_clm_compile.slurm -------------------------------------------------------------------------------- /torch-neuronx/training/zero1_gpt2/run_clm_no_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/zero1_gpt2/run_clm_no_trainer.py -------------------------------------------------------------------------------- /torch-neuronx/training/zero1_gpt2/uncomment_gradaccum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/training/zero1_gpt2/uncomment_gradaccum.sh -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/README.md -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/codellama-13b-16k-sampling.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/codellama-13b-16k-sampling.ipynb -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/facebook-opt-13b-sampling.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/facebook-opt-13b-sampling.ipynb -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/facebook-opt-30b-sampling.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/facebook-opt-30b-sampling.ipynb -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/facebook-opt-66b-sampling.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/facebook-opt-66b-sampling.ipynb -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/gpt-j-6b-sampling-dp.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/gpt-j-6b-sampling-dp.ipynb -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/gpt-j-6b-sampling.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/gpt-j-6b-sampling.ipynb -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/gpt-j-dp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/gpt-j-dp.py -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/llama-3.1-405b-multinode-16k-sampling.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/llama-3.1-405b-multinode-16k-sampling.ipynb -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/llama-3.1-70b-64k-sampling.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/llama-3.1-70b-64k-sampling.ipynb -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/llama-3.1-70b-eagle-speculative-decoding.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/llama-3.1-70b-eagle-speculative-decoding.ipynb -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/llama-3.1-70b-speculative-decoding.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/llama-3.1-70b-speculative-decoding.ipynb -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/llama-3.1-8b-128k-sampling.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/llama-3.1-8b-128k-sampling.ipynb -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/llama-3.1-8b-32k-sampling.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/llama-3.1-8b-32k-sampling.ipynb -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/llama-70b-sampling.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/llama-70b-sampling.ipynb -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/meta-llama-2-13b-sampling.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/meta-llama-2-13b-sampling.ipynb -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/meta-llama-3-70b-sampling.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/meta-llama-3-70b-sampling.ipynb -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/meta-llama-3-8b-sampling.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/meta-llama-3-8b-sampling.ipynb -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/meta-llama-3.1-70b-sampling.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/meta-llama-3.1-70b-sampling.ipynb -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/meta-llama-3.1-8b-sampling.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/meta-llama-3.1-8b-sampling.ipynb -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/mistralai-Mistral-7b-Instruct-v0.2.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/mistralai-Mistral-7b-Instruct-v0.2.ipynb -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/mixtral-8x7b-sampling.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/mixtral-8x7b-sampling.ipynb -------------------------------------------------------------------------------- /torch-neuronx/transformers-neuronx/inference/speculative_sampling.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aws-neuron/aws-neuron-samples/HEAD/torch-neuronx/transformers-neuronx/inference/speculative_sampling.ipynb --------------------------------------------------------------------------------